diff --git a/CMakeLists.txt b/CMakeLists.txt index 6500ba013e28f..c23d403bcb6a1 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -154,7 +154,11 @@ file(GLOB_RECURSE NNVM_COMPILER_SRCS file(GLOB TOPI_SRCS topi/src/*.cc ) -file(GLOB_RECURSE HALIDEIR_SRCS 3rdparty/HalideIR/src/*.cpp) +file(GLOB_RECURSE HALIDEIR_SRCS + 3rdparty/HalideIR/src/base/*.cpp + 3rdparty/HalideIR/src/ir/*.cpp + 3rdparty/HalideIR/src/tvm/*.cpp +) list(APPEND COMPILER_SRCS ${HALIDEIR_SRCS}) file(GLOB RUNTIME_SRCS src/runtime/*.cc diff --git a/Jenkinsfile b/Jenkinsfile index 53645eb14b280..c38ec5296bf35 100644 --- a/Jenkinsfile +++ b/Jenkinsfile @@ -309,6 +309,24 @@ stage('Integration Test') { } } +/* +stage('Build packages') { + parallel 'conda CPU': { + node('CPU') { + sh "${docker_run} tvmai/conda-cpu ./conda/build_cpu.sh + } + }, + 'conda cuda': { + node('CPU') { + sh "${docker_run} tvmai/conda-cuda90 ./conda/build_cuda.sh + sh "${docker_run} tvmai/conda-cuda100 ./conda/build_cuda.sh + } + } + // Here we could upload the packages to anaconda for releases + // and/or the master branch +} +*/ + stage('Deploy') { node('doc') { ws('workspace/tvm/deploy-docs') { diff --git a/apps/android_rpc/README.md b/apps/android_rpc/README.md index 38725917f424f..1f2a46a8589c7 100644 --- a/apps/android_rpc/README.md +++ b/apps/android_rpc/README.md @@ -52,9 +52,25 @@ cd apps/android_rpc gradle clean build ``` -In `app/build/outputs/apk` you'll find `app-release-unsigned.apk`, use `dev_tools/gen_keystore.sh` to generate a signature and use `dev_tools/sign_apk.sh` to get the signed apk file `app/build/outputs/apk/tvmrpc-release.apk`. +In `app/build/outputs/apk` you'll find `app-release-unsigned.apk`, use `dev_tools/gen_keystore.sh` to generate a signature and use `dev_tools/sign_apk.sh` to get the signed apk file `app/build/outputs/apk/release/tvmrpc-release.apk`. -Upload `tvmrpc-release.apk` to your Android device and install it. +Upload `tvmrpc-release.apk` to your Android device and install it: + +```bash +$ANDROID_HOME/platform-tools/adb install app/build/outputs/apk/release/tvmrpc-release.apk +``` + +If you see error: + + adb: failed to install app/build/outputs/apk/release/tvmrpc-release.apk: + Failure [INSTALL_FAILED_UPDATE_INCOMPATIBLE: + Package ml.dmlc.tvm.tvmrpc signatures do not match the previously installed version; ignoring!] 
+ +Run uninstall first: + +```bash +$ANDROID_HOME/platform-tools/adb uninstall ml.dmlc.tvm.tvmrpc +``` ### Build with OpenCL diff --git a/apps/android_rpc/app/src/main/jni/Application.mk b/apps/android_rpc/app/src/main/jni/Application.mk index aef7629990c2f..548b69160b174 100644 --- a/apps/android_rpc/app/src/main/jni/Application.mk +++ b/apps/android_rpc/app/src/main/jni/Application.mk @@ -23,3 +23,7 @@ ifeq ($(USE_VULKAN), 1) APP_CPPFLAGS += -DTVM_VULKAN_RUNTIME=1 APP_LDFLAGS += -lvulkan endif + +ifeq ($(USE_SORT), 1) + APP_CPPFLAGS += -DUSE_SORT=1 +endif diff --git a/apps/android_rpc/app/src/main/jni/make/config.mk b/apps/android_rpc/app/src/main/jni/make/config.mk index c40ce4ba3ec7d..f61811bd604e4 100644 --- a/apps/android_rpc/app/src/main/jni/make/config.mk +++ b/apps/android_rpc/app/src/main/jni/make/config.mk @@ -22,6 +22,9 @@ USE_OPENCL = 0 # whether to enable Vulkan during compile USE_VULKAN = 0 +# whether to enable contrib sort functions during compile +USE_SORT = 1 + ifeq ($(USE_VULKAN), 1) # Statically linking vulkan requires API Level 24 or higher APP_PLATFORM = android-24 diff --git a/apps/android_rpc/app/src/main/jni/tvm_runtime.h b/apps/android_rpc/app/src/main/jni/tvm_runtime.h index 60b41baaf8e70..aadc4d1884307 100644 --- a/apps/android_rpc/app/src/main/jni/tvm_runtime.h +++ b/apps/android_rpc/app/src/main/jni/tvm_runtime.h @@ -66,6 +66,10 @@ #include "../src/runtime/vulkan/vulkan_module.cc" #endif +#ifdef USE_SORT +#include "../src/contrib/sort/sort.cc" +#endif + #include diff --git a/conda/Dockerfile.template b/conda/Dockerfile.template index 59b9ac96814ee..1b5dc6fbef5e0 100644 --- a/conda/Dockerfile.template +++ b/conda/Dockerfile.template @@ -15,9 +15,13 @@ # specific language governing permissions and limitations # under the License. 
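With `USE_SORT = 1` now propagated through `Application.mk`, `config.mk` and `tvm_runtime.h` above, the contrib sort kernels are compiled into the Android runtime. A quick way to confirm this end to end is to query the function registry on the device over RPC; a minimal sketch, where the proxy address, port and key are placeholders that must match how the app was set up:

```python
from tvm import rpc

# placeholders: use the RPC proxy/tracker address, port and key the app connects with
remote = rpc.connect("0.0.0.0", 9090, key="android")

# get_function raises if the symbol is missing on the remote side, so this only
# succeeds when the device runtime was built with USE_SORT = 1 (sort.cc included)
argsort = remote.get_function("tvm.contrib.sort.argsort")
print("contrib argsort is available on the device")
```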
-FROM nvidia/cuda:{{ cuda_version }}-devel-centos6 +FROM nvidia/cuda:{{ cuda_version }}-devel-ubuntu16.04 -RUN curl -fsSL http://developer.download.nvidia.com/compute/redist/cudnn/v{{ cudnn_short_version }}/cudnn-{{ cuda_version }}-linux-x64-v{{ cudnn_version }}.tgz -O && \ +RUN apt-get update && apt-get install -y --no-install-recommends \ + bzip2 curl sudo binutils && \ + rm -rf /var/lib/apt/lists/* + +RUN curl -fsSL http://developer.download.nvidia.com/compute/redist/cudnn/v{{ cudnn_short_version }}/cudnn-{{ cuda_version }}-linux-x64-v{{ cudnn_version }}.tgz -O && \ tar --no-same-owner -xzf cudnn-{{ cuda_version }}-linux-x64-v{{ cudnn_version }}.tgz -C /usr/local && \ rm cudnn-{{ cuda_version }}-linux-x64-v{{ cudnn_version }}.tgz && \ ldconfig @@ -27,13 +31,16 @@ RUN curl -o ~/miniconda.sh -O https://repo.continuum.io/miniconda/Miniconda3-lat chmod +x ~/miniconda.sh && \ ~/miniconda.sh -b -p /opt/conda && \ rm ~/miniconda.sh && \ + /opt/conda/bin/conda upgrade --all && \ /opt/conda/bin/conda install conda-build conda-verify && \ /opt/conda/bin/conda clean -ya +RUN /opt/conda/bin/conda install --download-only cmake make zlib +RUN /opt/conda/bin/conda install --download-only -c numba llvmdev=8.0.0 + ENV PATH /opt/conda/bin:$PATH ENV LD_LIBRARY_PATH /usr/local/nvidia/lib:/usr/local/nvidia/lib64 +ENV CONDA_BLD_PATH /tmp WORKDIR /workspace RUN chmod -R a+w /workspace - -CMD conda build --output-folder /workspace/conda/pkg --variants '{cuda: True, cuda_version: {{ cuda_version }}}' /workspace/conda/tvm-libs diff --git a/conda/Makefile b/conda/Makefile deleted file mode 100644 index cda546ac73ce3..0000000000000 --- a/conda/Makefile +++ /dev/null @@ -1,22 +0,0 @@ -# Licensed to the Apache Software Foundation (ASF) under one -# or more contributor license agreements. See the NOTICE file -# distributed with this work for additional information -# regarding copyright ownership. The ASF licenses this file -# to you under the Apache License, Version 2.0 (the -# "License"); you may not use this file except in compliance -# with the License. You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, -# software distributed under the License is distributed on an -# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY -# KIND, either express or implied. See the License for the -# specific language governing permissions and limitations -# under the License. - -packages: - conda build tvm-libs - conda build tvm - conda build topi - conda built nnvm diff --git a/conda/nnvm/build.sh b/conda/build_cpu.sh old mode 100644 new mode 100755 similarity index 68% rename from conda/nnvm/build.sh rename to conda/build_cpu.sh index bdd333f57734c..992b1a369b96b --- a/conda/nnvm/build.sh +++ b/conda/build_cpu.sh @@ -1,4 +1,4 @@ -#!/bin/bash +#!/bin/sh # Licensed to the Apache Software Foundation (ASF) under one # or more contributor license agreements. See the NOTICE file # distributed with this work for additional information @@ -6,9 +6,9 @@ # to you under the Apache License, Version 2.0 (the # "License"); you may not use this file except in compliance # with the License. You may obtain a copy of the License at -# +# # http://www.apache.org/licenses/LICENSE-2.0 -# +# # Unless required by applicable law or agreed to in writing, # software distributed under the License is distributed on an # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY @@ -17,6 +17,15 @@ # under the License. 
set -e +set -u -cd nnvm/python -$PYTHON setup.py install --single-version-externally-managed --record=/tmp/record.txt +# This is a fix for a weird bug in conda that makes it think +# it can't write in /tmp +HOME=/tmp +mkdir -p /tmp/.conda/pkgs +touch /tmp/.conda/pkgs/urls.txt +touch /tmp/.conda/environments.txt + + +conda build --output-folder=conda/pkg -c numba conda/tvm-libs +conda build --output-folder=conda/pkg -m conda/conda_build_config.yaml conda/tvm diff --git a/conda/topi/build.sh b/conda/build_cuda.sh old mode 100644 new mode 100755 similarity index 70% rename from conda/topi/build.sh rename to conda/build_cuda.sh index 4e5aafb937660..2c9a20ae66aec --- a/conda/topi/build.sh +++ b/conda/build_cuda.sh @@ -1,4 +1,4 @@ -#!/bin/bash +#!/bin/sh # Licensed to the Apache Software Foundation (ASF) under one # or more contributor license agreements. See the NOTICE file # distributed with this work for additional information @@ -6,9 +6,9 @@ # to you under the Apache License, Version 2.0 (the # "License"); you may not use this file except in compliance # with the License. You may obtain a copy of the License at -# +# # http://www.apache.org/licenses/LICENSE-2.0 -# +# # Unless required by applicable law or agreed to in writing, # software distributed under the License is distributed on an # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY @@ -17,6 +17,14 @@ # under the License. set -e +set -u -cd topi/python -$PYTHON setup.py install --single-version-externally-managed --record=/tmp/record.txt +# This is a fix for a weird bug in conda that makes it think +# it can't write in /tmp +HOME=/tmp +mkdir -p /tmp/.conda/pkgs +touch /tmp/.conda/pkgs/urls.txt +touch /tmp/.conda/environments.txt + + +conda build --output-folder=conda/pkg --variants "{cuda: True, cuda_version: ${CUDA_VERSION%.*}}" -c numba conda/tvm-libs diff --git a/conda/topi/meta.yaml b/conda/cross-linux.cmake similarity index 54% rename from conda/topi/meta.yaml rename to conda/cross-linux.cmake index f4bc8950d4c49..360400267ae07 100644 --- a/conda/topi/meta.yaml +++ b/conda/cross-linux.cmake @@ -15,37 +15,24 @@ # specific language governing permissions and limitations # under the License. -{% set version = "0.6.dev" %} +# this one is important +set(CMAKE_SYSTEM_NAME Linux) +set(CMAKE_PLATFORM Linux) +#this one not so much +set(CMAKE_SYSTEM_VERSION 1) -package: - name: topi - version: {{ version }} +# specify the cross compiler +set(CMAKE_C_COMPILER $ENV{CC}) -source: - path: ../.. 
+# where is the target environment +set(CMAKE_FIND_ROOT_PATH $ENV{PREFIX} $ENV{BUILD_PREFIX}/$ENV{HOST}/sysroot) -build: - number: 1 +# search for programs in the build host directories +set(CMAKE_FIND_ROOT_PATH_MODE_PROGRAM NEVER) -requirements: - host: - - python {{ python }} - - numpy - - setuptools - - decorator - - tvm-libs =={{ version }} - run: - - python - - {{ pin_compatible('numpy') }} - - decorator - - tvm-libs =={{ version }} - - tvm =={{ version }} +# for libraries and headers in the target directories +set(CMAKE_FIND_ROOT_PATH_MODE_LIBRARY ONLY) +set(CMAKE_FIND_ROOT_PATH_MODE_INCLUDE ONLY) -test: - imports: - - topi - -about: - home: https://github.com/dmlc/tvm - license: Apache2 - summary: "TOPI: TVM Operator Inventory" +# god-awful hack because it seems to not run correct tests to determine this: +set(__CHAR_UNSIGNED___EXITCODE 1) diff --git a/conda/nnvm/meta.yaml b/conda/nnvm/meta.yaml deleted file mode 100644 index d948484a61e5f..0000000000000 --- a/conda/nnvm/meta.yaml +++ /dev/null @@ -1,56 +0,0 @@ -# Licensed to the Apache Software Foundation (ASF) under one -# or more contributor license agreements. See the NOTICE file -# distributed with this work for additional information -# regarding copyright ownership. The ASF licenses this file -# to you under the Apache License, Version 2.0 (the -# "License"); you may not use this file except in compliance -# with the License. You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, -# software distributed under the License is distributed on an -# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY -# KIND, either express or implied. See the License for the -# specific language governing permissions and limitations -# under the License. - -{% set version = "0.6.dev" %} - -package: - name: nnvm - version: {{ version }} - -source: - path: ../.. - -build: - number: 1 - skip: True # [win] - -requirements: - build: - - {{ compiler('cxx') }} - host: - - python {{ python }} - - cython - - numpy - - setuptools - - decorator - - tvm-libs =={{ version }} - run: - - tvm =={{ version }} - - topi =={{ version }} - - tvm-libs =={{ version }} - - python - - {{ pin_compatible('numpy') }} - - decorator - -test: - imports: - - nnvm - -about: - home: https://github.com/dmlc/nnvm - license: Apache2 - summary: Bring deep learning to bare metal diff --git a/conda/build_cuda.py b/conda/render_cuda.py similarity index 74% rename from conda/build_cuda.py rename to conda/render_cuda.py index 47af6ce4564e9..8057892fd83c1 100644 --- a/conda/build_cuda.py +++ b/conda/render_cuda.py @@ -29,8 +29,8 @@ # and from conda. 
# These two must be in sync -CUDNN_FULL_VERSION = '7.3.1.20' -CUDNN_VERSION = '7.3.1' +CUDNN_FULL_VERSION = '7.6.0.64' +CUDNN_VERSION = '7.6.0' condadir = os.path.dirname(sys.argv[0]) @@ -47,30 +47,15 @@ def render_dockerfile(version): cudnn_short_version=CUDNN_VERSION, cudnn_version=CUDNN_FULL_VERSION) fname = os.path.join(condadir, - 'Dockerfile.cuda' + version.replace('.', '')) + '../docker/Dockerfile.conda_cuda' + version.replace('.', '')) with open(fname, 'w') as f: f.write(txt) return fname -def build_docker(version): - vv = version.replace('.', '') - fname = render_dockerfile(version) - tagname = f'tvm-cuda{ vv }-forge' - subprocess.run(['docker', 'build', '-t', tagname, - condadir, '-f', fname], check=True) - return tagname - - -def build_pkg(version): - tagname = build_docker(version) - subprocess.run(['docker', 'run', '--rm', '-v', f'{ srcdir }:/workspace', - tagname], check=True) - - if __name__ == '__main__': build_versions = CUDA_VERSIONS if len(sys.argv) > 1: build_versions = sys.argv[1:] for version in build_versions: - build_pkg(version) + render_dockerfile(version) diff --git a/conda/tvm-libs/build.sh b/conda/tvm-libs/build.sh index e0b85910475ea..94919c60e7797 100644 --- a/conda/tvm-libs/build.sh +++ b/conda/tvm-libs/build.sh @@ -17,24 +17,37 @@ # under the License. set -e - -if [ "$cuda" == "True" ]; then - CUDA_OPT="-DUSE_CUDA=ON -DUSE_CUBLAS=ON -DUSE_CUDNN=ON" -else - CUDA_OPT="" -fi +set -u if [ "$target_platform" == "osx-64" ]; then # macOS 64 bits - METAL_OPT="" # Conda can only target 10.9 for now + METAL_OPT="-DUSE_METAL=ON" + TOOLCHAIN_OPT="-DCMAKE_OSX_DEPLOYMENT_TARGET=10.11" else METAL_OPT="" + if [ "$target_platform" == "linux-64" ]; then + # Linux 64 bits + TOOLCHAIN_OPT="-DCMAKE_TOOLCHAIN_FILE=${RECIPE_DIR}/../cross-linux.cmake" + else + # Windows (or 32 bits, which we don't support) + TOOLCHAIN_OPT="" + fi +fi + +# When cuda is not set, we default to False +cuda=${cuda:-False} + +if [ "$cuda" == "True" ]; then + CUDA_OPT="-DUSE_CUDA=ON -DUSE_CUBLAS=ON -DUSE_CUDNN=ON" + TOOLCHAIN_OPT="" +else + CUDA_OPT="" fi rm -rf build || true mkdir -p build cd build -cmake $METAL_OPT $CUDA_OPT -DUSE_LLVM=$PREFIX/bin/llvm-config -DINSTALL_DEV=ON -DCMAKE_INSTALL_PREFIX="$PREFIX" .. +cmake $METAL_OPT $CUDA_OPT -DUSE_LLVM=$PREFIX/bin/llvm-config -DINSTALL_DEV=ON -DCMAKE_INSTALL_PREFIX="$PREFIX" $TOOLCHAIN_OPT .. make -j${CPU_COUNT} VERBOSE=1 make install cd .. diff --git a/conda/tvm-libs/meta.yaml b/conda/tvm-libs/meta.yaml index aad8f251c2a69..e3422a2174efe 100644 --- a/conda/tvm-libs/meta.yaml +++ b/conda/tvm-libs/meta.yaml @@ -15,7 +15,7 @@ # specific language governing permissions and limitations # under the License. -{% set version = "0.6.dev" %} +{% set version = "0.6.dev1" %} package: name: tvm-libs @@ -25,21 +25,22 @@ source: path: ../.. 
build: - number: 1 - string: cuda{{ cuda_version }}_{{ PKG_BUILDNUM }} # [cuda] + number: 0 + string: cuda{{ cuda_version | replace('.', '') }}h{{ PKG_HASH }}_{{ PKG_BUILDNUM }} # [cuda] requirements: build: - # The OS X build will require some manual setup or it will break - # See https://docs.conda.io/projects/conda-build/en/latest/source/resources/compiler-tools.html#macos-sdk - - {{ compiler('cxx') }} - host: + # The anaconda compilers for OS X are old an annoying + # so we rely on the platform ones for now + - {{ compiler('cxx') }} # [linux] - cmake - - llvmdev ==6.0.0 + - make + host: + - llvmdev ==8.0.0 - zlib # [linux] run: - {{ pin_compatible('cudatoolkit', lower_bound=cuda_version, max_pin='x.x') }} # [cuda] - - {{ pin_compatible('cudnn', lower_bound='7.3.1', max_pin='x') }} # [cuda] + - {{ pin_compatible('cudnn', lower_bound='7.6.0', max_pin='x') }} # [cuda] about: home: https://github.com/dmlc/tvm diff --git a/conda/tvm/build.sh b/conda/tvm/build.sh index 6626aa5920914..494f90f0afa01 100644 --- a/conda/tvm/build.sh +++ b/conda/tvm/build.sh @@ -17,6 +17,16 @@ # under the License. set -e +set -u cd python $PYTHON setup.py install --single-version-externally-managed --record=/tmp/record.txt +cd .. + +cd topi/python +$PYTHON setup.py install --single-version-externally-managed --record=/tmp/record.txt +cd ../.. + +cd nnvm/python +$PYTHON setup.py install --single-version-externally-managed --record=/tmp/record.txt +cd ../.. diff --git a/conda/tvm/meta.yaml b/conda/tvm/meta.yaml index 221dc7950f753..0daca4bcea2bd 100644 --- a/conda/tvm/meta.yaml +++ b/conda/tvm/meta.yaml @@ -15,7 +15,7 @@ # specific language governing permissions and limitations # under the License. -{% set version = "0.6.dev" %} +{% set version = "0.6.dev1" %} package: name: tvm @@ -25,7 +25,7 @@ source: path: ../.. build: - number: 1 + number: 0 requirements: build: @@ -46,6 +46,15 @@ requirements: test: imports: - tvm + - topi + - nnvm + requires: + - nose + - scipy + source_files: + - tests/python + commands: + - python -m nose -v tests/python/integration about: home: https://github.com/dmlc/tvm diff --git a/docker/Dockerfile.conda_cpu b/docker/Dockerfile.conda_cpu new file mode 100644 index 0000000000000..0660b5daa0e26 --- /dev/null +++ b/docker/Dockerfile.conda_cpu @@ -0,0 +1,41 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. 
+ +FROM ubuntu:16.04 + +RUN apt-get update && apt-get install -y bzip2 curl sudo binutils && rm -rf /var/lib/apt/lists/* + +RUN curl -o ~/miniconda.sh -O https://repo.continuum.io/miniconda/Miniconda3-latest-Linux-x86_64.sh && \ + chmod +x ~/miniconda.sh && \ + ~/miniconda.sh -b -p /opt/conda && \ + rm ~/miniconda.sh && \ + /opt/conda/bin/conda upgrade --all && \ + /opt/conda/bin/conda install conda-build conda-verify && \ + /opt/conda/bin/conda clean -ya + +# Cache some of the packages for the builds +RUN /opt/conda/bin/conda install --download-only cmake make zlib && \ + /opt/conda/bin/conda install --download-only -c numba llvmdev=8.0.0 && \ + /opt/conda/bin/conda create -n py35 --download-only nose scipy numpy=1.11 cython decorator python=3.5 && \ + /opt/conda/bin/conda create -n py36 --download-only nose scipy numpy=1.11 cython decorator python=3.6 && \ + /opt/conda/bin/conda create -n py37 --download-only nose scipy numpy=1.11 cython decorator python=3.7 + +ENV PATH /opt/conda/bin:$PATH +ENV CONDA_BLD_PATH /tmp + +WORKDIR /workspace +RUN chmod -R a+w /workspace diff --git a/docker/Dockerfile.conda_cuda100 b/docker/Dockerfile.conda_cuda100 new file mode 100644 index 0000000000000..d6e1cddbfd373 --- /dev/null +++ b/docker/Dockerfile.conda_cuda100 @@ -0,0 +1,46 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + +FROM nvidia/cuda:10.0-devel-ubuntu16.04 + +RUN apt-get update && apt-get install -y --no-install-recommends \ + bzip2 curl sudo binutils && \ + rm -rf /var/lib/apt/lists/* + +RUN curl -fsSL http://developer.download.nvidia.com/compute/redist/cudnn/v7.6.0/cudnn-10.0-linux-x64-v7.6.0.64.tgz -O && \ + tar --no-same-owner -xzf cudnn-10.0-linux-x64-v7.6.0.64.tgz -C /usr/local && \ + rm cudnn-10.0-linux-x64-v7.6.0.64.tgz && \ + ldconfig + + +RUN curl -o ~/miniconda.sh -O https://repo.continuum.io/miniconda/Miniconda3-latest-Linux-x86_64.sh && \ + chmod +x ~/miniconda.sh && \ + ~/miniconda.sh -b -p /opt/conda && \ + rm ~/miniconda.sh && \ + /opt/conda/bin/conda upgrade --all && \ + /opt/conda/bin/conda install conda-build conda-verify && \ + /opt/conda/bin/conda clean -ya + +RUN /opt/conda/bin/conda install --download-only cmake make zlib +RUN /opt/conda/bin/conda install --download-only -c numba llvmdev=8.0.0 + +ENV PATH /opt/conda/bin:$PATH +ENV LD_LIBRARY_PATH /usr/local/nvidia/lib:/usr/local/nvidia/lib64 +ENV CONDA_BLD_PATH /tmp + +WORKDIR /workspace +RUN chmod -R a+w /workspace \ No newline at end of file diff --git a/docker/Dockerfile.conda_cuda90 b/docker/Dockerfile.conda_cuda90 new file mode 100644 index 0000000000000..f55aa1bf2e126 --- /dev/null +++ b/docker/Dockerfile.conda_cuda90 @@ -0,0 +1,46 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. 
See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + +FROM nvidia/cuda:9.0-devel-ubuntu16.04 + +RUN apt-get update && apt-get install -y --no-install-recommends \ + bzip2 curl sudo binutils && \ + rm -rf /var/lib/apt/lists/* + +RUN curl -fsSL http://developer.download.nvidia.com/compute/redist/cudnn/v7.6.0/cudnn-9.0-linux-x64-v7.6.0.64.tgz -O && \ + tar --no-same-owner -xzf cudnn-9.0-linux-x64-v7.6.0.64.tgz -C /usr/local && \ + rm cudnn-9.0-linux-x64-v7.6.0.64.tgz && \ + ldconfig + + +RUN curl -o ~/miniconda.sh -O https://repo.continuum.io/miniconda/Miniconda3-latest-Linux-x86_64.sh && \ + chmod +x ~/miniconda.sh && \ + ~/miniconda.sh -b -p /opt/conda && \ + rm ~/miniconda.sh && \ + /opt/conda/bin/conda upgrade --all && \ + /opt/conda/bin/conda install conda-build conda-verify && \ + /opt/conda/bin/conda clean -ya + +RUN /opt/conda/bin/conda install --download-only cmake make zlib +RUN /opt/conda/bin/conda install --download-only -c numba llvmdev=8.0.0 + +ENV PATH /opt/conda/bin:$PATH +ENV LD_LIBRARY_PATH /usr/local/nvidia/lib:/usr/local/nvidia/lib64 +ENV CONDA_BLD_PATH /tmp + +WORKDIR /workspace +RUN chmod -R a+w /workspace \ No newline at end of file diff --git a/docker/Dockerfile.demo_android b/docker/Dockerfile.demo_android index e9c3e4f6ce8eb..4f93e84007495 100644 --- a/docker/Dockerfile.demo_android +++ b/docker/Dockerfile.demo_android @@ -52,6 +52,8 @@ ENV PATH ${PATH}:${VULKAN_SDK}/bin ENV LD_LIBRARY_PATH ${LD_LIBRARY_PATH}:${VULKAN_SDK}/lib ENV VK_LAYER_PATH ${VULKAN_SDK}/etc/explicit_layer.d +RUN git clone https://github.com/KhronosGroup/OpenCL-Headers /usr/local/OpenCL-Headers/ + # Build TVM RUN cd /usr && \ git clone --depth=1 https://github.com/dmlc/tvm --recursive && \ @@ -69,3 +71,4 @@ RUN cd /usr && \ # Environment variables ENV PYTHONPATH=/usr/tvm/python:/usr/tvm/topi/python:/usr/tvm/nnvm/python/:/usr/tvm/vta/python:${PYTHONPATH} +ENV ANDROID_HOME=/opt/android-sdk-linux/ diff --git a/docker/install/ubuntu_install_python_package.sh b/docker/install/ubuntu_install_python_package.sh index 38cf36f237c7b..88d07cc884399 100755 --- a/docker/install/ubuntu_install_python_package.sh +++ b/docker/install/ubuntu_install_python_package.sh @@ -22,4 +22,4 @@ set -o pipefail # install libraries for python package on ubuntu pip2 install nose pylint==1.9.4 six numpy nose-timer cython decorator scipy tornado typing antlr4-python2-runtime attrs -pip3 install nose pylint==1.9.4 six numpy nose-timer cython decorator scipy tornado typed_ast pytest mypy orderedset antlr4-python3-runtime attrs +pip3 install nose pylint==1.9.4 six numpy nose-timer cython decorator scipy tornado typed_ast pytest mypy orderedset antlr4-python3-runtime attrs requests Pillow diff --git a/docs/api/python/relay/index.rst b/docs/api/python/relay/index.rst index 39a68b6d1f5d5..90746b8e5d4ee 100644 --- a/docs/api/python/relay/index.rst +++ b/docs/api/python/relay/index.rst @@ -33,7 +33,8 @@ 
compiler stack. expr frontend image - ir_pass + analysis + transform module nn op diff --git a/include/tvm/arithmetic.h b/include/tvm/arithmetic.h index 92f7399a89a57..446c4c0c19a91 100644 --- a/include/tvm/arithmetic.h +++ b/include/tvm/arithmetic.h @@ -623,12 +623,15 @@ IntSet Intersect(const Array& sets); * give the domain of each variables. Return undefined IntSet to * represent failure. * + * \note The returned set may be smaller than set that + * contains all possible values of v that satisfies the bound. + * * \param v The target variable to be deduced. * \param cond The conditional expression. * \param hint_map The domain of variable, used to help deduce. * \param relax_map The domain of each variable, used to relax the domain, - * The deduce bound mush implies e for all value in relax_map - * \return An integer set that can cover all the possible values. + * The deduce bound must implies e for all value in relax_map + * \return An integer set that always satisfies the condition. */ IntSet DeduceBound(Expr v, Expr cond, const Map& hint_map, @@ -641,7 +644,7 @@ IntSet DeduceBound(Expr v, Expr cond, * \param hint_map The domain of variable, used to help deduce. * \param relax_map The domain of each variable, used to relax the domain, * The deduce bound mush implies e for all value in relax_map - * \return An integer set that can cover all the possible values. + * \return An integer set that always satisfies the condition. */ IntSet DeduceBound(Expr v, Expr cond, const std::unordered_map& hint_map, diff --git a/include/tvm/buffer.h b/include/tvm/buffer.h index ed4ac5ea6a63f..1233e9b0b89b8 100644 --- a/include/tvm/buffer.h +++ b/include/tvm/buffer.h @@ -36,10 +36,11 @@ namespace tvm { // Internal node container Buffer class BufferNode; -/*! \brief memory access kind */ -enum class AccessMask : int { - kRead = 1, - kWrite = 2 +/*! \brief buffer type */ +enum BufferType : int { + kDefault = 1, + // Maps buffer[i][j][k] -> buffer[i][0][k] if dimension i's shape equals 1. + kAutoBroadcast = 2, }; /*! @@ -129,6 +130,8 @@ class BufferNode : public Node { * elem_offset is guaranteed to be multiple of offset_factor. */ int offset_factor; + /*! \brief buffer type */ + BufferType buffer_type; /*! \brief constructor */ BufferNode() {} @@ -142,6 +145,7 @@ class BufferNode : public Node { v->Visit("scope", &scope); v->Visit("data_alignment", &data_alignment); v->Visit("offset_factor", &offset_factor); + v->Visit("buffer_type", &buffer_type); } /*! \return preferred index type for this buffer node */ @@ -159,7 +163,8 @@ class BufferNode : public Node { std::string name, std::string scope, int data_alignment, - int offset_factor); + int offset_factor, + BufferType buffer_type); static constexpr const char* _type_key = "Buffer"; TVM_DECLARE_NODE_TYPE_INFO(BufferNode, Node); diff --git a/include/tvm/ir_pass.h b/include/tvm/ir_pass.h index e1c92e50e6ad1..98dbf6bb62906 100644 --- a/include/tvm/ir_pass.h +++ b/include/tvm/ir_pass.h @@ -27,7 +27,6 @@ #ifndef TVM_IR_PASS_H_ #define TVM_IR_PASS_H_ -#include #include #include #include diff --git a/include/tvm/relay/adt.h b/include/tvm/relay/adt.h index 9e4e00ca47ed4..2a6507b62a33d 100644 --- a/include/tvm/relay/adt.h +++ b/include/tvm/relay/adt.h @@ -114,7 +114,7 @@ class ConstructorNode : public ExprNode { /*! \brief The datatype the constructor will construct. */ GlobalTypeVar belong_to; /*! \brief Index in the table of constructors (set when the type is registered). 
*/ - mutable int tag = -1; + mutable int32_t tag = -1; ConstructorNode() {} diff --git a/include/tvm/relay/pass.h b/include/tvm/relay/analysis.h similarity index 55% rename from include/tvm/relay/pass.h rename to include/tvm/relay/analysis.h index 294d22b812a13..3672a22847dbf 100644 --- a/include/tvm/relay/pass.h +++ b/include/tvm/relay/analysis.h @@ -18,55 +18,21 @@ */ /*! - * \file tvm/relay/pass.h - * \brief The set of Relay passes written in C++. - */ -#ifndef TVM_RELAY_PASS_H_ -#define TVM_RELAY_PASS_H_ + * \file tvm/relay/analysis.h + * \brief The set of Relay analysis passes written in C++. + */ +#ifndef TVM_RELAY_ANALYSIS_H_ +#define TVM_RELAY_ANALYSIS_H_ -#include -#include +#include #include #include -#include #include -#include -#include -#include #include -#include namespace tvm { namespace relay { -/*! - * \brief Infer the type of an expression. - * - * The result of type checking is a new expression with unambigous - * type information filled in, as well as it's checked type field - * populated with the result type. - * - * \param expr The expression to type check. - * \param mod The module used for referencing global functions, can be - * None. - * - * \return A type checked expression with its checked_type field populated. - */ -TVM_DLL Expr InferType(const Expr& expr, const Module& mod); - -/*! - * \brief Infer the type of a function as if it is mapped to var in the mod. - * - * \param f the function. - * \param mod The module used for referencing global functions. - * \param var The global variable corresponding to the function. - * - * \return A type checked Function with its checked_type field populated. - * \note this function mutates mod and is not thread-safe. - */ -TVM_DLL Function InferType(const Function& f, const Module& mod, - const GlobalVar& var); - /*! * \brief Check that types are well kinded by applying "kinding rules". * @@ -140,23 +106,6 @@ TVM_DLL bool AlphaEqual(const Type& t1, const Type& t2); */ TVM_DLL bool AlphaEqual(const Pattern& t1, const Pattern& t2); -/*! - * \brief Add abstraction over a function - * - * For example: `square` is transformed to - * `fun x -> square x`. - * - * See https://en.wikipedia.org/wiki/Lambda_calculus#%CE%B7-conversion - * for more details. - * - * \param e The original function. - * \param mod The module used for referencing global functions, can be - * None. - * - * \return the new function with abstraction - */ -TVM_DLL Expr EtaExpand(const Expr& e, const Module& mod); - /*! * \brief Check that each Var is only bound once. * @@ -288,87 +237,6 @@ TVM_DLL tvm::Array AllTypeVars(const Expr& expr, const Module& mod); */ TVM_DLL tvm::Array AllTypeVars(const Type& t, const Module& mod); -/*! \brief Remove expressions which does not effect the program result. - * - * It will remove let bindings which are not referenced, - * and inline let bindings that are only used once. - * - * For example, this pass should turn `let a = 1 in 2` into `2`, - * as the value of the expression does not depend on a. - * - * As another example, `let a = 1 in a` will be optimized into 1, - * if the flag is turned on. - * - * \param e the expression to optimize. - * \param inline_once whether or not to inline binding used one. - * - * \return the optimized expression. - */ -TVM_DLL Expr DeadCodeElimination(const Expr& e, bool inline_once = false); - -/*! - * \brief Fold constant expressions. - * - * \param expr the expression to be optimized. - * - * \return The optimized expression. - */ -TVM_DLL Expr FoldConstant(const Expr& expr); - -/*! 
- * \brief Fuse operations into expr into seperate functions. - * - * \param expr The expression. - * \param fuse_opt_level Optimization level. - * \param mod the module. - * - * \return The optimized expression. - */ -TVM_DLL Expr FuseOps(const Expr& expr, int fuse_opt_level, const Module& mod); - -/*! - * \brief Apply rewrite rules to rewrite the expr in post DFS order. - * - * \param expr The expression. - * \param rewrite_map_attr_name The Op's attr name which corresponds to the rewrite - * rule function. - * \param fcontext Additional callback to provide context argument for each call node. - * \param fmulti_ref_trigger Transformation function to be called when - * an Expr consumed by multiple callers. - * \return The rewritten expression. - */ -TVM_DLL Expr ForwardRewrite(const Expr& expr, - const std::string& rewrite_map_attr_name, - std::function fcontext = nullptr, - std::function fmulti_ref_trigger = nullptr); - -/*! - * \brief Apply rewrite rules to rewrite the expr in post DFS order. - * - * \param expr The expression. - * \param rewrite_func The rewrite func that will apply to all operators. - * \param fcontext Additional callback to provide context argument for each call node. - * \param fmulti_ref_trigger Transformation function to be called when - * an Expr consumed by multiple callers. - * - * \return The rewritten expression. - */ -TVM_DLL Expr ForwardRewrite(const Expr& expr, - const FForwardRewrite& rewrite_func, - std::function fcontext = nullptr, - std::function fmulti_ref_trigger = nullptr); - -/*! - * \brief Rewrite the annotated program. - * - * \param expr The expression. - * \param fallback_device The fallback device which is the default device for - * operators without annotation. - * - * \return The updated program. - */ -TVM_DLL Expr RewriteAnnotatedOps(const Expr& expr, int fallback_device); - /*! * \brief Collect the device mapping information of each expression. * @@ -387,38 +255,6 @@ TVM_DLL Map CollectDeviceInfo(const Expr& expr); */ TVM_DLL Map CollectDeviceAnnotationOps(const Expr& expr); -/*! - * \brief turn a dataflow graph into Administrative Normal Form, or A-Normal Form (ANF). - * - * It will turn an expression that is in a graph form (with sharing implicit), - * to an expression with explicit sharing (A-Normal Form). - * - * The scope of the root expression is the global scope. - * - * The scope of any non root expression is the least common ancestor of all it's scope. - * - * Values are ordered by post-DFS order in each scope. - * - * \param e the expression to observably share. - * \param mod The module used for referencing global functions, can be - * None. - * - * \return expression in A-Normal Form. - */ -TVM_DLL Expr ToANormalForm(const Expr& e, const Module& mod); - -/*! - * \brief Remove let binding and directly share via pointer instead. - * - * It will remove all let binding, - * and turn all of the variable bound by let into direct pointer reference. - * - * \param e the expression. - * - * \return the expression in graph normal form. - */ -TVM_DLL Expr ToGraphNormalForm(const Expr& e); - /*! * \brief Finds cases that the given match expression does not catch, if any. * @@ -431,30 +267,6 @@ TVM_DLL Expr ToGraphNormalForm(const Expr& e); */ TVM_DLL Array UnmatchedCases(const Match& match, const Module& mod); -/*! - * \brief Aggressive constant propagation/constant folding/inlining. - * It will do as much computation in compile time as possible. 
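The `ToANormalForm` documentation above is easiest to see on a tiny program: sharing that is implicit in the dataflow graph becomes an explicit `let`. A minimal sketch, assuming the pass is driven through `relay.transform` as elsewhere in this change:

```python
from tvm import relay
from tvm.relay import transform

x = relay.var("x", shape=(1,))
shared = relay.add(x, x)                         # used twice below; sharing is implicit
f = relay.Function([x], relay.multiply(shared, shared))

mod = relay.Module.from_expr(f)
mod = transform.ToANormalForm()(mod)
# the shared add is now bound once by a let and referenced twice
print(mod["main"])
```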
- * It has two benefit: remove runtime overhead, and allow more optimization (typically fusion). - * As a side effect, code size will explode. - * - * \param e the expression - * \param mod the module - * - * \return the optimized expression. - */ -TVM_DLL Expr PartialEval(const Expr& e, const Module& mod); - -/* - * \brief Bind function parameters or free variables. - * - * Parameter binding can only happen if expr is a Function. - * binds cannot change internal arguments of internal functions. - * - * \param expr The function to be binded. - * \param binds The map of arguments to - */ -TVM_DLL Expr Bind(const Expr& expr, const tvm::Map& bind_map); - /*! \brief A hashing structure in the style of std::hash. */ struct StructuralHash { /*! \brief Hash a Relay type. @@ -466,7 +278,6 @@ struct StructuralHash { * \return the hash value. */ size_t operator()(const Type& type) const; - /*! \brief Hash a Relay expression. * * Implements structural hashing of a Relay expression. @@ -478,20 +289,7 @@ struct StructuralHash { size_t operator()(const Expr& expr) const; }; -namespace vm { - -/*! - * \brief Compile a module, and construct the virtual machine. - * - * \param mod The module to compile. - * - * \return The constructed virtual machine. - */ -runtime::vm::VirtualMachine CompileModule(const Module& mod); - -} // namespace vm - } // namespace relay } // namespace tvm -#endif // TVM_RELAY_PASS_H_ +#endif // TVM_RELAY_ANALYSIS_H_ diff --git a/include/tvm/relay/interpreter.h b/include/tvm/relay/interpreter.h index 68b7ccab99c7b..d05099f781acd 100644 --- a/include/tvm/relay/interpreter.h +++ b/include/tvm/relay/interpreter.h @@ -182,7 +182,7 @@ RELAY_DEFINE_NODE_REF(RefValue, RefValueNode, Value); class ConstructorValue; struct ConstructorValueNode : ValueNode { - int tag; + int32_t tag; tvm::Array fields; @@ -195,7 +195,7 @@ struct ConstructorValueNode : ValueNode { v->Visit("constructor", &constructor); } - TVM_DLL static ConstructorValue make(int tag, + TVM_DLL static ConstructorValue make(int32_t tag, tvm::Array fields, Constructor construtor = {}); diff --git a/include/tvm/relay/module.h b/include/tvm/relay/module.h index 638f75968fd33..e888c54c17aca 100644 --- a/include/tvm/relay/module.h +++ b/include/tvm/relay/module.h @@ -32,6 +32,7 @@ #include #include #include +#include namespace tvm { namespace relay { @@ -55,7 +56,7 @@ struct Module; * The functional style allows users to construct custom * environments easily, for example each thread can store * a Module while auto-tuning. - * */ + */ class ModuleNode : public RelayNode { public: @@ -64,16 +65,12 @@ class ModuleNode : public RelayNode { /*! \brief A map from global type vars to ADT type data. */ tvm::Map type_definitions; - /*! \brief The entry function (i.e. "main"). */ - GlobalVar entry_func; - ModuleNode() {} void VisitAttrs(tvm::AttrVisitor* v) final { v->Visit("functions", &functions); v->Visit("type_definitions", &type_definitions); v->Visit("global_var_map_", &global_var_map_); - v->Visit("entry_func", &entry_func); v->Visit("global_type_var_map_", &global_type_var_map_); } @@ -118,6 +115,13 @@ class ModuleNode : public RelayNode { */ TVM_DLL void Remove(const GlobalVar& var); + /*! + * \brief Check if the global_var_map_ contains a global variable. + * \param name The variable name. + * \returns true if contains, otherise false. + */ + TVM_DLL bool ContainGlobalVar(const std::string& name) const; + /*! * \brief Lookup a global function by its variable. * \param str The unique string specifying the global variable. 
@@ -133,33 +137,40 @@ class ModuleNode : public RelayNode { TVM_DLL GlobalTypeVar GetGlobalTypeVar(const std::string& str) const; /*! - * \brief Lookup a global function by its variable. + * \brief Look up a global function by its variable. * \param var The global var to lookup. * \returns The function named by the variable argument. */ TVM_DLL Function Lookup(const GlobalVar& var) const; /*! - * \brief Lookup a global function by its string name + * \brief Look up a global function by its string name * \param name The name of the function. * \returns The function named by the argument. */ TVM_DLL Function Lookup(const std::string& name) const; /*! - * \brief Lookup a global type definition by its variable. + * \brief Look up a global type definition by its variable. * \param var The var of the global type definition. * \return The type definition. */ TVM_DLL TypeData LookupDef(const GlobalTypeVar& var) const; /*! - * \brief Lookup a global type definition by its name. + * \brief Look up a global type definition by its name. * \param var The name of the global type definition. * \return The type definition. */ TVM_DLL TypeData LookupDef(const std::string& var) const; + /*! + * \brief Look up a constructor by its tag. + * \param tag The tag for the constructor. + * \return The constructor object. + */ + TVM_DLL Constructor LookupTag(const int32_t tag); + /*! * \brief Update the functions inside this environment by * functions in another environment. @@ -172,10 +183,10 @@ class ModuleNode : public RelayNode { * Allows one to optionally pass a global function map as * well. * - * \param expr The expression to set as the entry point to the module. + * \param expr The expression to set as the main function to the module. * \param global_funcs The global function map. * - * \returns A module with expr set as the entry point. + * \returns A module with expr set as the main function. */ TVM_DLL static Module FromExpr( const Expr& expr, @@ -185,6 +196,9 @@ class ModuleNode : public RelayNode { TVM_DECLARE_NODE_TYPE_INFO(ModuleNode, Node); private: + /*! \brief Helper function for registering a typedef's constructors */ + void RegisterConstructors(const GlobalTypeVar& var, const TypeData& type); + /*! \brief A map from string names to global variables that * ensures global uniqueness. */ @@ -194,6 +208,11 @@ class ModuleNode : public RelayNode { * that ensures global uniqueness. */ tvm::Map global_type_var_map_; + + /*! \brief A map from constructor tags to constructor objects + * for convenient access + */ + std::unordered_map constructor_tag_map_; }; struct Module : public NodeRef { diff --git a/include/tvm/relay/transform.h b/include/tvm/relay/transform.h index 04b4e64dc9c3b..93129cf57a279 100644 --- a/include/tvm/relay/transform.h +++ b/include/tvm/relay/transform.h @@ -378,36 +378,6 @@ TVM_DLL Pass FoldConstant(); */ TVM_DLL Pass FuseOps(int fuse_opt_level = -1); -/*! - * \brief Apply rewrite rules to rewrite the expr in post DFS order. - * - * \param rewrite_map_attr_name The Op's attr name which corresponds to the rewrite - * rule function. - * \param fcontext Additional callback to provide context argument for each call node. - * \param fmulti_ref_trigger Transformation function to be called when - * an Expr consumed by multiple callers. - * - * \return The pass. - */ -TVM_DLL Pass ForwardRewrite(const std::string& rewrite_map_attr_name, - std::function fcontext = nullptr, - std::function - fmulti_ref_trigger = nullptr); - -/*! 
- * \brief Apply rewrite rules to rewrite the expr in post DFS order. - * - * \param rewrite_func The rewrite func that will apply to all operators. - * \param fcontext Additional callback to provide context argument for each call node. - * \param fmulti_ref_trigger Transformation function to be called when - * an Expr consumed by multiple callers. - * - * \return The pass. - */ -TVM_DLL Pass ForwardRewrite(const FForwardRewrite& rewrite_func, - std::function fcontext = nullptr, - std::function fmulti_ref_trigger = nullptr); - /*! * \brief Rewrite the annotated program. * @@ -434,6 +404,22 @@ TVM_DLL Pass RewriteAnnotatedOps(int fallback_device); */ TVM_DLL Pass ToANormalForm(); +/*! + * \brief Turn an expression into continuation passing style(CPS). + * + * CPS mean that every function will, instead of returning the result directly, + * be passed down an extra function (called the continuation) as argument, + * and pass the result to the continuation instead. + * + * Thus, every function call has to be passed an extra argument + * that represent the rest of the computation (Hence the name of continuation). + * + * Similarly, all other compute will be wrapped and call the continuation as well. + * + * \return the pass. + */ +TVM_DLL Pass ToCPS(); + /*! * \brief Remove let binding and directly share via pointer instead. * @@ -541,7 +527,132 @@ TVM_DLL Pass AlterOpLayout(); */ TVM_DLL Pass CanonicalizeCast(); +/*! + * \brief Add abstraction over a function + * + * For example: `square` is transformed to + * `fun x -> square x`. + * + * See https://en.wikipedia.org/wiki/Lambda_calculus#%CE%B7-conversion + * for more details. + * + * \return The pass. + */ +TVM_DLL Pass EtaExpand(); + } // namespace transform + +/*! + * \brief Bind the free variables to a Relay expression. This is a helper + * function usually called by other pass functions to help optimizations. + * + * \param expr The input expression. + * \param binds The variable to expression map that will be used to help the + * binding. + * + * \return The updated expression. + */ +TVM_DLL Expr Bind(const Expr& expr, const tvm::Map& binds); + +/*! + * \brief Infer the type of a function as if it is mapped to var in the mod. + * + * \param f the function. + * \param mod The module used for referencing global functions. + * \param var The global variable corresponding to the function. + * + * \return A type checked Function with its checked_type field populated. + * \note this function mutates mod and is not thread-safe. + */ +TVM_DLL Function InferType(const Function& f, + const Module& mod, + const GlobalVar& var); + +/*! + * \brief Apply rewrite rules to rewrite the expr in post DFS order. This + * function is used as a helper function to rewrtie an expression in a pass. + * + * \param expr The expression. + * \param rewrite_map_attr_name The Op's attr name which corresponds to the rewrite + * rule function. + * \param fcontext Additional callback to provide context argument for each call node. + * \param fmulti_ref_trigger Transformation function to be called when + * an Expr consumed by multiple callers. + * \return The rewritten expression. + */ +TVM_DLL Expr ForwardRewrite(const Expr& expr, + const std::string& rewrite_map_attr_name, + std::function fcontext = nullptr, + std::function fmulti_ref_trigger = nullptr); + +/*! + * \brief Apply rewrite rules to rewrite the expr in post DFS order. This + * function is used as a helper function to rewrtie an expression in a pass. + * + * \param expr The expression. 
+ * \param rewrite_func The rewrite func that will apply to all operators. + * \param fcontext Additional callback to provide context argument for each call node. + * \param fmulti_ref_trigger Transformation function to be called when + * an Expr consumed by multiple callers. + * + * \return The rewritten expression. + */ +TVM_DLL Expr ForwardRewrite(const Expr& expr, + const FForwardRewrite& rewrite_func, + std::function fcontext = nullptr, + std::function fmulti_ref_trigger = nullptr); + +/*! + * \brief Rewrite the annotated program. + * + * \param expr The expression. + * \param fallback_device The fallback device which is the default device for + * operators without annotation. + * + * \return The updated program. + */ +TVM_DLL Expr RewriteAnnotatedOps(const Expr& expr, int fallback_device); + +/*! + * \brief Turn an expression into continuation passing style(CPS). + * + * CPS mean that every function will, instead of returning the result directly, + * be passed down an extra function (called the continuation) as argument, + * and pass the result to the continuation instead. + * + * Thus, every function call has to be passed an extra argument + * that represent the rest of the computation (Hence the name of continuation). + * + * Similarly, all other compute will be wrapped and call the continuation as well. + * + * \param f the function. + * \param mod the module. + * + * \return the converted Function. + */ +TVM_DLL Function ToCPS(const Function& f, const Module& mod); + +/*! + * \brief Remove the continuation argument of a CPS function. + * + * Note that this only transform the type back into un-CPS form + * when there is no higher order input/output. + * + * \param f the function. + * + * \return the converted Function. + */ +TVM_DLL Function UnCPS(const Function& f); + +/*! + * \brief Deduplicate the bound variables and type variables in the expression. + * + * \param e the expression. + * + * \return the deduplicated expression. 
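The continuation-passing style that the `ToCPS` and `UnCPS` comments above describe is easier to see outside Relay first. A plain-Python illustration of the same idea (not a TVM API):

```python
# direct style: the result is returned to the caller
def square(x):
    return x * x

# CPS: the caller also passes in "the rest of the computation" (the continuation k),
# and the result is handed to k instead of being returned
def square_cps(x, k):
    return k(x * x)

# computing square(3) + 1 in both styles
assert square(3) + 1 == 10
assert square_cps(3, lambda r: r + 1) == 10
```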
+ */ +TVM_DLL Expr DeDup(const Expr& e); + } // namespace relay } // namespace tvm diff --git a/include/tvm/runtime/packed_func.h b/include/tvm/runtime/packed_func.h index 82b3dd4695415..17fd626ee51d0 100644 --- a/include/tvm/runtime/packed_func.h +++ b/include/tvm/runtime/packed_func.h @@ -962,10 +962,10 @@ inline std::ostream& operator<<(std::ostream& os, TVMType t) { // NOLINT(*) if (t.bits == 1 && t.lanes == 1 && t.code == kDLUInt) { os << "bool"; return os; } - if (GetCustomTypeRegistered(t.code)) { - os << "custom[" << GetCustomTypeName(t.code) << "]"; - } else { + if (t.code < kCustomBegin) { os << TypeCode2Str(t.code); + } else { + os << "custom[" << GetCustomTypeName(t.code) << "]"; } if (t.code == kHandle) return os; os << static_cast(t.bits); @@ -987,10 +987,10 @@ inline std::string TVMType2String(TVMType t) { if (t.bits == 1 && t.lanes == 1 && t.code == kDLUInt) { return "bool"; } - if (GetCustomTypeRegistered(t.code)) { - repr += "custom[" + GetCustomTypeName(t.code) + "]"; - } else { + if (t.code < kCustomBegin) { repr += TypeCode2Str(t.code); + } else { + repr += "custom[" + GetCustomTypeName(t.code) + "]"; } if (t.code == kHandle) return repr; repr += std::to_string(static_cast(t.bits)); diff --git a/nnvm/tests/python/compiler/test_to_relay.py b/nnvm/tests/python/compiler/test_to_relay.py index e79831d06cf26..dac14a8c1f220 100644 --- a/nnvm/tests/python/compiler/test_to_relay.py +++ b/nnvm/tests/python/compiler/test_to_relay.py @@ -18,7 +18,7 @@ from nnvm import testing from nnvm import to_relay import tvm -from tvm.relay import ir_pass +from tvm.relay import transform from tvm.relay import create_executor from tvm.contrib import graph_runtime import numpy as np @@ -41,10 +41,11 @@ def check_model(sym, shapes, dtypes, params): nnvm_rts.run(**inputs) nnvm_out = nnvm_rts.get_output(0) relay_model, params = to_relay.to_relay(net, shapes, dtypes, params) - relay_model = ir_pass.infer_type(relay_model) - relay_rts = create_executor(kind='graph', ctx=tvm.cpu(0), target='llvm') + mod = tvm.relay.Module.from_expr(relay_model) + mod = transform.InferType()(mod) + relay_rts = create_executor(kind='graph', mod=mod, ctx=tvm.cpu(0), target='llvm') inputs.update(params) - relay_out = relay_rts.evaluate(relay_model)(*list(inputs.values())) + relay_out = relay_rts.evaluate()(*list(inputs.values())) np.testing.assert_allclose(nnvm_out.asnumpy(), relay_out.asnumpy()) # def test_mlp(): diff --git a/python/tvm/api.py b/python/tvm/api.py index d88f06170543c..e4777b6e39649 100644 --- a/python/tvm/api.py +++ b/python/tvm/api.py @@ -531,7 +531,8 @@ def decl_buffer(shape, elem_offset=None, scope="", data_alignment=-1, - offset_factor=0): + offset_factor=0, + buffer_type=""): """Declare a new symbolic buffer. Normally buffer is created automatically during lower and build. @@ -574,11 +575,39 @@ def decl_buffer(shape, If 0 is pssed, the alignment will be set to 1. if non-zero is passed, we will created a Var for elem_offset if elem_offset is not None. + buffer_type: str, optional, {"", "auto_broadcast"} + auto_broadcast buffer allows one to implement broadcast computation + without considering whether dimension size equals to one. + TVM maps buffer[i][j][k] -> buffer[i][0][k] if dimension i's shape equals 1. + Returns ------- buffer : Buffer The created buffer + Example + ------- + Here's an example of how broadcast buffer can be used to define a symbolic broadcast operation, + + .. 
code-block:: python + + m0, m1, m2 = tvm.var("m0"), tvm.var("m1"), tvm.var("m2") + n0, n1, n2 = tvm.var("n0"), tvm.var("n1"), tvm.var("n2") + o0, o1, o2 = tvm.var("o0"), tvm.var("o1"), tvm.var("o2") + A = tvm.placeholder((m0, m1, m2), name='A') + B = tvm.placeholder((n0, n1, n2), name='B') + C = tvm.compute((o0, o1, o2), lambda i, j, k: A[i, j, k] + B[i, j, k], name='C') + Ab = tvm.decl_buffer(A.shape, A.dtype, name="Ab", buffer_type="auto_broadcast") + Bb = tvm.decl_buffer(B.shape, B.dtype, name="Bb", buffer_type="auto_broadcast") + s = tvm.create_schedule(C.op) + fadd = tvm.build(s, [A, B, C], target='llvm', name='bcast_add', binds={A:Ab, B:Bb}) + ctx = tvm.cpu(0) + a = tvm.nd.array(np.random.uniform(size=(2, 4, 3)).astype(A.dtype), ctx) + b = tvm.nd.array(np.random.uniform(size=(2, 1, 3)).astype(B.dtype), ctx) + c = tvm.nd.array(np.zeros((2, 4, 3), dtype=C.dtype), ctx) + fadd(a, b, c) + tvm.testing.assert_allclose(c.asnumpy(), a.asnumpy() + b.asnumpy()) + Note ---- Buffer data structure reflects the DLTensor structure in dlpack. @@ -602,7 +631,7 @@ def decl_buffer(shape, data = var(name, "handle") return _api_internal._Buffer( data, dtype, shape, strides, elem_offset, name, scope, - data_alignment, offset_factor) + data_alignment, offset_factor, buffer_type) def layout(layout_str): """Create a layout node from a string. diff --git a/python/tvm/autotvm/graph_tuner/base_graph_tuner.py b/python/tvm/autotvm/graph_tuner/base_graph_tuner.py index 252882d17eceb..cffd42347b35d 100644 --- a/python/tvm/autotvm/graph_tuner/base_graph_tuner.py +++ b/python/tvm/autotvm/graph_tuner/base_graph_tuner.py @@ -142,7 +142,7 @@ def __init__(self, graph, input_shapes, records, target_ops, # Generate workload and schedule dictionaries. if isinstance(graph, relay.Module): - graph = graph[graph.entry_func] + graph = graph["main"] if isinstance(graph, relay.expr.Function): node_dict = {} diff --git a/python/tvm/autotvm/graph_tuner/utils/traverse_graph.py b/python/tvm/autotvm/graph_tuner/utils/traverse_graph.py index c0debaedede0d..5d07bd3fbce5f 100644 --- a/python/tvm/autotvm/graph_tuner/utils/traverse_graph.py +++ b/python/tvm/autotvm/graph_tuner/utils/traverse_graph.py @@ -21,6 +21,7 @@ import topi from tvm import relay, autotvm +from tvm.relay import transform from tvm.relay.expr import Call, Function, TupleGetItem, Var, Constant, Tuple from tvm.relay.ty import TupleType, TensorType from tvm.autotvm.task import TaskExtractEnv @@ -80,6 +81,14 @@ def expr2graph(expr, target_ops, node_dict, node_list): task_pos += 1 +def _infer_type(node): + """A method to infer the type of a relay expression.""" + mod = relay.Module.from_expr(node) + mod = transform.InferType()(mod) + entry = mod["main"] + return entry if isinstance(node, relay.Function) else entry.body + + def _expr2graph_impl(expr, target_ops, node_dict, node_list): """Implementation to convert relay expr to graph data structure """ @@ -99,7 +108,7 @@ def _traverse_expr(node): node_entry["inputs"] += node_list[in_node_idx]["inputs"] else: node_entry["inputs"].append([in_node_idx, 0, 0]) - infer_out = relay.ir_pass.infer_type(node) + infer_out = _infer_type(node) out_type = infer_out._checked_type_ if isinstance(out_type, TensorType): node_entry["types"].append(out_type) @@ -127,10 +136,10 @@ def _traverse_expr(node): free_var = relay.Var("var_%d" % i, input_type) params.append(free_var) call = relay.Call(node.op, params, node.attrs) - func = relay.Function(params, call) + mod = relay.Module.from_expr(relay.Function(params, call))
relay.backend.compile_engine.get().clear() build_thread = threading.Thread(target=relay.build, - args=(func, + args=(mod, "llvm -device=tracing", None, None)) @@ -168,7 +177,7 @@ def _traverse_expr(node): node_dict[node] = node_index node_list.append(node_entry) - relay.ir_pass.post_order_visit(expr, _traverse_expr) + relay.analysis.post_order_visit(expr, _traverse_expr) def get_direct_ancestor(node_list, visited_dict, target_ops, node_idx, input_names): diff --git a/python/tvm/autotvm/graph_tuner/utils/utils.py b/python/tvm/autotvm/graph_tuner/utils/utils.py index 6151734299af6..b9777ef844595 100644 --- a/python/tvm/autotvm/graph_tuner/utils/utils.py +++ b/python/tvm/autotvm/graph_tuner/utils/utils.py @@ -17,6 +17,7 @@ # pylint: disable=eval-used,invalid-name,too-many-arguments """Utility functions""" from tvm import relay +from tvm.relay import transform def has_multiple_inputs(node_list, node_idx, input_names): @@ -107,4 +108,7 @@ def bind_inputs(expr, input_shapes=None, input_dtypes="float32"): rebind_dict[var] = updated_input_dict[var.name_hint] updated_expr = relay.expr.bind(expr, rebind_dict) - return relay.ir_pass.infer_type(updated_expr) + mod = relay.Module.from_expr(updated_expr) + mod = transform.InferType()(mod) + entry = mod["main"] + return entry if isinstance(updated_expr, relay.Function) else entry.body diff --git a/python/tvm/autotvm/task/relay_integration.py b/python/tvm/autotvm/task/relay_integration.py index d80443a208d66..5b0294ef2d07d 100644 --- a/python/tvm/autotvm/task/relay_integration.py +++ b/python/tvm/autotvm/task/relay_integration.py @@ -105,8 +105,9 @@ def extract_from_program(func, params, ops, target, target_host=None): relay.backend.compile_engine.get().clear() # wrap build call in thread to avoid multiprocessing problems + mod = relay.Module.from_expr(func) build_thread = threading.Thread(target=_build, - args=(func, + args=(mod, target, target_host, params)) @@ -183,8 +184,9 @@ def extract_from_multiple_program(funcs, params, ops, target, target_host=None): for func, param in zip(funcs, params): relay.backend.compile_engine.get().clear() # wrap build call in thread to avoid multiprocessing problems + mod = relay.Module.from_expr(func) build_thread = threading.Thread(target=my_build, - args=(func, + args=(mod, target, target_host, params)) diff --git a/python/tvm/make.py b/python/tvm/make.py index 7439952ad7adb..241edd6b09481 100644 --- a/python/tvm/make.py +++ b/python/tvm/make.py @@ -24,7 +24,6 @@ """ from __future__ import absolute_import as _abs from ._ffi.function import _init_api -from ._ffi.runtime_ctypes import TVMType def range_by_min_extent(min_value, extent): @@ -48,35 +47,6 @@ def range_by_min_extent(min_value, extent): return _range_by_min_extent(min_value, extent) -def static_cast(dtype, expr): - """Cast expr to dtype. - - If expr is scalar and dtype is a corresponding vector - type, a Broadcast is generated. Otherwise it is a Cast. - - Parameters - ---------- - dtype : str - The target data type. - - expr : Expr - The expression to be casted. - - Returns - ------- - casted : Expr - The casted expression. 
- """ - target_type = TVMType(dtype) - src_type = TVMType(expr.dtype) - if target_type.type_code == src_type.type_code and src_type.bits == target_type.bits: - if src_type.lanes == target_type.lanes: - return expr - if src_type.lanes == 1 and target_type.lanes > 1: - return Broadcast(expr, target_type.lanes) - return Cast(dtype, expr) - - def node(type_key, **kwargs): """Make a new DSL node by its type key and fields diff --git a/python/tvm/relay/__init__.py b/python/tvm/relay/__init__.py index 5536e503e6b67..dfac85bb1ed28 100644 --- a/python/tvm/relay/__init__.py +++ b/python/tvm/relay/__init__.py @@ -24,7 +24,7 @@ from . import expr_functor from . import module from . import adt -from . import ir_pass +from . import analysis from . import transform from .build_module import build, create_executor from .transform import build_config @@ -32,6 +32,7 @@ from . import parser from . import debug from . import param_dict +from . import feature # Root operators from .op import Op @@ -101,7 +102,7 @@ bind = expr.bind module_pass = transform.module_pass function_pass = transform.function_pass -alpha_equal = ir_pass.alpha_equal +alpha_equal = analysis.alpha_equal # ExprFunctor ExprFunctor = expr_functor.ExprFunctor @@ -122,3 +123,6 @@ ModulePass = transform.ModulePass FunctionPass = transform.FunctionPass Sequential = transform.Sequential + +# Feature +Feature = feature.Feature diff --git a/python/tvm/relay/_ir_pass.py b/python/tvm/relay/_analysis.py similarity index 89% rename from python/tvm/relay/_ir_pass.py rename to python/tvm/relay/_analysis.py index 3a0e0ac846b99..32a7324ae29f5 100644 --- a/python/tvm/relay/_ir_pass.py +++ b/python/tvm/relay/_analysis.py @@ -14,8 +14,8 @@ # KIND, either express or implied. See the License for the # specific language governing permissions and limitations # under the License. -"""FFI exposing the Relay type inference and checking.""" +"""FFI exposing the passes for Relay program analysis.""" from tvm._ffi.function import _init_api -_init_api("relay._ir_pass", __name__) +_init_api("relay._analysis", __name__) diff --git a/python/tvm/relay/_ir_pass.pyi b/python/tvm/relay/_ir_pass.pyi deleted file mode 100644 index 13035bb36f716..0000000000000 --- a/python/tvm/relay/_ir_pass.pyi +++ /dev/null @@ -1,26 +0,0 @@ -# Licensed to the Apache Software Foundation (ASF) under one -# or more contributor license agreements. See the NOTICE file -# distributed with this work for additional information -# regarding copyright ownership. The ASF licenses this file -# to you under the Apache License, Version 2.0 (the -# "License"); you may not use this file except in compliance -# with the License. You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, -# software distributed under the License is distributed on an -# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY -# KIND, either express or implied. See the License for the -# specific language governing permissions and limitations -# under the License. - -import tvm -from . import ir -from .env import Module - -def check_expr(env: Module, expr: ir.Expr) -> ir.Type: ... -def generalize(env: Module, expr: ir.Expr) -> ir.Expr: ... -def _get_checked_type(expr: ir.Expr) -> ir.Type: ... -def well_formed(expr: ir.Expr) -> bool: ... -def dead_code_elimination(expr: ir.Expr) -> ir.Expr: ... 
diff --git a/python/tvm/relay/analysis.py b/python/tvm/relay/analysis.py new file mode 100644 index 0000000000000..ee8ce985fcbc0 --- /dev/null +++ b/python/tvm/relay/analysis.py @@ -0,0 +1,363 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. +# pylint: disable=no-else-return +# pylint: disable=unidiomatic-typecheck +""" +This file contains the set of passes for Relay, which exposes an interface for +configuring the passes and scripting them in Python. +""" +from . import _analysis +from . import _make +from .expr import Expr +from .ty import Type +from .module import Module +from .feature import Feature + + +def post_order_visit(expr, fvisit): + """Recursively visit the ir in post DFS order, + applying fvisit to each node. Each node is guaranteed to be visited + only once. + + Parameters + ---------- + expr : tvm.relay.Expr + The input expression. + + fvisit : function + The visitor function to be applied. + """ + return _analysis.post_order_visit(expr, fvisit) + + +def well_formed(expr): + """Check that each Var is only bound once (well formed). + + Parameters + ---------- + expr : tvm.relay.Expr + The input expression + + Returns + ------- + well_form : bool + Whether the input expression is well formed + """ + return _analysis.well_formed(expr) + + +def check_kind(t, mod=None): + """Check that the type is well kinded and return the kind. + For example, this means a type cannot have a tensor of tensors, or be a tuple type + of two shapes. + + Parameters + ---------- + t : tvm.relay.Type + The type to check + + mod : Optional[tvm.relay.Module] + The global module. + + Returns + ------- + kind : Kind + the kind of t + + Examples + -------- + .. code:: python + + assert check_kind(relay.TupleType([relay.TypeParam('tp1', relay.Kind.Shape)])) == Shape + assert check_kind(relay.TupleType([relay.TypeParam('tp1', relay.Kind.Type)])) == Type + """ + if mod is not None: + return _analysis.check_kind(t, mod) + else: + return _analysis.check_kind(t) + + +def free_vars(expr): + """Get free Vars from expression expr in Post DFS order. + + Parameters + ---------- + expr : tvm.relay.Expr + The input expression + + Returns + ------- + free : List[tvm.relay.Var] + The list of free variables in post DFS order. + + Note + ---- + The fact that Vars are post-DFS ordered is useful in + neural networks: usually this means the weights of previous + layers are ordered first. + """ + return _analysis.free_vars(expr) + + +def bound_vars(expr): + """Get bound vars from expression expr in post-DFS order. + + Parameters + ---------- + expr : tvm.relay.Expr + The input expression + + Returns + ------- + free : List[tvm.relay.Var] + The list of bound variables in post-DFS order. + """ + return _analysis.bound_vars(expr) + + +def all_vars(expr): + """Get all vars from expression expr in post-DFS order.
+ + Parameters + ---------- + expr : tvm.relay.Expr + The input expression + + Returns + ------- + free : List[tvm.relay.Var] + The list of all variables in post-DFS order. + """ + return _analysis.all_vars(expr) + + +def free_type_vars(expr, mod=None): + """Get free type variables from expression/type e + + Parameters + ---------- + expr : Union[tvm.relay.Expr,tvm.relay.Type] + The input expression/type + + mod : Optional[tvm.relay.Module] + The global module + + Returns + ------- + free : List[tvm.relay.TypeVar] + The list of free type variables in post-DFS order + """ + use_mod = mod if mod is not None else Module() + return _analysis.free_type_vars(expr, use_mod) + + +def bound_type_vars(expr, mod=None): + """Get bound type variables from expression/type e + + Parameters + ---------- + expr : Union[tvm.relay.Expr,tvm.relay.Type] + The input expression/type + + mod : Optional[tvm.relay.Module] + The global module + + Returns + ------- + free : List[tvm.relay.TypeVar] + The list of bound type variables in post-DFS order + """ + use_mod = mod if mod is not None else Module() + return _analysis.bound_type_vars(expr, use_mod) + + +def all_type_vars(expr, mod=None): + """Get all type variables from expression/type e + + Parameters + ---------- + expr : Union[tvm.relay.Expr,tvm.relay.Type] + The input expression/type + + mod : Optional[tvm.relay.Module] + The global module + + Returns + ------- + free : List[tvm.relay.TypeVar] + The list of all type variables in post-DFS order + """ + use_mod = mod if mod is not None else Module() + return _analysis.all_type_vars(expr, use_mod) + + +def alpha_equal(lhs, rhs): + """Compare two Relay expr for structural equivalence (alpha equivalence). + + Parameters + ---------- + lhs : tvm.relay.Expr + One of the input Expression. + + rhs : tvm.relay.Expr + One of the input Expression. + + Returns + ------- + result : bool + True iff lhs is alpha equal to rhs. + """ + return bool(_make._alpha_equal(lhs, rhs)) + + +def graph_equal(lhs, rhs): + """Compare two Relay expr for data-flow equivalence. + The difference between this and alpha-equality is that + variables are not expected to match between lhs and rhs; + they are treated as sources and are mapped between each other. + + Parameters + ---------- + lhs : tvm.relay.Expr + One of the input Expression. + + rhs : tvm.relay.Expr + One of the input Expression. + + Returns + ------- + result : bool + True iff lhs is data-flow equivalent to rhs. + """ + return bool(_make._graph_equal(lhs, rhs)) + + +def collect_device_info(expr): + """Collect the device allocation map for the given expression. The device + ids are propagated from the `device_copy` operators. + + Parameters + ---------- + expr : tvm.relay.Expr + The input expression. + + Returns + ------- + ret : Dict[tvm.relay.expr, int] + A dictionary mapping tvm.relay.Expr to device type. + """ + return _analysis.CollectDeviceInfo(expr) + + +def collect_device_annotation_ops(expr): + """Collect the device annotation ops for the given expression. + + Parameters + ---------- + expr : tvm.relay.Expr + The input expression. + + Returns + ------- + ret : Dict[tvm.relay.expr, int] + A dictionary mapping tvm.relay.Expr to device type where the keys are + annotation expressions. + """ + return _analysis.CollectDeviceAnnotationOps(expr) + + +def get_total_mac_number(expr): + """ + Count the number of MACs (multiply-accumulate) of a model + + Parameters + ---------- + expr : tvm.relay.Expr + The input expression. 
+ + Returns + ------- + result : int64 + The number of MACs (multiply-accumulate) of a model + """ + return _analysis.GetTotalMacNumber(expr) + + +def unmatched_cases(match, mod=None): + """ + Finds cases that the match expression does not catch, if any. + + Parameters + ---------- + match : tvm.relay.Match + The match expression + + mod : Optional[tvm.relay.Module] + The module (defaults to an empty module) + + Returns + ------- + missing_patterns : [tvm.relay.Pattern] + Patterns that the match expression does not catch. + """ + return _analysis.unmatched_cases(match, mod) + + +def detect_feature(a, b=None): + """ + Detect the feature used in a relay program. + + Parameters + ---------- + a : Union[tvm.relay.Expr, tvm.relay.Module] + The input expression or module. + + b : Optional[Union[tvm.relay.Expr, tvm.relay.Module]] + The input expression or module. + The two arguments cannot both be expression or module. + + Returns + ------- + features : Set[Feature] + Features used in the program. + """ + if isinstance(a, Module): + a, b = b, a + return set([Feature(int(x)) for x in _analysis.detect_feature(a, b)]) + + +def structural_hash(value): + """Hash a Relay expression structurally. + + Parameters + ---------- + expr : Union[tvm.relay.Expr, tvm.relay.Type] + The expression to hash. + + Returns + ------- + result : int + The hash value + """ + if isinstance(value, Expr): + return int(_analysis._expr_hash(value)) + elif isinstance(value, Type): + return int(_analysis._type_hash(value)) + else: + msg = ("found value of type {0} expected" + + "relay.Expr or relay.Type").format(type(value)) + raise TypeError(msg) diff --git a/python/tvm/relay/backend/interpreter.py b/python/tvm/relay/backend/interpreter.py index c54a65b78fb23..462dda9488c21 100644 --- a/python/tvm/relay/backend/interpreter.py +++ b/python/tvm/relay/backend/interpreter.py @@ -21,7 +21,7 @@ import numpy as np from . import _backend -from .. import _make, ir_pass, transform +from .. import _make, analysis, transform from .. import module from ... import register_func, nd from ..base import NodeBase, register_relay_node @@ -114,17 +114,18 @@ def __init__(self, value): _make.RefValue, value) -def _arg_to_ast(arg): +def _arg_to_ast(mod, arg): if isinstance(arg, TensorValue): return Constant(arg.data.copyto(nd.cpu(0))) elif isinstance(arg, TupleValue): - return Tuple([_arg_to_ast(field) for field in arg.fields]) + return Tuple([_arg_to_ast(mod, field) for field in arg.fields]) elif isinstance(arg, tuple): - return Tuple([_arg_to_ast(field) for field in arg]) + return Tuple([_arg_to_ast(mod, field) for field in arg]) elif isinstance(arg, RefValue): - return RefCreate(_arg_to_ast(arg.value)) + return RefCreate(_arg_to_ast(mod, arg.value)) elif isinstance(arg, ConstructorValue): - return Call(arg.constructor, [_arg_to_ast(field) for field in arg.fields]) + return Call(mod.get_constructor(arg.tag), + [_arg_to_ast(mod, field) for field in arg.fields]) elif isinstance(arg, np.ndarray): return Constant(nd.array(arg)) elif isinstance(arg, Constant): @@ -163,6 +164,8 @@ def _convert_args(self, expr, args, kwargs): args: List[tvm.NDArray] The new arguments with all keyword arguments placed in the correct slot. 
""" + assert expr is not None + if not kwargs: return args @@ -229,7 +232,7 @@ def evaluate(self, expr=None, binds=None): if binds: scope_builder = ScopeBuilder() for key, value in binds.items(): - scope_builder.let(key, _arg_to_ast(value)) + scope_builder.let(key, _arg_to_ast(self.mod, value)) scope_builder.ret(expr) expr = scope_builder.get() @@ -237,7 +240,7 @@ def evaluate(self, expr=None, binds=None): return self._make_executor() if isinstance(expr, Function): - assert not ir_pass.free_vars(expr) + assert not analysis.free_vars(expr) if isinstance(expr, (Function, GlobalVar)): return self._make_executor(expr) @@ -286,29 +289,29 @@ def _make_executor(self, expr=None): assert self.mod is not None def _interp_wrapper(*args, **kwargs): if expr is None: - args = self._convert_args(self.mod[self.mod.entry_func], args, kwargs) + args = self._convert_args(self.mod["main"], args, kwargs) else: args = self._convert_args(expr, args, kwargs) relay_args = [] for arg in args: - relay_args.append(_arg_to_ast(arg)) + relay_args.append(_arg_to_ast(self.mod, arg)) # Set the entry function for the module. if expr is None: pass elif isinstance(expr, GlobalVar): - self.mod[self.mod.entry_func] = self.mod[expr] + self.mod["main"] = self.mod[expr] else: assert isinstance(expr, Function) func = Function([], Call(expr, relay_args)) relay_args = [] if self.mod: - self.mod[self.mod.entry_func] = func + self.mod["main"] = func else: self.mod = module.Module.from_expr(func) mod = self.optimize() - opt_expr = Call(mod[self.mod.entry_func.name_hint], relay_args) + opt_expr = Call(mod["main"], relay_args) return self._intrp(opt_expr) return _interp_wrapper diff --git a/python/tvm/relay/backend/vm.py b/python/tvm/relay/backend/vm.py index ceb403fe77174..152ee576e7bdb 100644 --- a/python/tvm/relay/backend/vm.py +++ b/python/tvm/relay/backend/vm.py @@ -45,7 +45,7 @@ def optimize(mod): ret : tvm.relay.Module The optimized module. """ - main_func = mod[mod.entry_func] + main_func = mod["main"] opt_passes = [] if not main_func.params and isinstance(main_func.body, GlobalVar): @@ -134,8 +134,8 @@ def _make_executor(self, expr=None): expr = expr if expr else self.mod assert expr, "either expr or self.mod should be not null." if isinstance(expr, Expr): - self.mod[self.mod.entry_func] = expr - main = self.mod[self.mod.entry_func] + self.mod["main"] = expr + main = self.mod["main"] def _vm_wrapper(*args, **kwargs): args = self._convert_args(main, args, kwargs) diff --git a/python/tvm/relay/build_module.py b/python/tvm/relay/build_module.py index cdda17aa517b6..404829f74cf78 100644 --- a/python/tvm/relay/build_module.py +++ b/python/tvm/relay/build_module.py @@ -25,7 +25,6 @@ from .. import nd as _nd, target as _target, autotvm from ..contrib import graph_runtime as _graph_rt from . import _build_module -from . import ir_pass from . import ty as _ty from . import expr as _expr from .module import Module as _Module @@ -178,7 +177,7 @@ def build(mod, target=None, target_host=None, params=None): The parameters of the final graph. """ if isinstance(mod, _Module): - func = mod[mod.entry_func] + func = mod["main"] elif isinstance(mod, _expr.Function): func = mod warnings.warn( @@ -227,23 +226,23 @@ class GraphExecutor(_interpreter.Executor): """ def __init__(self, mod, ctx, target): + assert mod is not None self.mod = mod self.ctx = ctx self.target = target def _make_executor(self, expr=None): - if not expr: - assert self.mod, "either expr or self.mod should be not null." 
- expr = self.mod[self.mod.entry_func] - ret_type = ir_pass.infer_type(expr).ret_type + if expr: + self.mod["main"] = expr + ret_type = self.mod["main"].checked_type.ret_type num_outputs = len(ret_type.fields) if isinstance(ret_type, _ty.TupleType) else 1 - graph_json, mod, params = build(expr, target=self.target) + graph_json, mod, params = build(self.mod, target=self.target) gmodule = _graph_rt.create(graph_json, mod, self.ctx) if params: gmodule.set_input(**params) def _graph_wrapper(*args, **kwargs): - args = self._convert_args(expr, args, kwargs) + args = self._convert_args(self.mod["main"], args, kwargs) # Create map of inputs. for i, arg in enumerate(args): gmodule.set_input(i, arg) @@ -280,6 +279,8 @@ def create_executor(kind="debug", target : :py:class:`tvm.Target` The corresponding context """ + if mod is None: + mod = _Module() if ctx is not None: assert ctx.device_type == _nd.context(str(target), 0).device_type else: diff --git a/python/tvm/relay/expr.pyi b/python/tvm/relay/expr.pyi index b7395c365390a..d264e99e05770 100644 --- a/python/tvm/relay/expr.pyi +++ b/python/tvm/relay/expr.pyi @@ -19,7 +19,7 @@ from typing import List import tvm from .base import Span, NodeBase from .ty import Type, TypeParam -from ._ir_pass import _get_checked_type +from ._analysis import _get_checked_type class Expr(NodeBase): @@ -128,4 +128,4 @@ class If(Expr): def __init__(self, cond, true_value, false_value): # type: (Expr, Expr, Expr) -> None - ... \ No newline at end of file + ... diff --git a/python/tvm/relay/frontend/caffe2.py b/python/tvm/relay/frontend/caffe2.py index 18489b380ee71..43d9d21c09b5d 100644 --- a/python/tvm/relay/frontend/caffe2.py +++ b/python/tvm/relay/frontend/caffe2.py @@ -18,7 +18,7 @@ """Caffe2 frontend""" from __future__ import absolute_import as _abs import tvm -from .. import ir_pass +from .. import analysis from .. import expr as _expr from .. import module as _module from .. import op as _op @@ -450,8 +450,8 @@ def from_caffe2(self, init_net, predict_net): else: outputs = out[0] - func = _expr.Function(ir_pass.free_vars(outputs), outputs) - self._mod[self._mod.entry_func] = func + func = _expr.Function(analysis.free_vars(outputs), outputs) + self._mod["main"] = func return self._mod, self._params diff --git a/python/tvm/relay/frontend/common.py b/python/tvm/relay/frontend/common.py index efd198803c2b6..c5057f35fedef 100644 --- a/python/tvm/relay/frontend/common.py +++ b/python/tvm/relay/frontend/common.py @@ -19,8 +19,8 @@ import logging from topi.util import get_const_tuple from .. import expr as _expr -from .. import expr as _expr -from .. import ir_pass +from .. import module as _module +from .. import transform as _transform from .. import op as _op @@ -407,9 +407,17 @@ def get_name(node): name = node.name_hint return name + +def infer_type(node): + """A method to infer the type of an intermediate node in the relay graph.""" + mod = _module.Module.from_expr(node) + mod = _transform.InferType()(mod) + entry = mod["main"] + return entry if isinstance(node, _expr.Function) else entry.body + def infer_shape(inputs): """A method to get the output shape of an intermediate node in the graph.""" - out_type = ir_pass.infer_type(inputs) + out_type = infer_type(inputs) out_shapes = get_const_tuple(out_type.checked_type.shape) return out_shapes @@ -417,7 +425,7 @@ def infer_channels(inputs, transpose=False): """A hack for getting 'channels' or 'units' since caffe2 does not provide these attributes. We check the shape of weights provided to get the number. 
""" - out_type = ir_pass.infer_type(inputs) + out_type = infer_type(inputs) out_shapes = [get_const_tuple(out_type.checked_type.shape)] channels = out_shapes[0][0] if not transpose else out_shapes[0][1] return channels diff --git a/python/tvm/relay/frontend/coreml.py b/python/tvm/relay/frontend/coreml.py index 1cac547d07c95..e7b129e66724b 100644 --- a/python/tvm/relay/frontend/coreml.py +++ b/python/tvm/relay/frontend/coreml.py @@ -19,7 +19,7 @@ from __future__ import absolute_import as _abs import numpy as np import tvm -from .. import ir_pass +from .. import analysis from .. import expr as _expr from .. import module as _module from .. import op as _op @@ -462,6 +462,6 @@ def from_coreml(model, shape=None): for o in spec.description.output] # for now return first output outexpr = outexpr[0] - func = _expr.Function(ir_pass.free_vars(outexpr), outexpr) + func = _expr.Function(analysis.free_vars(outexpr), outexpr) params = {k:_nd.array(np.array(v, dtype=np.float32)) for k, v in etab.params.items()} return _module.Module.from_expr(func), params diff --git a/python/tvm/relay/frontend/darknet.py b/python/tvm/relay/frontend/darknet.py index 7b26ed5692df7..f452146ae46cc 100644 --- a/python/tvm/relay/frontend/darknet.py +++ b/python/tvm/relay/frontend/darknet.py @@ -23,7 +23,7 @@ from enum import Enum import numpy as np import tvm -from .. import ir_pass +from .. import analysis from .. import expr as _expr from .. import module as _module from .common import get_relay_op, new_var @@ -820,7 +820,7 @@ def from_darknet(self): outputs = _as_list(sym) + self._outs outputs = outputs[0] if len(outputs) == 1 else _expr.Tuple(outputs) - sym = _expr.Function(ir_pass.free_vars(outputs), outputs) + sym = _expr.Function(analysis.free_vars(outputs), outputs) return _module.Module.from_expr(sym), self._tvmparams def from_darknet(net, diff --git a/python/tvm/relay/frontend/keras.py b/python/tvm/relay/frontend/keras.py index ad033f9bf3260..91da87c84b809 100644 --- a/python/tvm/relay/frontend/keras.py +++ b/python/tvm/relay/frontend/keras.py @@ -20,7 +20,7 @@ import sys import numpy as np import tvm -from .. import ir_pass +from .. import analysis from .. import expr as _expr from .. import module as _module from .. import op as _op @@ -743,6 +743,6 @@ def _convert_input_layer(keras_layer): outexpr = [etab.get_expr(oc[0].name + ":" + str(oc[1]) + ":" + str(oc[2])) \ for oc in model._output_coordinates] outexpr = outexpr[0] if len(outexpr) == 1 else _expr.Tuple(outexpr) - func = _expr.Function(ir_pass.free_vars(outexpr), outexpr) + func = _expr.Function(analysis.free_vars(outexpr), outexpr) params = {k:_nd.array(np.array(v, dtype=np.float32)) for k, v in etab.params.items()} return _module.Module.from_expr(func), params diff --git a/python/tvm/relay/frontend/mxnet.py b/python/tvm/relay/frontend/mxnet.py index 0bcee63ad3e8c..e40f1dea61a9f 100644 --- a/python/tvm/relay/frontend/mxnet.py +++ b/python/tvm/relay/frontend/mxnet.py @@ -20,7 +20,7 @@ import json import tvm -from .. import ir_pass +from .. import analysis, transform from .. import expr as _expr from .. import op as _op from .. 
import module as _module @@ -41,6 +41,13 @@ "relu" : _op.nn.relu } +def _infer_type(node): + """A method to infer the type of an intermediate node in the relay graph.""" + mod = _module.Module.from_expr(node) + mod = transform.InferType()(mod) + entry = mod["main"] + return entry if isinstance(node, _expr.Function) else entry.body + def _mx_fully_connected(inputs, attrs): import mxnet as mx units = attrs.get_int("num_hidden") @@ -89,7 +96,8 @@ def _stable_softrelu(x): def _mx_compare(new_op, wrapper): def impl(inputs, attrs): - dtype = ir_pass.infer_type(inputs[0]).checked_type.dtype + expr = _infer_type(inputs[0]) + dtype = expr.checked_type.dtype return wrapper(new_op)(inputs, attrs).astype(dtype) return impl @@ -258,7 +266,8 @@ def _mx_slice_like(inputs, attrs): def _mx_slice_axis(inputs, attrs): assert len(inputs) == 1 - shape = ir_pass.infer_type(inputs[0]).checked_type.shape + expr = _infer_type(inputs[0]) + shape = expr.checked_type.shape axis = attrs.get_int("axis") ax_beg = attrs.get_int("begin") ax_end = attrs.get_str("end") @@ -302,7 +311,8 @@ def _mx_crop_like(inputs, attrs): if offset == (0, 0): new_attrs["axes"] = (2, 3) return _op.slice_like(*inputs, **new_attrs) - like_shape = ir_pass.infer_type(inputs[1]).checked_type.shape + expr = _infer_type(inputs[1]) + like_shape = expr.checked_type.shape new_attrs['begin'] = [0, 0, offset[0], offset[1]] new_attrs['end'] = [like_shape[0], like_shape[1], offset[0]+like_shape[2], offset[1]+like_shape[3]] @@ -532,7 +542,8 @@ def _mx_resize(inputs, attrs): scale_width = attrs.get_float("scale_width", None) height = attrs.get_int("height", 1) width = attrs.get_int("width", 1) - shape = ir_pass.infer_type(inputs[0]).checked_type.shape + expr = _infer_type(inputs[0]) + shape = expr.checked_type.shape if scale_height is not None: height = (scale_height * shape[2]).astype("int32") if scale_width is not None: @@ -639,7 +650,8 @@ def _mx_broadcast_axis(inputs, attrs): assert len(axis) == len(size) if len(axis) == 0: return inputs[0] - src_shape = ir_pass.infer_type(inputs[0])._checked_type_.shape + expr = _infer_type(inputs[0]) + src_shape = expr.checked_type.shape tgt_shape = [] for i, dim in enumerate(src_shape): if i not in axis: @@ -734,7 +746,8 @@ def _rnn_cell(data, states, i2h_weight, h2h_weight, i2h_bias, h2h_bias, activati return out, [out] def _gru_cell(data, states, i2h_weight, h2h_weight, i2h_bias, h2h_bias): - dtype = ir_pass.infer_type(data).checked_type.dtype + expr = _infer_type(data) + dtype = expr.checked_type.dtype i2h = _op.nn.bias_add(_op.nn.dense(data, i2h_weight), i2h_bias, axis=-1) h2h = _op.nn.bias_add(_op.nn.dense(states[0], h2h_weight), h2h_bias, axis=-1) i2h_r, i2h_z, i2h = _op.split(i2h, indices_or_sections=3, axis=1) @@ -776,7 +789,8 @@ def _lstm_cell(data, states, i2h_weight, h2h_weight, i2h_bias, h2h_bias): seq_data = inputs[0] concat_weight = inputs[1] init_states = inputs[2:] - data_shape = ir_pass.infer_type(seq_data).checked_type.shape + expr = _infer_type(seq_data) + data_shape = expr.checked_type.shape seq_len = int(data_shape[0]) assert len(concat_weight) == num_layers * 4 * direct @@ -1099,7 +1113,7 @@ def _from_mxnet_impl(symbol, shape_dict, dtype_info, mod=None): outputs = [node_map[e[0]][e[1]] for e in jgraph["heads"]] outputs = outputs[0] if len(outputs) == 1 else _expr.Tuple(outputs) - func = _expr.Function(ir_pass.free_vars(outputs), outputs) + func = _expr.Function(analysis.free_vars(outputs), outputs) return func @@ -1186,5 +1200,5 @@ def from_mxnet(symbol, else: msg = "mxnet.Symbol or 
gluon.HybridBlock expected, got {}".format(type(symbol)) raise ValueError(msg) - mod[mod.entry_func] = func + mod["main"] = func return mod, params diff --git a/python/tvm/relay/frontend/onnx.py b/python/tvm/relay/frontend/onnx.py index bb968ec0bea8a..397ca90de55f2 100644 --- a/python/tvm/relay/frontend/onnx.py +++ b/python/tvm/relay/frontend/onnx.py @@ -22,7 +22,7 @@ import numpy as np import tvm from ... import nd as _nd -from .. import ir_pass +from .. import analysis from .. import transform as _transform from .. import expr as _expr from .. import module as _module @@ -412,7 +412,7 @@ def _impl_v1(cls, inputs, attr, params): else: data, shape = inputs logging.warning("Constant evaluating Reshape's shape argument, may reduce performance") - shape_params = ir_pass.free_vars(shape) + shape_params = analysis.free_vars(shape) func = _expr.Function(shape_params, shape) mod = _module.Module.from_expr(func) seq = _transform.Sequential([_transform.InferType(), @@ -1106,7 +1106,7 @@ def from_onnx(self, graph, opset): # now return the outputs outputs = [self._nodes[self._parse_value_proto(i)] for i in graph.output] outputs = outputs[0] if len(outputs) == 1 else _expr.Tuple(outputs) - func = _expr.Function(ir_pass.free_vars(outputs), outputs) + func = _expr.Function(analysis.free_vars(outputs), outputs) return _module.Module.from_expr(func), self._params def _parse_value_proto(self, value_proto): diff --git a/python/tvm/relay/frontend/tensorflow.py b/python/tvm/relay/frontend/tensorflow.py index d754e85ef78d7..59e0983e95985 100644 --- a/python/tvm/relay/frontend/tensorflow.py +++ b/python/tvm/relay/frontend/tensorflow.py @@ -27,7 +27,8 @@ import tvm from topi.util import get_const_tuple -from .. import ir_pass +from .. import analysis +from .. import transform as _transform from .. import expr as _expr from .. import op as _op from ..expr_functor import ExprMutator @@ -38,9 +39,9 @@ def _infer_value(input_val, params): from tvm.contrib import graph_runtime # Check that all free variables have associated parameters. - assert all(var.name_hint in params.keys() for var in ir_pass.free_vars( + assert all(var.name_hint in params.keys() for var in analysis.free_vars( input_val)), "All inputs to infer must be available in params." 
- func = _expr.Function(ir_pass.free_vars(input_val), input_val) + func = _expr.Function(analysis.free_vars(input_val), input_val) with tvm.relay.build_config(opt_level=0): graph, lib, params = tvm.relay.build(func, target="llvm", params=params) ctx = tvm.context("llvm", 0) @@ -235,9 +236,16 @@ def _infer_out_shapes(inputs, params): """A method to get the output shape of intermediate nodes in the relay graph.""" return [_infer_shape(inputs, params)] +def _infer_type(node): + """A method to infer the type of an intermediate node in the relay graph.""" + mod = _module.Module.from_expr(node) + mod = _transform.InferType()(mod) + entry = mod["main"] + return entry if isinstance(node, _expr.Function) else entry.body + def _infer_shape(node, params=None): """A method to get the output shape of an intermediate node in the relay graph.""" - out_type = ir_pass.infer_type(node) + out_type = _infer_type(node) return get_const_tuple(out_type.checked_type.shape) def _get_param(params, input_node): @@ -1841,7 +1849,8 @@ def _while_loop(self): bind_map = {} for i, var in enumerate(self.loop_vars): if not isinstance(var, _expr.Var): - var_type = ir_pass.infer_type(var).checked_type + var_chk = _infer_type(var) + var_type = var_chk.checked_type else: var_type = var.type_annotation @@ -2112,8 +2121,8 @@ def from_tensorflow(self, graph, layout="NHWC", shape=None, outputs=None): out.append(out_rnn) out = out[0] if len(out) == 1 else _expr.Tuple(out) - func = _expr.Function(ir_pass.free_vars(out), out) - self._mod[self._mod.entry_func] = func + func = _expr.Function(analysis.free_vars(out), out) + self._mod["main"] = func return self._mod, self._params def _parse_import_prerequisites(self, graph): @@ -2329,7 +2338,8 @@ def _convert_control_flow_operator(self, node, inputs, attrs, control_flow_node_ else: if node_name_prefix not in self._branches: self._branches[node_name_prefix] = Branch() - self._branches[node_name_prefix].cond = ir_pass.infer_type(op[0]) + chk_op = _infer_type(op[0]) + self._branches[node_name_prefix].cond = chk_op elif node.op == "NextIteration": op = self._nodes[node.input[0]] assert len(op) == 1 diff --git a/python/tvm/relay/frontend/tflite.py b/python/tvm/relay/frontend/tflite.py index fe163871fa60f..bf1938b1481e7 100644 --- a/python/tvm/relay/frontend/tflite.py +++ b/python/tvm/relay/frontend/tflite.py @@ -20,7 +20,7 @@ import math import numpy as np import tvm -from .. import ir_pass +from .. import analysis from .. import expr as _expr from .. import module as _module from .. import op as _op @@ -914,5 +914,5 @@ def from_tflite(model, shape_dict, dtype_dict): params = {k:_nd.array(np.array(v)) for k, v in exp_tab.params.items()} outputs = [exp_tab.get_expr(get_tensor_name(subgraph, i)) for i in model_outputs] outputs = outputs[0] if len(outputs) == 1 else _expr.Tuple(outputs) - func = _expr.Function(ir_pass.free_vars(outputs), outputs) + func = _expr.Function(analysis.free_vars(outputs), outputs) return _module.Module.from_expr(func), params diff --git a/python/tvm/relay/ir_pass.py b/python/tvm/relay/ir_pass.py deleted file mode 100644 index 1748571cb3163..0000000000000 --- a/python/tvm/relay/ir_pass.py +++ /dev/null @@ -1,704 +0,0 @@ -# Licensed to the Apache Software Foundation (ASF) under one -# or more contributor license agreements. See the NOTICE file -# distributed with this work for additional information -# regarding copyright ownership. 
The ASF licenses this file -# to you under the Apache License, Version 2.0 (the -# "License"); you may not use this file except in compliance -# with the License. You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, -# software distributed under the License is distributed on an -# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY -# KIND, either express or implied. See the License for the -# specific language governing permissions and limitations -# under the License. -# pylint: disable=no-else-return -# pylint: disable=unidiomatic-typecheck -""" -This file contains the set of passes for Relay, which exposes an interface for -configuring the passes and scripting them in Python. -""" -from . import _ir_pass -from . import _make -from .expr import Expr -from .ty import Type -from .module import Module -from .feature import Feature - - -def post_order_visit(expr, fvisit): - """Recursively visit the ir in post DFS order node, - apply fvisit. Each node is guaranteed to be visited - only once. - - Parameters - ---------- - expr : tvm.relay.Expr - The input expression. - - fvisit : function - The visitor function to be applied. - """ - return _ir_pass.post_order_visit(expr, fvisit) - -def infer_type(expr, mod=None): - """Infer the type of expr under the context of mod. - - Parameters - ---------- - expr: tvm.relay.Expr - The input expression. - - mod: Optional[tvm.relay.Module] - The global module. - - Returns - ------- - checked_expr : tvm.relay.Expr - The checked expression. - """ - return _ir_pass.infer_type(expr, mod) - - -def backward_fold_scale_axis(expr): - """Backward fold axis scaling into weights of conv2d/dense. - - Parameters - ---------- - expr : tvm.relay.Expr - The input expression, we expect that expr's types - should be fully inferred by infer_type. - - Returns - ------- - folded_expr : tvm.relay.Expr - The folded expression after transformation. - - Note - ---- - It is recommended to call backward_fold_scale_axis - before using forward_fold_scale_axis. - As backward folding targets common conv-bn pattern. - """ - return _ir_pass.backward_fold_scale_axis(expr) - -def eta_expand(expr, mod): - """Add abstraction over a function. - - Parameters - ---------- - expr : tvm.relay.Expr - The input expression, we expect that expr's types - should be fully inferred by infer_type. - mod : tvm.relay.Module - The global module. - - Returns - ------- - expanded_expr : tvm.relay.Expr - The expression after eta expansion. - """ - return _ir_pass.eta_expand(expr, mod) - -def forward_fold_scale_axis(expr): - """Fold the scaling of axis into weights of conv2d/dense. - - Parameters - ---------- - expr : tvm.relay.Expr - The input expression, we expect that expr's types - should be fully inferred by infer_type. - - Returns - ------- - folded_expr : tvm.relay.Expr - The folded expression after transformation. - - Note - ---- - It is recommended to call backward_fold_scale_axis - before using forward_fold_scale_axis. - As backward folding targets common conv-bn pattern. - """ - return _ir_pass.forward_fold_scale_axis(expr) - - -def well_formed(expr): - """Check that each Var is only bound once (well formed). 
- - Parameters - ---------- - expr : tvm.relay.Expr - The input expression - - Returns - ------- - well_form : bool - Whether the input expression is well formed - """ - return _ir_pass.well_formed(expr) - - -def check_kind(t, mod=None): - """Check that the type is well kinded and return the kind. - For example, this mean type cannot has tensor of tensor, or is a tuple type of 2 shapes. - - Parameters - ---------- - t : tvm.relay.Type - The type to check - - mod : Optional[tvm.relay.Module] - The global module. - - Returns - ------- - kind : Kind - the kind of t - - Examples - -------- - .. code:: python - - assert check_kind(relay.TupleType([relay.TypeParam('tp1', relay.Kind.Shape)])) == Shape - assert check_kind(relay.TupleType([relay.TypeParam('tp1', relay.Kind.Type)])) == Type - """ - if mod is not None: - return _ir_pass.check_kind(t, mod) - else: - return _ir_pass.check_kind(t) - - -def free_vars(expr): - """Get free Vars from expression expr in Post DFS order. - - Parameters - ---------- - expr : tvm.relay.Expr - The input expression - - Returns - ------- - free : List[tvm.relay.Var] - The list of free variables in post DFS order. - - Note - ---- - The fact that Vars are post-DFS ordred are useful in - neural networks: usually this means weights of previous - are ordered first. - """ - return _ir_pass.free_vars(expr) - - -def bound_vars(expr): - """Get bound vars from expression expr in post-DFS order. - - Parameters - ---------- - expr : tvm.relay.Expr - The input expression - - Returns - ------- - free : List[tvm.relay.Var] - The list of bound variables in post-DFS order. - """ - return _ir_pass.bound_vars(expr) - - -def all_vars(expr): - """Get all vars from expression expr in post-DFS order. - - Parameters - ---------- - expr : tvm.relay.Expr - The input expression - - Returns - ------- - free : List[tvm.relay.Var] - The list of all variables in post-DFS order. - """ - return _ir_pass.all_vars(expr) - - -def free_type_vars(expr, mod=None): - """Get free type variables from expression/type e - - Parameters - ---------- - expr : Union[tvm.relay.Expr,tvm.relay.Type] - The input expression/type - - mod : Optional[tvm.relay.Module] - The global module - - Returns - ------- - free : List[tvm.relay.TypeVar] - The list of free type variables in post-DFS order - """ - use_mod = mod if mod is not None else Module() - return _ir_pass.free_type_vars(expr, use_mod) - - -def bound_type_vars(expr, mod=None): - """Get bound type variables from expression/type e - - Parameters - ---------- - expr : Union[tvm.relay.Expr,tvm.relay.Type] - The input expression/type - - mod : Optional[tvm.relay.Module] - The global module - - Returns - ------- - free : List[tvm.relay.TypeVar] - The list of bound type variables in post-DFS order - """ - use_mod = mod if mod is not None else Module() - return _ir_pass.bound_type_vars(expr, use_mod) - - -def all_type_vars(expr, mod=None): - """Get all type variables from expression/type e - - Parameters - ---------- - expr : Union[tvm.relay.Expr,tvm.relay.Type] - The input expression/type - mod : Optional[tvm.relay.Module] - The global module - - Returns - ------- - free : List[tvm.relay.TypeVar] - The list of all type variables in post-DFS order - """ - use_mod = mod if mod is not None else Module() - return _ir_pass.all_type_vars(expr, use_mod) - - -def simplify_inference(expr): - """ Simplify the data-flow graph for inference phase. 
- - Parameters - ---------- - expr : tvm.relay.Expr - The input Expression - - Returns - ------- - result : tvm.relay.Expr - An expression which is semantically equal to the input expression, - but with some simplification - """ - return _ir_pass.simplify_inference(expr) - - -def canonicalize_ops(expr): - """ Canonicalize special operators to basic operators. - This can simplify latter analysis. (e.g. Expand bias_add to expand_dims and broadcast_add.) - - Parameters - ---------- - expr : tvm.relay.Expr - The input Expression - - Returns - ------- - result : tvm.relay.Expr - An expression without bias_add - """ - return _ir_pass.canonicalize_ops(expr) - - -def dead_code_elimination(expr, inline_once=False): - """ Remove expressions which does not effect the program result (dead code). - - Parameters - ---------- - expr : tvm.relay.Expr - The input Expression - - inline_once : Optional[Bool] - Whether to inline binding that occur only once. - Returns - ------- - result : tvm.relay.Expr - An expression which is semantically equal to the input expression, - but with dead code removed. - """ - return _ir_pass.dead_code_elimination(expr, inline_once) - - -def alpha_equal(lhs, rhs): - """Compare two Relay expr for structural equivalence (alpha equivalence). - - Parameters - ---------- - lhs : tvm.relay.Expr - One of the input Expression. - - rhs : tvm.relay.Expr - One of the input Expression. - - Returns - ------- - result : bool - True iff lhs is alpha equal to rhs. - """ - return bool(_make._alpha_equal(lhs, rhs)) - - -def graph_equal(lhs, rhs): - """Compare two Relay expr for data-flow equivalence. - The difference between this and alpha-equality is that - variables are not expected to match between lhs and rhs; - they are treated as sources and are mapped between each other. - - Parameters - ---------- - lhs : tvm.relay.Expr - One of the input Expression. - - rhs : tvm.relay.Expr - One of the input Expression. - - Returns - ------- - result : bool - True iff lhs is data-flow equivalent to rhs. - """ - return bool(_make._graph_equal(lhs, rhs)) - - -def structural_hash(value): - """Hash a Relay expression structurally. - - Parameters - ---------- - expr : Union[tvm.relay.Expr, tvm.relay.Type] - The expression to hash. - - Returns - ------- - result : int - The hash value - """ - if isinstance(value, Expr): - return int(_ir_pass._expr_hash(value)) - elif isinstance(value, Type): - return int(_ir_pass._type_hash(value)) - else: - msg = ("found value of type {0} expected" + - "relay.Expr or relay.Type").format(type(value)) - raise TypeError(msg) - - -def fold_constant(expr): - """Fold the constant expression in expr. - - Parameters - ---------- - expr : tvm.relay.Expr - The input expression. - - Returns - ------- - transformed_expr : tvm.relay.Expr - The transformed expression. - """ - return _ir_pass.FoldConstant(expr) - - -def fuse_ops(expr, opt_level=1, mod=None): - """Fuse operators in expr together. - - Parameters - ---------- - expr : tvm.relay.Expr - The input expression. - - opt_level : int - The level of fuse optimization. - - mod : tvm.relay.Module - The module to perform fusion over. - - Returns - ------- - transformed_expr : tvm.relay.Expr - Transformed expression, containing fused result. - """ - return _ir_pass.FuseOps(expr, opt_level, mod) - - -def combine_parallel_conv2d(expr, min_num_branches=3): - """Combine multiple conv2d into one. - - Parameters - ---------- - expr : tvm.relay.Expr - The input expression. 
- - min_num_branches : int - The minimum number of parallel branches when the transformation should be applied. - - Returns - ------- - transformed_expr : tvm.relay.Expr - Transformed expression - """ - return _ir_pass.CombineParallelConv2D(expr, min_num_branches) - - -def alter_op_layout(expr): - """Alternate the layouts of operators or replace primitive operators with - other expressions. - This pass can be used for computing convolution in custom layouts or - other general weight pre-transformation. - - Parameters - ---------- - expr : tvm.relay.Expr - The input expression. - - Returns - ------- - transformed_expr : tvm.relay.Expr - Transformed expression with alternated layout. - """ - return _ir_pass.AlterOpLayout(expr) - - -def rewrite_annotated_ops(expr, fallback_device): - """Rewrite the annotated program where annotation operators, e.g. - `on_deivce`, mark which device an expression should be scheduled to. - This pass helps heterogeneous execution where different operators may need - to be allocated on various devices. - - Parameters - ---------- - expr : tvm.relay.Expr - The input expression. - - fallback_device : int - The fallback device type. It is also used as the default device for - operators with no annotated device. - - Returns - ------- - transformed_expr : tvm.relay.Expr - Transformed expression with cross device data copy operators. - """ - return _ir_pass.RewriteDeviceAnnotation(expr, fallback_device) - - -def collect_device_info(expr): - """Collect the device allocation map for the given expression. The device - ids are propagated from the `device_copy` operators. - - Parameters - ---------- - expr : tvm.relay.Expr - The input expression. - - Returns - ------- - ret : Dict[tvm.relay.expr, int] - A dictionary mapping tvm.relay.Expr to device type. - """ - return _ir_pass.CollectDeviceInfo(expr) - - -def collect_device_annotation_ops(expr): - """Collect the device annotation ops for the given expression. - - Parameters - ---------- - expr : tvm.relay.Expr - The input expression. - - Returns - ------- - ret : Dict[tvm.relay.expr, int] - A dictionary mapping tvm.relay.Expr to device type where the keys are - annotation expressions. - """ - return _ir_pass.CollectDeviceAnnotationOps(expr) - - -def to_a_normal_form(expr, mod=None): - """ - Turn Graph Normal Form expression into A Normal Form Expression. - - The scope of the root expression is the global scope. - - The scope of any non root expression is the least common ancestor of all it's scope. - - Values are ordered by post-DFS order in each scope. - - Parameters - ---------- - expr : tvm.relay.Expr - The input expression. - - mod : Optional[tvm.relay.Module] - The global module. - - Returns - ------- - result : tvm.relay.Expr - The output expression. - """ - return _ir_pass.to_a_normal_form(expr, mod) - - -def to_graph_normal_form(expr): - """Turn A Normal Form expression into Graph Normal Form expression - Parameters - ---------- - expr : tvm.relay.Expr - The input expression - Returns - ------- - result : tvm.relay.Expr - The output expression - """ - return _ir_pass.to_graph_normal_form(expr) - - -def gradient(expr, mod=None, mode='higher_order'): - """ - Transform the input function, - returning a function that calculate the original result, - paired with gradient of the input. - - Parameters - ---------- - expr : tvm.relay.Expr - The input expression, which is a Function or a GlobalVar. - - mod : Optional[tvm.relay.Module] - - mode : Optional[String] - The mode of the automatic differentiation algorithm. 
- 'first_order' only work on first order code, but will not produce reference nor closure. - 'higher_order' work on all code using reference and closure. - - Returns - ------- - expr : tvm.relay.Expr - The transformed expression. - """ - if mode == 'first_order': - return _ir_pass.first_order_gradient(expr, mod) - elif mode == 'higher_order': - return _ir_pass.gradient(expr, mod) - else: - raise Exception('unknown mode') - - -def get_total_mac_number(expr): - """ - Count the number of MACs (multiply-accumulate) of a model - - Parameters - ---------- - expr : tvm.relay.Expr - The input expression. - - Returns - ------- - result : int64 - The number of MACs (multiply-accumulate) of a model - """ - return _ir_pass.GetTotalMacNumber(expr) - - -def eliminate_common_subexpr(expr, fskip=None): - """ - Eliminate common subexpressions. - - Parameters - ---------- - expr : tvm.relay.Expr - The input expression. - - fskip : function - The callback function that decides whether an expression should be skipped. - - Returns - ------- - result : tvm.relay.Expr - The output expression. - """ - return _ir_pass.eliminate_common_subexpr(expr, fskip) - - -def partial_evaluate(expr, mod=None): - """ - Evaluate the static fragment of the code. - - Parameters - ---------- - expr : tvm.relay.Expr - The input expression. - - mod : Optional[tvm.relay.Module] - The global module - - Returns - ------- - result : tvm.relay.Expr - The output expression. - """ - return _ir_pass.partial_evaluate(expr, mod) - - -def unmatched_cases(match, mod=None): - """ - Finds cases that the match expression does not catch, if any. - - Parameters - ---------- - match : tvm.relay.Match - The match expression - mod : Optional[tvm.relay.Module] - The module (defaults to an empty module) - - Returns - ------- - missing_patterns : [tvm.relay.Pattern] - Patterns that the match expression does not catch. - """ - return _ir_pass.unmatched_cases(match, mod) - - -def detect_feature(a, b=None): - """ - Detect the feature used in a relay program. - - Parameters - ---------- - a : Union[tvm.relay.Expr, tvm.relay.Module] - The input expression or module. - - b : Optional[Union[tvm.relay.Expr, tvm.relay.Module]] - The input expression or module. - The two arguments cannot both be expression or module. - - Returns - ------- - features : Set[Feature] - Features used in the program. - """ - if isinstance(a, Module): - a, b = b, a - return set([Feature(int(x)) for x in _ir_pass.detect_feature(a, b)]) diff --git a/python/tvm/relay/module.py b/python/tvm/relay/module.py index 138dfa8822154..8ac15f743fc4f 100644 --- a/python/tvm/relay/module.py +++ b/python/tvm/relay/module.py @@ -33,7 +33,7 @@ class Module(RelayNode): Parameters ---------- - functions : dict, optional. + functions: Optional[dict]. Map of global var to Function """ def __init__(self, functions=None, type_definitions=None): @@ -78,17 +78,11 @@ def __setitem__(self, var, val): def _add(self, var, val, update=False): if isinstance(val, _expr.Expr): if isinstance(var, _base.string_types): - var = _expr.GlobalVar(var) - - # TODO(@jroesch): Port this logic to C++. 
- if not isinstance(val, _expr.Function): - if isinstance(val, _expr.GlobalVar): - val = ir_pass.eta_expand(val, self) + if _module.Module_ContainGlobalVar(self, var): + var = _module.Module_GetGlobalVar(self, var) else: - val = _expr.Function([], val) - - - _make.Module_Add(self, var, val, update) + var = _expr.GlobalVar(var) + _module.Module_Add(self, var, val, update) else: assert isinstance(val, _ty.Type) if isinstance(var, _base.string_types): @@ -100,7 +94,7 @@ def __getitem__(self, var): Parameters ---------- - var: str or GlobalVar + var: Union[String, GlobalVar, GlobalTypeVar] The name or global variable. Returns @@ -165,6 +159,25 @@ def get_global_type_var(self, name): """ return _module.Module_GetGlobalTypeVar(self, name) + def get_constructor(self, tag): + """Look up an ADT constructor by tag. + + Parameters + ---------- + tag: int + The tag for a constructor. + + Returns + ------- + constructor: Constructor + The constructor associated with the given tag, + + Raises + ------ + tvm.TVMError if the corresponding constructor cannot be found. + """ + return _module.Module_LookupTag(self, tag) + @staticmethod def from_expr(expr): return _module.Module_FromExpr(expr) diff --git a/python/tvm/relay/op/nn/nn.py b/python/tvm/relay/op/nn/nn.py index 7bce9dd3c5b99..1de86173040d0 100644 --- a/python/tvm/relay/op/nn/nn.py +++ b/python/tvm/relay/op/nn/nn.py @@ -137,6 +137,12 @@ def conv2d_transpose(data, dilation : Tuple[int], optional Specifies the dilation rate to be used for dilated convolution. + channels : int, optional + Number of output channels of this convolution. + + kernel_size : tuple of int, optional + The spatial of the convolution kernel. + groups : int, optional Number of groups for grouped convolution. diff --git a/python/tvm/relay/quantize/quantize.py b/python/tvm/relay/quantize/quantize.py index fa70e19544677..beebceaf8590c 100644 --- a/python/tvm/relay/quantize/quantize.py +++ b/python/tvm/relay/quantize/quantize.py @@ -22,7 +22,7 @@ from . import _quantize from .. import expr as _expr from .. import module as _module -from .. import ir_pass as _ir_pass +from .. import analysis as _analysis from .. import transform as _transform from .. import op as _op from ... import make as _make @@ -250,7 +250,7 @@ def _make_const(val): const_params[nclip_min] = _make_const(- (valid_range - 1)) const_params[nclip_max] = _make_const((valid_range - 1)) - _ir_pass.post_order_visit(graph, visit_func) + _analysis.post_order_visit(graph, visit_func) return _expr.bind(graph, const_params) @@ -365,4 +365,4 @@ def quantize(graph, params=None, dataset=None): mod = optimize(mod) mod = quantize_seq(mod) - return mod[mod.entry_func.name_hint] + return mod["main"] diff --git a/python/tvm/relay/testing/__init__.py b/python/tvm/relay/testing/__init__.py index 7a5007bbfb8f2..de9e55b369d19 100644 --- a/python/tvm/relay/testing/__init__.py +++ b/python/tvm/relay/testing/__init__.py @@ -17,6 +17,9 @@ """Utilities for testing and benchmarks""" from __future__ import absolute_import as _abs +import tvm.relay as relay +from tvm.relay import transform + from . import mlp from . import resnet from . 
import dqn @@ -32,3 +35,15 @@ from .config import ctx_list from .init import create_workload from .nat import add_nat_definitions, count, make_nat_value, make_nat_expr + + +def run_opt_pass(expr, opt_pass): + assert isinstance(opt_pass, transform.Pass) + mod = relay.Module.from_expr(expr) + mod = opt_pass(mod) + entry = mod["main"] + return entry if isinstance(expr, relay.Function) else entry.body + + +def run_infer_type(expr): + return run_opt_pass(expr, transform.InferType()) diff --git a/python/tvm/relay/testing/dcgan.py b/python/tvm/relay/testing/dcgan.py index 4ee0bd13a5a7e..c6b258badb5b6 100644 --- a/python/tvm/relay/testing/dcgan.py +++ b/python/tvm/relay/testing/dcgan.py @@ -81,7 +81,7 @@ def get_net(batch_size, random_len=100, oshape=(3, 64, 64), ngf=128, code=None, dc32, ishape=(ngf, 32, 32), oshape=oshape[-3:], kshape=(4, 4), name="g5_deconv") tanh = relay.tanh(dc64) - args = relay.ir_pass.free_vars(tanh) + args = relay.analysis.free_vars(tanh) return relay.Function(args, tanh) @@ -103,8 +103,8 @@ def get_workload(batch_size, oshape=(3, 64, 64), ngf=128, random_len=100, dtype= Returns ------- - net : nnvm.symbol - The computational graph + mod : tvm.relay.Module + The relay module that contains a DCGAN network. params : dict of str to NDArray The parameters. """ diff --git a/python/tvm/relay/testing/densenet.py b/python/tvm/relay/testing/densenet.py index de3ebe36eb7bd..f9b479153bfad 100644 --- a/python/tvm/relay/testing/densenet.py +++ b/python/tvm/relay/testing/densenet.py @@ -79,7 +79,7 @@ def _make_dense_net(num_init_features, growth_rate, block_config, ret = layers.dense_add_bias(flat, units=classes, name='dense') - return relay.Function(relay.ir_pass.free_vars(ret), ret) + return relay.Function(relay.analysis.free_vars(ret), ret) def get_workload(densenet_size=121, classes=1000, batch_size=4, image_shape=(3, 224, 224), dtype='float32'): @@ -105,8 +105,8 @@ def get_workload(densenet_size=121, classes=1000, batch_size=4, Returns ------- - net: relay.Function - The computation graph representing densenet. + mod: tvm.relay.Module + The relay module that contains a DenseNet network. params : dict of str to NDArray The benchmark paraeters. diff --git a/python/tvm/relay/testing/dqn.py b/python/tvm/relay/testing/dqn.py index 034ac0a6c2e5f..cdf9d24af996a 100644 --- a/python/tvm/relay/testing/dqn.py +++ b/python/tvm/relay/testing/dqn.py @@ -54,7 +54,7 @@ def get_net(batch_size, num_actions=18, image_shape=(4, 84, 84), dtype="float32" relu4 = relay.nn.relu(dense1) dense2 = layers.dense_add_bias(relu4, units=num_actions, name="dense2") - args = relay.ir_pass.free_vars(dense2) + args = relay.analysis.free_vars(dense2) return relay.Function(args, dense2) @@ -72,8 +72,8 @@ def get_workload(batch_size, num_actions=18, image_shape=(4, 84, 84), dtype="flo The data type Returns ------- - net : nnvm.symbol - The computational graph + mod : tvm.relay.Module + The relay module that contains a DQN network. params : dict of str to NDArray The parameters. 
""" diff --git a/python/tvm/relay/testing/inception_v3.py b/python/tvm/relay/testing/inception_v3.py index c9ec3293ed0a1..4da543257c318 100644 --- a/python/tvm/relay/testing/inception_v3.py +++ b/python/tvm/relay/testing/inception_v3.py @@ -266,7 +266,7 @@ def get_net(batch_size, fc1 = relay.nn.dense(flatten, relay.var("fc1_weight"), units=num_classes) fc1 = relay.nn.bias_add(fc1, relay.var("fc2_bias"), axis=-1) inception_v3 = relay.nn.softmax(data=fc1) - args = relay.ir_pass.free_vars(inception_v3) + args = relay.analysis.free_vars(inception_v3) return relay.Function(args, inception_v3) def get_workload(batch_size=1, num_classes=1000, @@ -289,8 +289,8 @@ def get_workload(batch_size=1, num_classes=1000, Returns ------- - net : nnvm.Symbol - The computational graph + mod : tvm.relay.Module + The relay module that contains an Inception V3 network. params : dict of str to NDArray The parameters. diff --git a/python/tvm/relay/testing/init.py b/python/tvm/relay/testing/init.py index b246b46172766..0b8ab2b42029b 100644 --- a/python/tvm/relay/testing/init.py +++ b/python/tvm/relay/testing/init.py @@ -144,16 +144,16 @@ def create_workload(net, initializer=None, seed=0): Returns ------- - net : tvm.relay.Function - The updated dataflow + mod : tvm.relay.Module + The created relay module. params : dict of str to NDArray The parameters. """ - net = relay.ir_pass.infer_type(net) + mod = relay.Module.from_expr(net) + mod = relay.transform.InferType()(mod) shape_dict = { - v.name_hint : v.checked_type for v in net.params} - net.astext() + v.name_hint : v.checked_type for v in mod["main"].params} np.random.seed(seed) initializer = initializer if initializer else Xavier() params = {} @@ -163,4 +163,4 @@ def create_workload(net, initializer=None, seed=0): init_value = np.zeros(v.concrete_shape).astype(v.dtype) initializer(k, init_value) params[k] = tvm.nd.array(init_value, ctx=tvm.cpu(0)) - return net, params + return mod, params diff --git a/python/tvm/relay/testing/lstm.py b/python/tvm/relay/testing/lstm.py index b0915e033ccbf..d0134c1a864d6 100644 --- a/python/tvm/relay/testing/lstm.py +++ b/python/tvm/relay/testing/lstm.py @@ -154,7 +154,7 @@ def get_net(iterations, num_hidden, batch_size=1, dtype="float32"): builder.ret(out) body = builder.get() - args = relay.ir_pass.free_vars(body) + args = relay.analysis.free_vars(body) return relay.Function(args, body, input_type) @@ -173,8 +173,8 @@ def get_workload(iterations, num_hidden, batch_size=1, dtype="float32"): The data type Returns ------- - net : nnvm.symbol - The computational graph + mod : tvm.relay.Module + The relay module that contains a LSTM network. params : dict of str to NDArray The parameters. """ diff --git a/python/tvm/relay/testing/mlp.py b/python/tvm/relay/testing/mlp.py index 562ef21ba9f1c..337bde5d5889e 100644 --- a/python/tvm/relay/testing/mlp.py +++ b/python/tvm/relay/testing/mlp.py @@ -58,7 +58,7 @@ def get_net(batch_size, fc3 = relay.nn.dense(act2, relay.var("fc3_weight"), units=num_classes) fc3 = relay.nn.bias_add(fc3, relay.var("fc3_bias"), axis=-1) mlp = relay.nn.softmax(data=fc3) - args = relay.ir_pass.free_vars(mlp) + args = relay.analysis.free_vars(mlp) return relay.Function(args, mlp) @@ -84,8 +84,8 @@ def get_workload(batch_size, Returns ------- - net : relay.Function - The dataflow. + mod : tvm.relay.Module + The relay module that contains a mlp network. params : dict of str to NDArray The parameters. 
diff --git a/python/tvm/relay/testing/mobilenet.py b/python/tvm/relay/testing/mobilenet.py index 78e1d82456c84..3b068c05a24ed 100644 --- a/python/tvm/relay/testing/mobilenet.py +++ b/python/tvm/relay/testing/mobilenet.py @@ -108,7 +108,7 @@ def mobile_net(num_classes=1000, data_shape=(1, 3, 224, 224), weight = relay.var('fc_weight') fc = relay.nn.dense(data=flatten, weight=weight, units=num_classes) softmax = relay.nn.softmax(data=fc) - return relay.Function(relay.ir_pass.free_vars(softmax), softmax) + return relay.Function(relay.analysis.free_vars(softmax), softmax) def get_workload(batch_size=1, num_classes=1000, image_shape=(3, 224, 224), dtype='float32'): @@ -130,8 +130,8 @@ def get_workload(batch_size=1, num_classes=1000, image_shape=(3, 224, 224), dtyp Returns ------- - net : relay.Function - The computational graph + mod : tvm.relay.Module + The relay module that contains a MobileNet network. params : dict of str to NDArray The parameters. diff --git a/python/tvm/relay/testing/resnet.py b/python/tvm/relay/testing/resnet.py index 9ba57ae09ef5b..a8e369b740219 100644 --- a/python/tvm/relay/testing/resnet.py +++ b/python/tvm/relay/testing/resnet.py @@ -169,7 +169,7 @@ def resnet(units, flat = relay.nn.batch_flatten(data=pool1) fc1 = layers.dense_add_bias(data=flat, units=num_classes, name='fc1') net = relay.nn.softmax(data=fc1) - return relay.Function(relay.ir_pass.free_vars(net), net) + return relay.Function(relay.analysis.free_vars(net), net) def get_net(batch_size, @@ -261,8 +261,8 @@ def get_workload(batch_size=1, Returns ------- - net : relay.Function - The computational graph + mod : tvm.relay.Module + The relay module that contains a ResNet network. params : dict of str to NDArray The parameters. diff --git a/python/tvm/relay/testing/squeezenet.py b/python/tvm/relay/testing/squeezenet.py index c7b8e8db166b6..1e9ea73e9360e 100644 --- a/python/tvm/relay/testing/squeezenet.py +++ b/python/tvm/relay/testing/squeezenet.py @@ -119,7 +119,7 @@ def get_net(batch_size, image_shape, num_classes, version, dtype): net = relay.nn.global_avg_pool2d(net) net = relay.nn.batch_flatten(net) net = relay.nn.softmax(net) - args = relay.ir_pass.free_vars(net) + args = relay.analysis.free_vars(net) return relay.Function(args, net) @@ -149,8 +149,8 @@ def get_workload(batch_size=1, Returns ------- - net : nnvm.Symbol - The computational graph + mod : tvm.relay.Module + The relay module that contains a SqueezeNet network. params : dict of str to NDArray The parameters. diff --git a/python/tvm/relay/testing/vgg.py b/python/tvm/relay/testing/vgg.py index bec141f70ffd0..205c5b1fa8e39 100644 --- a/python/tvm/relay/testing/vgg.py +++ b/python/tvm/relay/testing/vgg.py @@ -90,7 +90,7 @@ def get_net(batch_size, image_shape, num_classes, dtype, num_layers=11, batch_no feature = get_feature(data, layers, filters, batch_norm) classifier = get_classifier(feature, num_classes) symbol = relay.nn.softmax(data=classifier) - args = relay.ir_pass.free_vars(symbol) + args = relay.analysis.free_vars(symbol) return relay.Function(args, symbol) @@ -124,8 +124,8 @@ def get_workload(batch_size, Returns ------- - net : nnvm.Symbol - The computational graph + mod : tvm.relay.Module + The relay module that contains a VGG network. params : dict of str to NDArray The parameters. 
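With the changes above, every `relay.testing.*.get_workload` now returns a `(module, params)` pair rather than a bare function or symbol. A hedged usage sketch follows, assuming this revision of TVM; the chosen network, depth, and shapes are just examples.

```python
from tvm import relay
from tvm.relay import testing

# get_workload now returns a tvm.relay.Module plus randomly initialized params.
mod, params = testing.resnet.get_workload(
    num_layers=18, batch_size=1, image_shape=(3, 224, 224))

# The network itself is the module's "main" function.
main_fn = mod["main"]
print(len(main_fn.params), "free variables (data + weights)")

# mod and params are then handed to the Relay build pipeline in place of the
# old standalone Function.
```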
diff --git a/python/tvm/relay/transform.py b/python/tvm/relay/transform.py index 5f47e5b446aa7..2805e0b429fa0 100644 --- a/python/tvm/relay/transform.py +++ b/python/tvm/relay/transform.py @@ -277,6 +277,40 @@ def FoldScaleAxis(): return _transform.FoldScaleAxis() +def BackwardFoldScaleAxis(): + """Backward fold axis scaling into weights of conv2d/dense. + + Returns + ------- + ret : tvm.relay.Pass + The registered pass to backward fold expressions. + + Note + ---- + It is recommended to call backward_fold_scale_axis + before using forward_fold_scale_axis. + As backward folding targets common conv-bn pattern. + """ + return _transform.BackwardFoldScaleAxis() + + +def ForwardFoldScaleAxis(): + """Fold the scaling of axis into weights of conv2d/dense. + + Returns + ------- + ret : tvm.relay.Pass + The registered pass to forward fold expressions. + + Note + ---- + It is recommended to call backward_fold_scale_axis + before using forward_fold_scale_axis. + As backward folding targets common conv-bn pattern. + """ + return _transform.ForwardFoldScaleAxis() + + def SimplifyInference(): """Simplify the data-flow graph for inference phase. An simplified expression which is semantically equal to the input expression will be returned. @@ -302,15 +336,20 @@ def CanonicalizeOps(): return _transform.CanonicalizeOps() -def DeadCodeElimination(): - """ Remove expressions which does not effect the program result (dead code). +def DeadCodeElimination(inline_once=False): + """Remove expressions which does not effect the program result (dead code). + + Parameters + ---------- + inline_once: Optional[Bool] + Whether to inline binding that occurs only once. Returns ------- ret: tvm.relay.Pass The registered pass that eliminates the dead code in a Relay program. """ - return _transform.DeadCodeElimination() + return _transform.DeadCodeElimination(inline_once) def FoldConstant(): @@ -401,11 +440,26 @@ def ToANormalForm(): Returns ------- - ret: tvm.relay.Pass + ret: Union[tvm.relay.Pass, tvm.relay.Expr] The registered pass that transforms an expression into A Normal Form. """ return _transform.ToANormalForm() + +def ToCPS(expr, mod=None): + """ + Turn expression into continuation passing style(CPS). + + Every intermediate compute will be passed to a continuation. + + Returns + ------- + result: tvm.relay.Pass + The registered pass that transforms an expression into CPS. + """ + return _transform.to_cps(expr, mod) + + def EtaExpand(): """Add abstraction over a function @@ -416,6 +470,7 @@ def EtaExpand(): """ return _transform.EtaExpand() + def ToGraphNormalForm(): """Turn A Normal Form expression into Graph Normal Form expression @@ -447,13 +502,21 @@ def EliminateCommonSubexpr(fskip=None): def PartialEvaluate(): """Evaluate the static fragment of the code. + Note + ---- + This transformation could be either `Module -> Module` or `Expr -> Expr`. + It will directly transform the input expression to a new one if the target + expression is provided. Otherwise, it will rely on the pass manager to + carry out transformation. + Returns ------- - ret : tvm.relay.Pass + ret: tvm.relay.Pass The registered pass that performs partial evaluation on an expression. """ return _transform.PartialEvaluate() + def CanonicalizeCast(): """ Canonicalize cast expressions to make operator fusion more efficient. 
@@ -465,6 +528,80 @@ def CanonicalizeCast(): """ return _transform.CanonicalizeCast() + +def gradient(expr, mod=None, mode='higher_order'): + """ + Transform the input function, + returning a function that calculate the original result, + paired with gradient of the input. + + Parameters + ---------- + expr : tvm.relay.Expr + The input expression, which is a Function or a GlobalVar. + + mod : Optional[tvm.relay.Module] + + mode : Optional[String] + The mode of the automatic differentiation algorithm. + 'first_order' only works on first order code, but will not produce + reference nor closure. + 'higher_order' works on all code using reference and closure. + + Returns + ------- + expr : tvm.relay.Expr + The transformed expression. + """ + if mode == 'first_order': + return _transform.first_order_gradient(expr, mod) + if mode == 'higher_order': + return _transform.gradient(expr, mod) + raise Exception('unknown mode') + + +def to_cps(func, mod=None): + """ + Turn expression into CPS expression. + + Every intermediate compute will be passed to a continuation. + + Parameters + ---------- + func: tvm.relay.Function + The input function. + + mod: Optional[tvm.relay.Module] + The global module. + + Returns + ------- + result: tvm.relay.Function + The output function. + """ + return _transform.to_cps(func, mod) + + +def un_cps(func): + """ + Turn an cps function into a Function without the continuation argument. + + Note that this will not give the exact same interface as before cps: + If the input/output is higher order, they will still be in cps form. + + Parameters + ---------- + func: tvm.relay.Function + The input function + + Returns + ------- + result: tvm.relay.Function + The output function + """ + return _transform.un_cps(func) + + def _wrap_class_module_pass(pass_cls, pass_info): """Wrap a python class as function pass""" class PyModulePass(ModulePass): diff --git a/src/api/api_lang.cc b/src/api/api_lang.cc index 42d60b85e375f..00ac715e8c075 100644 --- a/src/api/api_lang.cc +++ b/src/api/api_lang.cc @@ -207,7 +207,13 @@ TVM_REGISTER_API("Range") }); TVM_REGISTER_API("_Buffer") -.set_body_typed(BufferNode::make); +.set_body([](TVMArgs args, TVMRetValue* ret) { + CHECK_EQ(args.size(), 10); + auto buffer_type = args[9].operator std::string(); + BufferType type = (buffer_type == "auto_broadcast") ? 
kAutoBroadcast : kDefault; + *ret = BufferNode::make(args[0], args[1], args[2], args[3], args[4], + args[5], args[6], args[7], args[8], type); + }); TVM_REGISTER_API("_BufferAccessPtr") .set_body_method(&Buffer::access_ptr); diff --git a/src/arithmetic/analyzer.cc b/src/arithmetic/analyzer.cc index 2198aee934787..626fc18c57df9 100644 --- a/src/arithmetic/analyzer.cc +++ b/src/arithmetic/analyzer.cc @@ -106,6 +106,7 @@ bool Analyzer::CanProve(const Expr& expr) { Expr Analyzer::Simplify(const Expr& expr) { if (is_const(expr)) return expr; auto res = this->rewrite_simplify(expr); + if (is_const(res)) return res; res = this->canonical_simplify(res); return res; } diff --git a/src/arithmetic/bound_deducer.cc b/src/arithmetic/bound_deducer.cc index 395a371f43af7..003ba8def7612 100644 --- a/src/arithmetic/bound_deducer.cc +++ b/src/arithmetic/bound_deducer.cc @@ -84,11 +84,11 @@ class BoundDeducer: public IRVisitor { void Deduce(); void Visit(const NodeRef& e) final { - if (!success) return; + if (!success_) return; if (e.get() == path_[iter_++]) { IRVisitor::Visit(e); } else { - success = false; + success_ = false; return; } } @@ -111,18 +111,18 @@ class BoundDeducer: public IRVisitor { void Visit_(const Add* op) final { bool left = op->a.get() == path_[iter_]; - result -= left ? op->b : op->a; + result_ -= left ? op->b : op->a; Visit(left ? op->a : op->b); } void Visit_(const Sub* op) final { bool left = op->a.get() == path_[iter_]; if (left) { - result += op->b; + result_ += op->b; } else { - result -= op->a; - result = - result; - is_greater = !is_greater; + result_ -= op->a; + result_ = - result_; + is_greater_ = !is_greater_; } Visit(left ? op->a : op->b); } @@ -130,43 +130,65 @@ class BoundDeducer: public IRVisitor { void Visit_(const Mul* op) final { bool left = op->a.get() == path_[iter_]; Expr operand = left ? op->b : op->a; + Expr target_var = left ? op->a : op->b; - SignType sign; + SignType sign_operand; if (operand.type().is_uint()) { - sign = kPositive; + sign_operand = kPositive; } else { - sign = expr_map_[operand].sign_type(); + sign_operand = expr_map_[operand].sign_type(); } - if (sign == SignType::kNegative) { - is_greater = !is_greater; - } else if (sign == SignType::kUnknown) { + if (sign_operand == SignType::kNegative) { + is_greater_ = !is_greater_; + } else if (sign_operand == SignType::kUnknown) { // unable to get the sign of operand - success = false; + success_ = false; return; } - // always use relax bound - bool divided = can_prove(result % operand == 0); - result = result / operand; - // since system will round down when not divided - // eg. 2/4 -> 0; -2/4 -> -1 - // no need fix for !is_greater: - // eg. a <= 2/4 -> a <= 0 - // eg. a <= 0/4 -> a <= 0 - // so just fix for not divided and is_greater - // eg. a >= 2/4 -> a >= 0 + 1 - // eg. a >= 0/4 -> a >= 0 - if (is_greater && !divided) { - result += 1; + bool divided = analyzer_.CanProve(result_ % operand == 0); + + result_ = result_ / operand; + + if (!divided) { + // Handle non-divisible case + // NOTE: this accounts for truc div behavior. + bool target_is_non_neg = expr_map_[target_var].can_prove_non_negative(); + + if (is_greater_) { + result_ += 1; + } else { + // NOTE: this is a bit sutble hack. + // + // condition: + // - x * operand <= result + // - operand > 0 + // - x >= 0 + // + // Then it is fine to deduce that x <= result / operand. 
+ // - if result > 0, this division round down + // - if result < 0, (result / operand) rounds up and may violate the constraint + // however, given that x is always non-negative, + // it is fine to have this relaxed bound, given that the user of deduce bound + // will respect the bound of x + // + // TODO(tvm-team): think about a better API to incorporate constraint of x. + // e.g. specify an interval of x and return a bound + // that is in the interval and satisfies the condition. + if (target_is_non_neg && sign_operand == kPositive) { + // do nothing + } else { + result_ -= 1; + } + } } - Visit(left ? op->a : op->b); } - Expr result; - bool is_greater{true}; - bool success{true}; + Expr result_; + bool is_greater_{true}; + bool success_{true}; private: void Init(); @@ -180,6 +202,8 @@ class BoundDeducer: public IRVisitor { ExprIntSetMap expr_map_; std::vector path_; size_t iter_{0}; + // internal analzyer + Analyzer analyzer_; }; class BoundDeduceInputChecker: public IRVisitor { @@ -202,7 +226,7 @@ class BoundDeduceInputChecker: public IRVisitor { void BoundDeducer::Init() { BoundDeduceInputChecker checker; - if (!checker.Check(this)) success = false; + if (!checker.Check(this)) success_ = false; Transform(); } @@ -211,66 +235,65 @@ void BoundDeducer::Transform() { if (const LT* op = expr_.as()) { if (GetPath(target_, op->a).empty()) { // a < b -> b >= a + 1 - is_greater = true; + is_greater_ = true; expr_ = op->b; - result = op->a + 1; + result_ = op->a + 1; } else { // a < b -> a <= b - 1 - is_greater = false; + is_greater_ = false; expr_ = op->a; - result = op->b - 1; + result_ = op->b - 1; } } else if (const LE* op = expr_.as()) { if (GetPath(target_, op->a).empty()) { // a <= b -> b >= a - is_greater = true; + is_greater_ = true; expr_ = op->b; - result = op->a; + result_ = op->a; } else { - is_greater = false; + is_greater_ = false; expr_ = op->a; - result = op->b; + result_ = op->b; } } else if (const GT* op = expr_.as()) { if (GetPath(target_, op->a).empty()) { // a > b -> b <= a - 1 - is_greater = false; + is_greater_ = false; expr_ = op->b; - result = op->a - 1; + result_ = op->a - 1; } else { // a > b -> a >= b + 1 - is_greater = true; + is_greater_ = true; expr_ = op->a; - result = op->b + 1; + result_ = op->b + 1; } } else if (const GE* op = expr_.as()) { if (GetPath(target_, op->a).empty()) { // a >= b -> b <= a - is_greater = false; + is_greater_ = false; expr_ = op->b; - result = op->a; + result_ = op->a; } else { - is_greater = true; + is_greater_ = true; expr_ = op->a; - result = op->b; + result_ = op->b; } } else { - success = false; + success_ = false; } } void BoundDeducer::Deduce() { Init(); - if (!success) return; + if (!success_) return; Relax(); - if (!success) return; + if (!success_) return; // get the path path_ = GetPath(target_, expr_); if (!path_.size()) { - success = false; + success_ = false; return; } - expr_map_ = EvalSetForEachSubExpr(expr_, hint_map_); Visit(expr_); @@ -278,13 +301,13 @@ void BoundDeducer::Deduce() { void BoundDeducer::Relax() { IntSet a = EvalSet(expr_, relax_map_); - IntSet b = EvalSet(result, relax_map_); + IntSet b = EvalSet(result_, relax_map_); if (a.is_everything() || b.is_everything()) { - success = false; + success_ = false; return; } - expr_ = is_greater ? a.min() : a.max(); - result = is_greater ? b.max() : b.min(); + expr_ = is_greater_ ? a.min() : a.max(); + result_ = is_greater_ ? 
b.max() : b.min(); } IntSet DeduceBound(Expr v, Expr e, @@ -292,12 +315,12 @@ IntSet DeduceBound(Expr v, Expr e, const std::unordered_map& relax_map) { BoundDeducer d(v, e, hint_map, relax_map); d.Deduce(); - if (!d.success) return IntSet::nothing(); + if (!d.success_) return IntSet::nothing(); Expr min = neg_inf(), max = pos_inf(); - if (d.is_greater) { - min = d.result; + if (d.is_greater_) { + min = d.result_; } else { - max = d.result; + max = d.result_; } return IntSet::interval(min, max); } diff --git a/src/arithmetic/compute_expr.h b/src/arithmetic/compute_expr.h index cc54bff596be7..4fa5fe9bd06a9 100644 --- a/src/arithmetic/compute_expr.h +++ b/src/arithmetic/compute_expr.h @@ -18,10 +18,8 @@ */ /*! - * Copyright (c) 2017 by Contributors * \file compute_expr.h - * \brief Utility integer expression with quick eager simplification. - * This is weaker than Simplify but can be done Eagerly. + * \brief Utility to invoke certan compute operations. */ #ifndef TVM_ARITHMETIC_COMPUTE_EXPR_H_ #define TVM_ARITHMETIC_COMPUTE_EXPR_H_ @@ -41,7 +39,7 @@ namespace arith { * \return The result. */ template -inline Expr ComputeExpr(Expr lhs, Expr rhs) { +inline Expr Compute(Expr lhs, Expr rhs) { return OP::make(lhs, rhs); } @@ -79,37 +77,37 @@ inline bool GetConstInt(Expr e, int* out) { } template<> -inline Expr ComputeExpr(Expr a, Expr b) { +inline Expr Compute(Expr a, Expr b) { return a + b; } template<> -inline Expr ComputeExpr(Expr a, Expr b) { +inline Expr Compute(Expr a, Expr b) { return a - b; } template<> -inline Expr ComputeExpr(Expr a, Expr b) { +inline Expr Compute(Expr a, Expr b) { return a * b; } template<> -inline Expr ComputeExpr(Expr a, Expr b) { +inline Expr Compute(Expr a, Expr b) { return a / b; } template<> -inline Expr ComputeExpr(Expr a, Expr b) { +inline Expr Compute(Expr a, Expr b) { return a % b; } template<> -inline Expr ComputeExpr(Expr a, Expr b) { +inline Expr Compute(Expr a, Expr b) { return max(a, b); } template<> -inline Expr ComputeExpr(Expr a, Expr b) { +inline Expr Compute(Expr a, Expr b) { return min(a, b); } @@ -121,7 +119,7 @@ inline Expr ComputeReduce(const Array& values, Expr empty_value) { } Expr res = values[0]; for (size_t i = 1; i < values.size(); ++i) { - res = ComputeExpr(res, values[i]); + res = Compute(res, values[i]); } return res; } diff --git a/src/arithmetic/const_fold.h b/src/arithmetic/const_fold.h index ec50aef5c51ed..dc6b80a31c7bd 100644 --- a/src/arithmetic/const_fold.h +++ b/src/arithmetic/const_fold.h @@ -155,9 +155,10 @@ template<> inline Expr TryConstFold(Expr a, Expr b) { TVM_ARITH_CONST_PROPAGATION({ const Type& rtype = a.type(); - // due to division and mod can have different modes - // only constant fold positive number where rule is fixed. - if (pa && pb && pa->value >= 0 && pb->value > 0) { + if (pa && pb) { + // due to division and mod can have different modes + // NOTE: this will assumes truc div. 
+ CHECK_NE(pb->value, 0) << "Divide by zero"; return IntImm::make(rtype, pa->value / pb->value); } if (pa) { diff --git a/src/arithmetic/detect_linear_equation.cc b/src/arithmetic/detect_linear_equation.cc index e584c8b1ce332..3c5f12a7379e4 100644 --- a/src/arithmetic/detect_linear_equation.cc +++ b/src/arithmetic/detect_linear_equation.cc @@ -27,7 +27,6 @@ #include #include #include -#include "compute_expr.h" namespace tvm { namespace arith { @@ -127,18 +126,18 @@ class LinearEqDetector Expr AddCombine(Expr a, Expr b) { if (!a.defined()) return b; if (!b.defined()) return a; - return ComputeExpr(a, b); + return a + b; } Expr SubCombine(Expr a, Expr b) { // Check b first in case they are both undefined if (!b.defined()) return a; if (!a.defined()) return -b; - return ComputeExpr(a, b); + return a - b; } Expr MulCombine(Expr a, Expr b) { if (!a.defined()) return a; if (!b.defined()) return b; - return ComputeExpr(a, b); + return a * b; } }; diff --git a/src/arithmetic/rewrite_simplify.cc b/src/arithmetic/rewrite_simplify.cc index bc8666e893b4e..773f6c3a85c40 100644 --- a/src/arithmetic/rewrite_simplify.cc +++ b/src/arithmetic/rewrite_simplify.cc @@ -155,7 +155,6 @@ Mutate_(const Add* op, const Expr& self) { TVM_TRY_REWRITE(max(x, y - z) + z, max(x + z, y)); TVM_TRY_REWRITE(max(x - z, y) + z, max(x, y + z)); - TVM_TRY_REWRITE_IF(min(x, y + z * c1) + z * c2, min(x + z * c2, y), c1.Eval()->value == -c2.Eval()->value); TVM_TRY_REWRITE_IF(max(x, y + z * c1) + z * c2, max(x + z * c2, y), @@ -343,13 +342,16 @@ Mutate_(const Sub* op, const Expr& self) { c1.Eval()->value != 0 && c3.Eval()->value == c1.Eval()->value * c2.Eval()->value); + // Proof in the case of floordiv, need positive condition. + // let x = a * c3 + r + // (x + c1) / c3 - x / c3 => (r + c1) / c3 TVM_TRY_REWRITE_IF((x + c1) / c3 - (x + c2) / c3, - ((x + (c1 % c3)) % c3 + (c1 - c2)) / c3, + ((x + ((c2 % c3) + c3) % c3) % c3 + (c1 - c2)) / c3, CanProveGreaterEqual(x.Eval(), -c2.Eval()->value) && c1.Eval()->value >= c2.Eval()->value && c3.Eval()->value > 0); TVM_TRY_REWRITE_IF((x + c1) / c3 - x / c3, - ((x + (c1 % c3)) % c3 + c1) / c3, + (x % c3 + c1) / c3, CanProveGreaterEqual(x.Eval(), 0) && c1.Eval()->value >= 0 && c3.Eval()->value > 0); @@ -1192,9 +1194,9 @@ Mutate_(const LT* op, const Expr& self) { TVM_TRY_RECURSIVE_REWRITE(c1 - y < x, c1 < x + y); TVM_TRY_RECURSIVE_REWRITE(c1 + y < x, c1 < x - y); - + TVM_TRY_RECURSIVE_REWRITE(x + c1 < c2, x < c2 - c1); + TVM_TRY_RECURSIVE_REWRITE(x - c1 < c2, x < c2 + c1); TVM_TRY_REWRITE(x - c1 < 0, x < c1); - TVM_TRY_REWRITE(x + c1 < c2, x < c2 - c1); } return ret; } diff --git a/src/arithmetic/stmt_simplify.cc b/src/arithmetic/stmt_simplify.cc index 01cb96ee1323e..fc6b92a87ce1d 100644 --- a/src/arithmetic/stmt_simplify.cc +++ b/src/arithmetic/stmt_simplify.cc @@ -28,15 +28,27 @@ #include #include #include -#include "arithmetic/Simplify.h" namespace tvm { namespace arith { -// statement simplifier + using namespace ir; class StmtSimplifier : public IRMutator { public: + using IRMutator::Mutate; + + Expr Mutate(Expr expr) final { + return analyzer_.Simplify(expr); + } + + Stmt Simplify(Stmt stmt, Map vrange) { + for (auto kv : vrange) { + analyzer_.Bind(kv.first, kv.second); + } + return Mutate(stmt); + } + Stmt Mutate_(const For* op, const Stmt& s) final { Var loop_var(op->loop_var.node_); analyzer_.Bind(loop_var, Range::make_by_min_extent(op->min, op->extent)); @@ -125,28 +137,12 @@ class StmtSimplifier : public IRMutator { std::unordered_map var_dom_; }; - -class CanonicalStmtSimplifier : 
public StmtSimplifier { - public: - using StmtSimplifier::Mutate; - Expr Mutate(Expr expr) final { - return analyzer_.canonical_simplify(expr); - } - - Stmt CanonicalSimplify(Stmt stmt, Map vrange) { - for (auto kv : vrange) { - analyzer_.Bind(kv.first, kv.second); - } - return Mutate(stmt); - } -}; - } // namespace arith namespace ir { Stmt CanonicalSimplify(Stmt stmt, Map vrange) { - return arith::CanonicalStmtSimplifier().CanonicalSimplify( + return arith::StmtSimplifier().Simplify( stmt, vrange); } @@ -158,42 +154,18 @@ Expr CanonicalSimplify(Expr expr, Map vrange) { return analyzer.canonical_simplify(expr); } -template -T Simplify_(T a, Map vrange) { - using namespace HalideIR::Internal; - Scope rscope; +Expr Simplify(Expr expr, Map vrange) { + arith::Analyzer analyzer; for (auto kv : vrange) { - Range r = kv.second; - rscope.push( - kv.first.get(), - Interval(r->min, - simplify(r->min + r->extent - make_const(r->min.type(), 1)))); - } - return HalideIR::Internal::simplify(a, true, rscope); -} - - -Expr Simplify(Expr a, Map vrange) { - // Simplify top level reduce. - if (const Reduce* r = a.as()) { - Array new_source; - for (auto& e : r->source) { - new_source.push_back(Simplify_(e, vrange)); - } - Expr new_condition = Simplify_(r->condition, vrange); - if (r->source.same_as(new_source) && - r->condition.same_as(new_condition)) { - return a; - } else { - return Reduce::make( - r->combiner, new_source, r->axis, new_condition, r->value_index); - } + analyzer.Bind(kv.first, kv.second); } - return Simplify_(a, vrange); + expr = analyzer.Simplify(expr); + return expr; } -Stmt Simplify(Stmt a, Map vrange) { - return Simplify_(a, vrange); +Stmt Simplify(Stmt stmt, Map vrange) { + return arith::StmtSimplifier().Simplify( + stmt, vrange); } } // namespace ir } // namespace tvm diff --git a/src/codegen/build_module.cc b/src/codegen/build_module.cc index 6917200ff9205..c1622338174df 100644 --- a/src/codegen/build_module.cc +++ b/src/codegen/build_module.cc @@ -342,7 +342,7 @@ Buffer BufferWithOffsetAlignment(Array shape, } return BufferNode::make(data, dtype, shape, Array(), elem_offset, name, "", - data_alignment, offset_factor); + data_alignment, offset_factor, kDefault); } void GetBinds(const Array& args, diff --git a/src/codegen/codegen_cuda.cc b/src/codegen/codegen_cuda.cc index 22dde1c463892..a32473158bd5f 100644 --- a/src/codegen/codegen_cuda.cc +++ b/src/codegen/codegen_cuda.cc @@ -6,9 +6,9 @@ * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. 
You may obtain a copy of the License at - * + * * http://www.apache.org/licenses/LICENSE-2.0 - * + * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY @@ -27,7 +27,6 @@ #include #include #include "codegen_cuda.h" -#include "../arithmetic/compute_expr.h" namespace tvm { namespace codegen { diff --git a/src/codegen/llvm/codegen_llvm.cc b/src/codegen/llvm/codegen_llvm.cc index 1e56583a37fd0..fde0486483b2b 100644 --- a/src/codegen/llvm/codegen_llvm.cc +++ b/src/codegen/llvm/codegen_llvm.cc @@ -748,9 +748,7 @@ void CodeGenLLVM::Scalarize(const Expr& e, std::function f) { if (const Ramp* ramp = e.as()) { for (int i = 0; i < ramp->type.lanes(); ++i) { - Expr offset = arith::ComputeExpr( - ramp->base, - arith::ComputeExpr(ramp->stride, i)); + Expr offset = ramp->base + (ramp->stride * i); f(i, MakeValue(offset)); } } else { diff --git a/src/codegen/spirv/codegen_spirv.cc b/src/codegen/spirv/codegen_spirv.cc index fd113ca4614a2..7686250c5ce57 100644 --- a/src/codegen/spirv/codegen_spirv.cc +++ b/src/codegen/spirv/codegen_spirv.cc @@ -25,8 +25,8 @@ #include #include #include -#include "../../arithmetic/compute_expr.h" #include "codegen_spirv.h" +#include "../../arithmetic/compute_expr.h" namespace tvm { namespace codegen { @@ -339,7 +339,7 @@ spirv::Value CodeGenSPIRV::VisitExpr_(const Ramp* op) { spirv::Value v = base; if (i != 0) { spirv::Value offset = MakeValue( - arith::ComputeExpr(make_const(op->stride.type(), i), op->stride)); + make_const(op->stride.type(), i) * op->stride); v = builder_->Add(v, offset); } values.push_back(v); @@ -419,9 +419,7 @@ void CodeGenSPIRV::Scalarize(const Expr& e, std::function f) { if (const Ramp* ramp = e.as()) { for (int i = 0; i < ramp->type.lanes(); ++i) { - Expr offset = arith::ComputeExpr( - ramp->base, - arith::ComputeExpr(ramp->stride, i)); + Expr offset = ramp->base + ramp->stride * i; f(i, MakeValue(offset)); } } else { diff --git a/src/lang/buffer.cc b/src/lang/buffer.cc index 8c584c50b3c67..cb5c86710fabb 100644 --- a/src/lang/buffer.cc +++ b/src/lang/buffer.cc @@ -6,9 +6,9 @@ * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. 
You may obtain a copy of the License at - * + * * http://www.apache.org/licenses/LICENSE-2.0 - * + * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY @@ -26,6 +26,7 @@ #include #include #include +#include #include "../arithmetic/compute_expr.h" namespace tvm { @@ -48,7 +49,8 @@ Buffer decl_buffer(Array shape, Expr(), name, "", - 0, 0); + 0, 0, + kDefault); } // Split the given expression w.r.t the add operator @@ -364,7 +366,8 @@ Buffer Buffer::MakeSlice(Array begins, Array extents) const { n->name + "_slice", n->scope, n->data_alignment, - 0); + 0, + n->buffer_type); } Expr Buffer::access_ptr(int access_mask, Type ptr_type, int content_lanes, Expr offset) const { @@ -375,8 +378,7 @@ Expr Buffer::access_ptr(int access_mask, Type ptr_type, int content_lanes, Expr extent = make_const(self->DefaultIndexType(), 1); } else if (self->strides.size() == self->shape.size()) { int highest_dim = 0; - extent = arith::ComputeExpr( - self->strides[highest_dim], self->shape[highest_dim]) - offset; + extent = self->strides[highest_dim] * self->shape[highest_dim] - offset; } else { extent = arith::ComputeReduce(self->shape, Expr()) - offset; } @@ -404,7 +406,8 @@ Buffer BufferNode::make(Var data, std::string name, std::string scope, int data_alignment, - int offset_factor) { + int offset_factor, + BufferType buffer_type) { auto n = make_node(); n->data = std::move(data); n->dtype = dtype; @@ -427,6 +430,12 @@ Buffer BufferNode::make(Var data, n->elem_offset = std::move(elem_offset); n->data_alignment = data_alignment; n->offset_factor = offset_factor; + n->buffer_type = buffer_type; + if (n->buffer_type == kAutoBroadcast && n->shape.size() > 0 && n->strides.empty()) { + for (size_t i = 0; i < n->shape.size(); ++i) { + n->strides.push_back(tvm::var("stride")); + } + } return Buffer(n); } diff --git a/src/op/scan_op.cc b/src/op/scan_op.cc index 42b1331e3736c..78f8c82d97dbf 100644 --- a/src/op/scan_op.cc +++ b/src/op/scan_op.cc @@ -6,9 +6,9 @@ * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at - * + * * http://www.apache.org/licenses/LICENSE-2.0 - * + * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY @@ -80,7 +80,7 @@ Operation ScanOpNode::make(std::string name, for (size_t i = 0; i < init.size(); ++i) { CHECK_EQ(init[i]->dtype, state_placeholder[i]->dtype); CHECK_EQ(init[i]->dtype, update[i]->dtype); - CHECK(can_prove(init[i]->shape[0] == axis->dom->min)) + CHECK(prove_equal(init[i]->shape[0], axis->dom->min)) << "init.shape[0] need to match scan_axis.dom.min"; CHECK(prove_equal( state_placeholder[i]->shape[0], axis->dom->min + axis->dom->extent)) diff --git a/src/pass/arg_binder.cc b/src/pass/arg_binder.cc index 2822393d3f75e..ff4c77accf073 100644 --- a/src/pass/arg_binder.cc +++ b/src/pass/arg_binder.cc @@ -6,9 +6,9 @@ * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. 
You may obtain a copy of the License at - * + * * http://www.apache.org/licenses/LICENSE-2.0 - * + * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY @@ -18,7 +18,6 @@ */ /*! - * Copyright (c) 2017 by Contributors * \file arg_binder.cc * \brief Helper utility to match and bind arguments. */ @@ -242,6 +241,21 @@ void ArgBinder::BindDLTensor(const Buffer& buffer, check = IfThenElse::make(Not::make(is_null), check, Stmt()); init_nest_.emplace_back(Block::make(check, Evaluate::make(0))); } + } else if (buffer->buffer_type == kAutoBroadcast) { + Type stype = buffer->DefaultIndexType(); + Expr stride = make_const(stype, 1); + for (size_t i = buffer->shape.size(); i != 0; --i) { + size_t k = i - 1; + std::ostringstream field_name; + field_name << v_strides->name_hint << '[' << k << ']'; + Expr value = cast(buffer->shape[k].type(), + Load::make(tvm_shape_type, v_strides, + IntImm::make(Int(32), k), const_true(1))); + value = tvm::if_then_else(is_null, stride, value); + value = tvm::if_then_else(buffer->shape[k] == 1, 0, value); + Bind_(buffer->strides[k], value, field_name.str(), true); + stride = Simplify(stride * buffer->shape[k]); + } } else { std::ostringstream stride_null_err_msg; stride_null_err_msg << arg_name << ".strides: expected non-null strides."; diff --git a/src/pass/inject_copy_intrin.cc b/src/pass/inject_copy_intrin.cc index a906ee3e54741..8df5fe1f77572 100644 --- a/src/pass/inject_copy_intrin.cc +++ b/src/pass/inject_copy_intrin.cc @@ -160,7 +160,7 @@ class CopyIntrinInjector : public IRMutator { store_strides[loop_var_size], store->buffer_var->name_hint, GetStorageScope(store->buffer_var.get()), - 0, 0); + 0, 0, kDefault); Buffer src = BufferNode::make( Var(load->buffer_var.node_), load->type, @@ -169,7 +169,7 @@ class CopyIntrinInjector : public IRMutator { src_elem_offset, load->buffer_var->name_hint, GetStorageScope(load->buffer_var.get()), - 0, 0); + 0, 0, kDefault); *out = flower_copy_fromto_(src, dst, pad_before, pad_after, pad_value); CHECK(out->defined()) << "flower function did not return correct stmt"; return true; diff --git a/src/pass/inject_double_buffer.cc b/src/pass/inject_double_buffer.cc index 94b4ab3cb4c93..027639caf7028 100644 --- a/src/pass/inject_double_buffer.cc +++ b/src/pass/inject_double_buffer.cc @@ -6,9 +6,9 @@ * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. 
You may obtain a copy of the License at - * + * * http://www.apache.org/licenses/LICENSE-2.0 - * + * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY @@ -26,6 +26,7 @@ #include #include #include +#include #include "ir_util.h" #include "../arithmetic/compute_expr.h" @@ -100,8 +101,8 @@ class DoubleBufferInjector : public IRMutator { Stmt Mutate_(const Allocate* op, const Stmt& s) final { auto it = dbuffer_info_.find(op->buffer_var.get()); if (it != dbuffer_info_.end()) { - it->second.stride = arith::ComputeReduce - (op->extents, Expr()) * op->type.lanes(); + it->second.stride = arith::ComputeReduce( + op->extents, Expr()) * op->type.lanes(); Stmt stmt = IRMutator::Mutate_(op, s); op = stmt.as(); Array new_extents{make_const(op->extents[0].type(), 2)}; @@ -135,11 +136,11 @@ class DoubleBufferInjector : public IRMutator { << "It is better to split with multiple of 2"; CHECK(is_zero(old_loop->min)); Expr zero = old_loop->min; - Expr new_ext = arith::ComputeExpr( - old_loop->extent, make_const(old_loop->loop_var.type(), 1)); + Expr new_ext = + old_loop->extent - make_const(old_loop->loop_var.type(), 1); Expr factor = make_const(new_ext.type(), split_loop_); - Expr outer_ext = arith::ComputeExpr
(new_ext, factor); - Expr tail_base = arith::ComputeExpr(outer_ext, factor); + Expr outer_ext = new_ext / factor; + Expr tail_base = outer_ext * factor; Var outer_var(old_loop->loop_var->name_hint + ".outer", old_loop->loop_var.type()); std::unordered_map vmap; std::vector loop_seq; diff --git a/src/pass/inject_virtual_thread.cc b/src/pass/inject_virtual_thread.cc index 9009416192e08..88e7f4370126f 100644 --- a/src/pass/inject_virtual_thread.cc +++ b/src/pass/inject_virtual_thread.cc @@ -6,9 +6,9 @@ * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at - * + * * http://www.apache.org/licenses/LICENSE-2.0 - * + * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY @@ -18,7 +18,6 @@ */ /*! - * Copyright (c) 2017 by Contributors * \file inject_virtual_thread.cc */ #include @@ -37,6 +36,7 @@ class ExprTouched final : public IRVisitor { explicit ExprTouched(const std::unordered_set &touched, bool check_write) : touched_var_(touched), check_write_(check_write) {} + void Visit(const NodeRef& n) final { // early stopping if (expr_touched_ && !check_write_) return; @@ -241,8 +241,8 @@ class VTInjector : public IRMutator { visit_touched_var_ = true; Expr offset = Mutate(op->args[2]); Expr extent = Mutate(op->args[3]); - Expr stride = arith::ComputeExpr
( - it->second, make_const(offset.type(), dtype.lanes())); + Expr stride = + it->second / make_const(offset.type(), dtype.lanes()); offset = stride * var_ + offset; return Call::make( op->type, op->name, diff --git a/src/pass/loop_partition.cc b/src/pass/loop_partition.cc index 0a5b7410f3cff..33dbaed83b697 100644 --- a/src/pass/loop_partition.cc +++ b/src/pass/loop_partition.cc @@ -466,8 +466,13 @@ Stmt LoopPartitioner::TryPartition(const Node* node, Stmt body, bool partition_thread_scope) { using namespace arith; + // include hint of var. + hint_map_.insert({var.get(), IntSet::interval(min, max)}); + PartitionFinder finder(var, hint_map_, relax_map_); finder.Visit(body); + + hint_map_.erase(var.get()); if (finder.partitions.empty()) return Stmt(); arith::IntervalSet for_interval(min, max); @@ -504,9 +509,9 @@ Stmt LoopPartitioner::TryPartition(const Node* node, bool pre_stmt_recurse = true; if (middle_interval_i->HasLowerBound()) { body_begin = ir::Simplify(middle_interval.min()); - if (!can_prove(body_begin == min)) { + if (!analyzer_.CanProve(body_begin == min)) { Expr cond = (body_begin - min >= 0); - if (!can_prove(cond)) { + if (!analyzer_.CanProve(cond)) { LOG(WARNING) << "Cannot prove: " << cond << ", when generating the pre doubt loop"; body_begin = Max::make(body_begin, min); @@ -529,10 +534,10 @@ Stmt LoopPartitioner::TryPartition(const Node* node, bool post_stmt_recurse = true; if (middle_interval_i->HasUpperBound()) { post_doubt_begin = ir::Simplify(middle_interval.max() + 1); - if (!can_prove(middle_interval.max() == max)) { + if (!analyzer_.CanProve(middle_interval.max() == max)) { // require the extent to be non-negative Expr cond = (max - post_doubt_begin + 1 >= 0); - if (!can_prove(cond)) { + if (!analyzer_.CanProve(cond)) { LOG(WARNING) << "Cannot prove: " << cond << ", when generating the post doubt loop"; post_doubt_begin = Min::make(post_doubt_begin, max); @@ -554,7 +559,7 @@ Stmt LoopPartitioner::TryPartition(const Node* node, // Generating code for middle subrange if (!partition_thread_scope) { Stmt mid_stmt; - if (!can_prove(body_begin >= post_doubt_begin)) { + if (!analyzer_.CanProve(body_begin >= post_doubt_begin)) { // [body_begin, post_doubt_begin) Stmt simplified_body = ConditionEliminator(cond_set, cond_value).Mutate(body); Stmt new_body = Substitute(simplified_body, {{Var{var}, var + body_begin}}); @@ -576,8 +581,8 @@ Stmt LoopPartitioner::TryPartition(const Node* node, s = AppendStmts(s, post_stmt); } else { Expr cond = const_true(); - if (!can_prove(body_begin == min)) cond = cond && (var >= body_begin); - if (!can_prove(post_doubt_begin == (max + 1))) cond = cond && (var < post_doubt_begin); + if (!analyzer_.CanProve(body_begin == min)) cond = cond && (var >= body_begin); + if (!analyzer_.CanProve(post_doubt_begin == (max + 1))) cond = cond && (var < post_doubt_begin); s = ThreadPartitionInserter(cond_set, cond).Mutate(stmt); } s = ConvertSSA(s); @@ -587,7 +592,7 @@ Stmt LoopPartitioner::TryPartition(const Node* node, inline Stmt LoopPartitioner::MakeFor(const Node *node, Expr extent, Stmt body) { const For *for_node = static_cast(node); CHECK(for_node); - if (can_prove(extent == make_const(Int(32), 1))) { + if (analyzer_.CanProve(extent == make_const(Int(32), 1))) { // If the loop extent is 1, do not create the loop anymore return Substitute(body, {{Var{for_node->loop_var}, make_const(Int(32), 0)}}); } else { diff --git a/src/pass/lower_thread_allreduce.cc b/src/pass/lower_thread_allreduce.cc index d0490b2152a0d..02c72d03fea89 100644 --- 
a/src/pass/lower_thread_allreduce.cc +++ b/src/pass/lower_thread_allreduce.cc @@ -6,9 +6,9 @@ * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at - * + * * http://www.apache.org/licenses/LICENSE-2.0 - * + * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY diff --git a/src/pass/lower_warp_memory.cc b/src/pass/lower_warp_memory.cc index 7d9d48600f715..bb7260fb5ddec 100644 --- a/src/pass/lower_warp_memory.cc +++ b/src/pass/lower_warp_memory.cc @@ -18,8 +18,6 @@ */ /*! - * Copyright (c) 2018 by Contributors - * * Lower warp memory to use local memory * and shuffle intrinsics. * diff --git a/src/pass/make_api.cc b/src/pass/make_api.cc index 13f46ecb6f7a2..0109ad19d7a67 100644 --- a/src/pass/make_api.cc +++ b/src/pass/make_api.cc @@ -6,9 +6,9 @@ * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at - * + * * http://www.apache.org/licenses/LICENSE-2.0 - * + * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY @@ -33,7 +33,6 @@ #include "ir_util.h" #include "arg_binder.h" -#include "../arithmetic/compute_expr.h" namespace tvm { namespace ir { diff --git a/src/pass/narrow_channel_access.cc b/src/pass/narrow_channel_access.cc index 731064edb0121..57f3baf20e108 100644 --- a/src/pass/narrow_channel_access.cc +++ b/src/pass/narrow_channel_access.cc @@ -6,9 +6,9 @@ * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at - * + * * http://www.apache.org/licenses/LICENSE-2.0 - * + * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY @@ -200,7 +200,7 @@ class ChannelAccessRewriter : public IRMutator { Expr base = linear_eq[1]; if (!is_zero(base)) return body; Expr left = ir::Simplify(adv_op->value - coeff * for_op->extent); - if (!can_prove(left >= 0)) return body; + if (!analyzer_.CanProve(left >= 0)) return body; // rewrite access index. ChannelAccessIndexRewriter rw( ch->handle_var.get(), var * coeff, read_access); @@ -233,6 +233,7 @@ class ChannelAccessRewriter : public IRMutator { return body; } + arith::Analyzer analyzer_; std::vector tasks_; }; diff --git a/src/pass/storage_flatten.cc b/src/pass/storage_flatten.cc index 215f6d7397323..19e7a32e4acf5 100644 --- a/src/pass/storage_flatten.cc +++ b/src/pass/storage_flatten.cc @@ -6,9 +6,9 @@ * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. 
You may obtain a copy of the License at - * + * * http://www.apache.org/licenses/LICENSE-2.0 - * + * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY @@ -211,7 +211,7 @@ class StorageFlattener : public IRMutator { stride = ir::Simplify(stride); } rstrides.push_back(stride); - stride = arith::ComputeExpr(stride, shape[dim]); + stride = stride * shape[dim]; } strides = Array(rstrides.rbegin(), rstrides.rend()); } @@ -220,7 +220,7 @@ class StorageFlattener : public IRMutator { Var(key.GetName(), Handle()), op->type, shape, strides, Expr(), key.GetName(), skey.to_string(), - align, 0); + align, 0, kDefault); buf_map_[key] = e; Stmt body = this->Mutate(op->body); @@ -237,7 +237,7 @@ class StorageFlattener : public IRMutator { int first_dim = 0; ret = Allocate::make( e.buffer->data, storage_type, - {arith::ComputeExpr(e.buffer->strides[first_dim], e.buffer->shape[first_dim])}, + {e.buffer->strides[first_dim] * e.buffer->shape[first_dim]}, make_const(Bool(e.buffer->dtype.lanes()), true), body); } else { shape = e.buffer->shape; @@ -414,8 +414,7 @@ class StorageFlattener : public IRMutator { if (be.bounds.size() != 0) { CHECK_EQ(tuple->args.size(), be.bounds.size() * 2); for (size_t i = 0; i < be.buffer->shape.size(); ++i) { - begins.push_back( - arith::ComputeExpr(tuple->args[2 * i], be.bounds[i]->min)); + begins.push_back(tuple->args[2 * i] - be.bounds[i]->min); extents.push_back(tuple->args[2 * i + 1]); } } else { diff --git a/src/pass/storage_rewrite.cc b/src/pass/storage_rewrite.cc index 806a80ad4dc90..eba1cee8b7c70 100644 --- a/src/pass/storage_rewrite.cc +++ b/src/pass/storage_rewrite.cc @@ -6,9 +6,9 @@ * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at - * + * * http://www.apache.org/licenses/LICENSE-2.0 - * + * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY @@ -606,7 +606,7 @@ class StoragePlanRewriter : public IRMutator { } // transform to alloc bytes auto type_bits = alloc_type.bits() * alloc_type.lanes(); - bool divided = can_prove(combo_size % type_bits == 0); + bool divided = analyzer_.CanProve(combo_size % type_bits == 0); combo_size = combo_size / type_bits; // round up for can not divided if (!divided) { @@ -920,6 +920,8 @@ class StoragePlanRewriter : public IRMutator { std::unordered_map alloc_map_; // The allocations std::vector > alloc_vec_; + // analyzer + arith::Analyzer analyzer_; }; // Turn alloc into vector alloc diff --git a/src/pass/unroll_loop.cc b/src/pass/unroll_loop.cc index ead234e2c4a08..756130886e13f 100644 --- a/src/pass/unroll_loop.cc +++ b/src/pass/unroll_loop.cc @@ -6,9 +6,9 @@ * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at - * + * * http://www.apache.org/licenses/LICENSE-2.0 - * + * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY @@ -18,7 +18,6 @@ */ /*! - * Copyright (c) 2017 by Contributors * Loop unrolling as in Halide pipeline. 
* \file unroll_loop.cc */ @@ -144,7 +143,6 @@ class LoopUnroller : public IRMutator { } Stmt Unroll(const For* op) { - using arith::ComputeExpr; int value = GetExtent(op); // For loop must have a constant integer extent CHECK_NE(value, -1) << "loop doesn't have a constant integer extent"; @@ -154,9 +152,7 @@ class LoopUnroller : public IRMutator { Stmt unrolled; for (int i = 0; i < value; ++i) { Var lv(op->loop_var.node_); - vmap.Set(lv, - ComputeExpr( - op->min, make_const(op->loop_var.type(), i))); + vmap.Set(lv, op->min + make_const(op->loop_var.type(), i)); Stmt step = Substitute(body, vmap); if (unrolled.defined()) { unrolled = Block::make(unrolled, step); diff --git a/src/pass/vectorize_loop.cc b/src/pass/vectorize_loop.cc index 8c3d383c1529a..2d8416e9a9de7 100644 --- a/src/pass/vectorize_loop.cc +++ b/src/pass/vectorize_loop.cc @@ -18,13 +18,13 @@ */ /*! - * Copyright (c) 2017 by Contributors * \file vectorize_loop.cc */ // Loop vectorizer as in Halide pipeline. #include #include #include +#include #include #include #include @@ -132,11 +132,11 @@ class Vectorizer : public IRMutator { if (lanes != 1) { const Ramp* b_ramp = b.as(); const Ramp* a_ramp = a.as(); - if (a_ramp && b.type().lanes() == 1 && can_prove(b > 0)) { + if (a_ramp && b.type().lanes() == 1 && analyzer_.CanProve(b > 0)) { return Ramp::make( a_ramp->base * b, a_ramp->stride * b, a_ramp->lanes); } - if (b_ramp && a.type().lanes() == 1 && can_prove(a > 0)) { + if (b_ramp && a.type().lanes() == 1 && analyzer_.CanProve(a > 0)) { return Ramp::make( b_ramp->base * a, b_ramp->stride * a, b_ramp->lanes); } @@ -186,7 +186,7 @@ class Vectorizer : public IRMutator { Expr stride = this->Mutate(op->stride); if (base.type().lanes() > 1 && stride.type().lanes() == 1) { const Ramp* base_ramp = base.as(); - if (can_prove(base_ramp->stride == stride * make_const(stride.type(), op->lanes))) { + if (analyzer_.CanProve(base_ramp->stride == stride * make_const(stride.type(), op->lanes))) { return Ramp::make(base_ramp->base, stride, op->lanes * base_ramp->lanes); } } @@ -423,6 +423,8 @@ class Vectorizer : public IRMutator { } private: + // analyzer + arith::Analyzer analyzer_; // variable to be replaced Var var_; // the lanes. @@ -483,13 +485,13 @@ class Vectorizer : public IRMutator { const Ramp* a_ramp = a.as(); if (a.type().lanes() == 1 && b_ramp) { return Ramp::make( - arith::ComputeExpr(a, b_ramp->base), - arith::ComputeExpr(make_zero(b_ramp->stride.type()), b_ramp->stride), + arith::Compute(a, b_ramp->base), + arith::Compute(make_zero(b_ramp->stride.type()), b_ramp->stride), b_ramp->lanes); } if (b.type().lanes() == 1 && a_ramp) { return Ramp::make( - arith::ComputeExpr(a_ramp->base, b), a_ramp->stride, a_ramp->lanes); + arith::Compute(a_ramp->base, b), a_ramp->stride, a_ramp->lanes); } } return T::make(BroadcastTo(a, lanes), BroadcastTo(b, lanes)); diff --git a/src/relay/backend/build_module.cc b/src/relay/backend/build_module.cc index 3feb7e4a4b543..7de77c8bcfd4b 100644 --- a/src/relay/backend/build_module.cc +++ b/src/relay/backend/build_module.cc @@ -21,6 +21,7 @@ * \file relay/backend/build_module.cc * \brief Code generation for TVM's graph runtime. */ +#include #include #include #include @@ -433,7 +434,7 @@ class RelayBuildModule : public runtime::ModuleNode { relay_module = Optimize(relay_module, targets_, params); CHECK(relay_module.defined()); // Get the updated function. - func = relay_module->Lookup(relay_module->entry_func->name_hint); + func = relay_module->Lookup("main"); // Generate code for the updated function. 
graph_codegen_ = std::unique_ptr(new GraphCodegen()); diff --git a/src/relay/backend/compile_engine.cc b/src/relay/backend/compile_engine.cc index 7ae1befcfe895..83e4a36ff4f93 100644 --- a/src/relay/backend/compile_engine.cc +++ b/src/relay/backend/compile_engine.cc @@ -27,7 +27,7 @@ #include #include #include -#include +#include #include #include #include diff --git a/src/relay/backend/compile_engine.h b/src/relay/backend/compile_engine.h index 9b510ad2fd293..9765cf90da18a 100644 --- a/src/relay/backend/compile_engine.h +++ b/src/relay/backend/compile_engine.h @@ -27,8 +27,9 @@ #define TVM_RELAY_BACKEND_COMPILE_ENGINE_H_ #include +#include #include -#include +#include #include #include diff --git a/src/relay/backend/graph_plan_memory.cc b/src/relay/backend/graph_plan_memory.cc index 5c2e5c4c289a1..91a597baceaf3 100644 --- a/src/relay/backend/graph_plan_memory.cc +++ b/src/relay/backend/graph_plan_memory.cc @@ -25,7 +25,7 @@ */ #include #include -#include +#include #include "../../common/arena.h" namespace tvm { diff --git a/src/relay/backend/interpreter.cc b/src/relay/backend/interpreter.cc index ff2d9e6117abb..913d7addea4d2 100644 --- a/src/relay/backend/interpreter.cc +++ b/src/relay/backend/interpreter.cc @@ -27,7 +27,7 @@ #include #include #include -#include +#include #include #include "compile_engine.h" @@ -103,7 +103,7 @@ TVM_STATIC_IR_FUNCTOR_REGISTER(IRPrinter, vtable) p->stream << "RefValueNode(" << node->value << ")"; }); -ConstructorValue ConstructorValueNode::make(int tag, +ConstructorValue ConstructorValueNode::make(int32_t tag, tvm::Array fields, Constructor constructor) { NodePtr n = make_node(); diff --git a/src/relay/backend/utils.h b/src/relay/backend/utils.h index 65a7efd4c2051..139dab21e973d 100644 --- a/src/relay/backend/utils.h +++ b/src/relay/backend/utils.h @@ -27,7 +27,6 @@ #include #include -#include #include #include #include diff --git a/src/relay/backend/vm/lambda_lift.cc b/src/relay/backend/vm/lambda_lift.cc index 668c024a8d550..6290ef7c6e932 100644 --- a/src/relay/backend/vm/lambda_lift.cc +++ b/src/relay/backend/vm/lambda_lift.cc @@ -26,7 +26,7 @@ #include #include #include -#include +#include #include #include #include diff --git a/src/relay/backend/vm/vm.cc b/src/relay/backend/vm/vm.cc index cf0b952005fcb..2f656c8cef992 100644 --- a/src/relay/backend/vm/vm.cc +++ b/src/relay/backend/vm/vm.cc @@ -28,17 +28,18 @@ #include #include #include -#include +#include namespace tvm { namespace relay { namespace vm { +runtime::vm::VirtualMachine CompileModule(const Module& mod); + using tvm::runtime::Object; using tvm::runtime::ObjectTag; using tvm::runtime::vm::VirtualMachine; - VirtualMachine FromModule(const Module& module, const std::vector& ctxs) { auto vm = CompileModule(module); vm.Init(ctxs); @@ -51,10 +52,10 @@ Object EvaluateModule(const Module& module, const std::vector ctxs, // TODO(zhiics): This measurement is for temporary usage. Remove it later. We // need to introduce a better profiling method. #if ENABLE_PROFILING - DLOG(INFO) << "Entry function is " << module->entry_func << std::endl; + DLOG(INFO) << "Entry function is main." 
<< std::endl; auto start = std::chrono::high_resolution_clock::now(); #endif // ENABLE_PROFILING - Object res = vm.Invoke(module->entry_func->name_hint, vm_args); + Object res = vm.Invoke("main", vm_args); #if ENABLE_PROFILING auto end = std::chrono::high_resolution_clock::now(); auto duration = std::chrono::duration_cast(end - start).count(); diff --git a/src/relay/ir/adt.cc b/src/relay/ir/adt.cc index b59281a4f1fd9..3eb1d99f5a889 100644 --- a/src/relay/ir/adt.cc +++ b/src/relay/ir/adt.cc @@ -6,9 +6,9 @@ * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at - * + * * http://www.apache.org/licenses/LICENSE-2.0 - * + * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY @@ -18,7 +18,7 @@ */ /*! - * Copyright (c) 2018 by Contributors + * Copyright (c) 2019 by Contributors * \file src/tvm/ir/adt.cc * \brief AST nodes for Relay algebraic data types (ADTs). */ diff --git a/src/relay/ir/alpha_equal.cc b/src/relay/ir/alpha_equal.cc index 81017d4fddfa6..42e66261a5533 100644 --- a/src/relay/ir/alpha_equal.cc +++ b/src/relay/ir/alpha_equal.cc @@ -26,7 +26,7 @@ #include #include #include -#include +#include #include "type_functor.h" #include "../../lang/attr_functor.h" diff --git a/src/relay/ir/expr_functor.cc b/src/relay/ir/expr_functor.cc index e09d790822274..0434e2ac59c64 100644 --- a/src/relay/ir/expr_functor.cc +++ b/src/relay/ir/expr_functor.cc @@ -6,9 +6,9 @@ * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at - * + * * http://www.apache.org/licenses/LICENSE-2.0 - * + * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY @@ -18,7 +18,7 @@ */ /*! - * Copyright (c) 2018 by Contributors + * Copyright (c) 2019 by Contributors * \file src/tvm/relay/expr_mutator.cc * \brief A wrapper around ExprFunctor which functionally updates the AST. * @@ -26,6 +26,7 @@ * the cost of using functional updates. */ #include +#include #include "type_functor.h" namespace tvm { @@ -345,7 +346,7 @@ void PostOrderVisit(const Expr& e, std::function fvisit) { ExprApplyVisit(fvisit).VisitExpr(e); } -TVM_REGISTER_API("relay._ir_pass.post_order_visit") +TVM_REGISTER_API("relay._analysis.post_order_visit") .set_body_typed([](Expr expr, PackedFunc f) { PostOrderVisit(expr, [f](const Expr& n) { f(n); @@ -353,7 +354,7 @@ TVM_REGISTER_API("relay._ir_pass.post_order_visit") }); // Implement bind. 
-class ExprBinder : public ExprMutator { +class ExprBinder : public ExprMutator, PatternMutator { public: explicit ExprBinder(const tvm::Map& args_map) : args_map_(args_map) { @@ -383,13 +384,26 @@ class ExprBinder : public ExprMutator { } } + Pattern VisitPattern(const Pattern& p) final { + return PatternMutator::VisitPattern(p); + } + + Clause VisitClause(const Clause& c) final { + Pattern pat = VisitPattern(c->lhs); + return ClauseNode::make(pat, VisitExpr(c->rhs)); + } + + Var VisitVar(const Var& v) final { + return Downcast(VisitExpr(v)); + } + private: const tvm::Map& args_map_; }; Expr Bind(const Expr& expr, const tvm::Map& args_map) { if (const FunctionNode* func = expr.as()) { - Expr new_body = ExprBinder(args_map).Mutate(func->body); + Expr new_body = ExprBinder(args_map).VisitExpr(func->body); Array new_params; for (Var param : func->params) { if (!args_map.count(param)) { @@ -406,7 +420,7 @@ Expr Bind(const Expr& expr, const tvm::Map& args_map) { func->type_params, func->attrs); } else { - return ExprBinder(args_map).Mutate(expr); + return ExprBinder(args_map).VisitExpr(expr); } } diff --git a/src/relay/ir/hash.cc b/src/relay/ir/hash.cc index c57475476e589..6039ba272ddc1 100644 --- a/src/relay/ir/hash.cc +++ b/src/relay/ir/hash.cc @@ -26,7 +26,7 @@ #include #include #include -#include +#include #include #include "type_functor.h" #include "../../lang/attr_functor.h" @@ -412,12 +412,12 @@ size_t StructuralHash::operator()(const Expr& expr) const { return RelayHashHandler().ExprHash(expr); } -TVM_REGISTER_API("relay._ir_pass._expr_hash") +TVM_REGISTER_API("relay._analysis._expr_hash") .set_body_typed([](NodeRef ref) { return static_cast(RelayHashHandler().Hash(ref)); }); -TVM_REGISTER_API("relay._ir_pass._type_hash") +TVM_REGISTER_API("relay._analysis._type_hash") .set_body_typed([](Type type) { return static_cast(RelayHashHandler().TypeHash(type)); }); diff --git a/src/relay/ir/module.cc b/src/relay/ir/module.cc index 58f614a3cc77c..0ad0a91efd217 100644 --- a/src/relay/ir/module.cc +++ b/src/relay/ir/module.cc @@ -23,7 +23,8 @@ * \brief The global module in Relay. */ #include -#include +#include +#include #include namespace tvm { @@ -45,18 +46,21 @@ Module ModuleNode::make(tvm::Map global_funcs, n->global_var_map_.Set(kv.first->name_hint, kv.first); } - n->entry_func = GlobalVarNode::make("main"); - for (const auto& kv : n->type_definitions) { // set global typevar map CHECK(!n->global_type_var_map_.count(kv.first->var->name_hint)) << "Duplicate global type definition name " << kv.first->var->name_hint; n->global_type_var_map_.Set(kv.first->var->name_hint, kv.first); + n->RegisterConstructors(kv.first, kv.second); } return Module(n); } +bool ModuleNode::ContainGlobalVar(const std::string& name) const { + return global_var_map_.find(name) != global_var_map_.end(); +} + GlobalVar ModuleNode::GetGlobalVar(const std::string& name) const { auto it = global_var_map_.find(name); CHECK(it != global_var_map_.end()) @@ -88,8 +92,9 @@ GlobalTypeVar ModuleNode::GetGlobalTypeVar(const std::string& name) const { } void ModuleNode::Add(const GlobalVar& var, - const Function& func, + const Function& f, bool update) { + Function func = Downcast(DeDup(f)); // Type check the item before we add it to the module. 
auto mod = GetRef(this); Function checked_func = InferType(func, mod, var); @@ -106,15 +111,25 @@ void ModuleNode::Add(const GlobalVar& var, AddUnchecked(var, checked_func); } +void ModuleNode::RegisterConstructors(const GlobalTypeVar& var, const TypeData& type) { + // We hash the global type var name to use as a globally unique prefix for tags. + // The hash will be used as the most significant byte of the tag, with the index of + // the constructor in the less significant bytes + size_t hash = std::hash()(var->var->name_hint); + int32_t prefix = static_cast(hash & 0xff) << 24; + for (size_t i = 0; i < type->constructors.size(); ++i) { + type->constructors[i]->tag = prefix | static_cast(i); + constructor_tag_map_[type->constructors[i]->tag] = type->constructors[i]; + } +} + void ModuleNode::AddDef(const GlobalTypeVar& var, const TypeData& type) { this->type_definitions.Set(var, type); // set global type var map CHECK(!global_type_var_map_.count(var->var->name_hint)) << "Duplicate global type definition name " << var->var->name_hint; global_type_var_map_.Set(var->var->name_hint, var); - for (size_t i = 0; i < type->constructors.size(); ++i) { - type->constructors[i]->tag = i; - } + RegisterConstructors(var, type); // need to kind check at the end because the check can look up // a definition potentially @@ -157,6 +172,13 @@ TypeData ModuleNode::LookupDef(const std::string& name) const { return this->LookupDef(id); } +Constructor ModuleNode::LookupTag(const int32_t tag) { + auto it = constructor_tag_map_.find(tag); + CHECK(it != constructor_tag_map_.end()) + << "There is no constructor with the tag " << tag; + return (*it).second; +} + void ModuleNode::Update(const Module& mod) { for (auto pair : mod->functions) { this->Update(pair.first, pair.second); @@ -174,7 +196,8 @@ Module ModuleNode::FromExpr( } else { func = FunctionNode::make({}, expr, Type(), {}, {}); } - mod->Add(mod->entry_func, func); + auto main_gv = GlobalVarNode::make("main"); + mod->Add(main_gv, func); return mod; } @@ -183,8 +206,27 @@ TVM_REGISTER_NODE_TYPE(ModuleNode); TVM_REGISTER_API("relay._make.Module") .set_body_typed(ModuleNode::make); -TVM_REGISTER_API("relay._make.Module_Add") -.set_body_method(&ModuleNode::Add); +TVM_REGISTER_API("relay._module.Module_Add") +.set_body([](TVMArgs args, TVMRetValue* ret) { + Module mod = args[0]; + GlobalVar var = args[1]; + NodeRef val = args[2]; + bool update = args[3]; + CHECK(val->derived_from()); + if (val->derived_from()) { + mod->Add(var, Downcast(val), update); + } else if (val->derived_from()) { + GlobalVar gv = Downcast(val); + auto mod_copy = Module(make_node(*mod.operator->())); + mod_copy = transform::EtaExpand()(mod_copy); + auto func = mod_copy->Lookup(gv->name_hint); + mod->Add(var, Downcast(func), update); + } else { + auto func = FunctionNode::make({}, Downcast(val), Type(nullptr), {}); + mod->Add(var, func, update); + } + *ret = mod; +}); TVM_REGISTER_API("relay._module.Module_AddDef") .set_body_method(&ModuleNode::AddDef); @@ -192,44 +234,52 @@ TVM_REGISTER_API("relay._module.Module_AddDef") TVM_REGISTER_API("relay._module.Module_GetGlobalVar") .set_body_method(&ModuleNode::GetGlobalVar); +TVM_REGISTER_API("relay._module.Module_ContainGlobalVar") +.set_body_method(&ModuleNode::ContainGlobalVar); + TVM_REGISTER_API("relay._module.Module_GetGlobalTypeVar") .set_body_method(&ModuleNode::GetGlobalTypeVar); TVM_REGISTER_API("relay._module.Module_Lookup") .set_body_typed([](Module mod, GlobalVar var) { - return mod->Lookup(var); - }); + return mod->Lookup(var); +}); 
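The tag scheme set up by `RegisterConstructors` can be checked in isolation; the standalone sketch below mirrors its computation, with "List" as an illustrative ADT name that is not taken from the patch.

```cpp
#include <cstdint>
#include <functional>
#include <iostream>
#include <string>

int main() {
  // Mirror of RegisterConstructors: the top byte of the 32-bit tag comes from a hash
  // of the ADT name, the low bytes from the constructor's index in its TypeData.
  size_t hash = std::hash<std::string>()("List");
  int32_t prefix = static_cast<int32_t>(hash & 0xff) << 24;
  int32_t nil_tag = prefix | 0;    // first constructor
  int32_t cons_tag = prefix | 1;   // second constructor
  // ModuleNode::LookupTag(cons_tag) would recover the Constructor from such a tag.
  std::cout << std::hex << nil_tag << " " << cons_tag << std::endl;
  return 0;
}
```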
TVM_REGISTER_API("relay._module.Module_Lookup_str") .set_body_typed([](Module mod, std::string var) { - return mod->Lookup(var); - }); + return mod->Lookup(var); +}); TVM_REGISTER_API("relay._module.Module_LookupDef") .set_body_typed([](Module mod, GlobalTypeVar var) { - return mod->LookupDef(var); - }); + return mod->LookupDef(var); +}); TVM_REGISTER_API("relay._module.Module_LookupDef_str") .set_body_typed([](Module mod, std::string var) { - return mod->LookupDef(var); + return mod->LookupDef(var); +}); + +TVM_REGISTER_API("relay._module.Module_LookupTag") +.set_body_typed([](Module mod, int32_t tag) { + return mod->LookupTag(tag); }); TVM_REGISTER_API("relay._module.Module_FromExpr") .set_body_typed([](Expr e) { - return ModuleNode::FromExpr(e); + return ModuleNode::FromExpr(e); }); TVM_REGISTER_API("relay._module.Module_Update") .set_body_typed([](Module mod, Module from) { - mod->Update(from); - }); + mod->Update(from); +}); TVM_STATIC_IR_FUNCTOR_REGISTER(IRPrinter, vtable) .set_dispatch( - [](const ModuleNode *node, tvm::IRPrinter *p) { - p->stream << "ModuleNode( " << node->functions << ")"; - }); + [](const ModuleNode *node, tvm::IRPrinter *p) { + p->stream << "ModuleNode( " << node->functions << ")"; +}); } // namespace relay } // namespace tvm diff --git a/src/relay/ir/pretty_printer.cc b/src/relay/ir/pretty_printer.cc index 7a61079204edc..39fc36fba4baf 100644 --- a/src/relay/ir/pretty_printer.cc +++ b/src/relay/ir/pretty_printer.cc @@ -645,11 +645,21 @@ class PrettyPrinter : Doc VisitType_(const FuncTypeNode* node) final { Doc doc; + doc << "fn "; + if (node->type_params.size() != 0) { + doc << "<"; + std::vector type_params; + for (Type type_param : node->type_params) { + type_params.push_back(Print(type_param)); + } + doc << PrintVec(type_params); + doc << ">"; + } std::vector arg_types; for (Type arg_type : node->arg_types) { arg_types.push_back(Print(arg_type)); } - return doc << "fn (" << PrintVec(arg_types) << ") -> " << Print(node->ret_type); + return doc << "(" << PrintVec(arg_types) << ") -> " << Print(node->ret_type); } Doc VisitType_(const RefTypeNode* node) final { diff --git a/src/relay/ir/type_functor.cc b/src/relay/ir/type_functor.cc index 9fca2e0326859..cde68c50daeff 100644 --- a/src/relay/ir/type_functor.cc +++ b/src/relay/ir/type_functor.cc @@ -92,6 +92,10 @@ void TypeVisitor::VisitType_(const TypeDataNode* op) { } } +Type TypeMutator::VisitType(const Type& t) { + return t.defined() ? TypeFunctor::VisitType(t) : t; +} + // Type Mutator. Array TypeMutator::MutateArray(Array arr) { // The array will do copy on write diff --git a/src/relay/ir/type_functor.h b/src/relay/ir/type_functor.h index 27ac288fe48db..c3ee14eedd487 100644 --- a/src/relay/ir/type_functor.h +++ b/src/relay/ir/type_functor.h @@ -139,6 +139,7 @@ class TypeVisitor : public TypeFunctor { // Mutator that transform a type to another one. class TypeMutator : public TypeFunctor { public: + Type VisitType(const Type& t) override; Type VisitType_(const TypeVarNode* op) override; Type VisitType_(const TensorTypeNode* op) override; Type VisitType_(const IncompleteTypeNode* op) override; diff --git a/src/relay/pass/alter_op_layout.cc b/src/relay/pass/alter_op_layout.cc index cc71968fba585..82424500ffc8e 100644 --- a/src/relay/pass/alter_op_layout.cc +++ b/src/relay/pass/alter_op_layout.cc @@ -24,7 +24,8 @@ other expressions. This pass can be used for computing convolution in custom layouts or other general weight pre-transformation. 
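For illustration only (not output copied from the patch or its tests), a polymorphic function type that previously printed as `fn (A, A) -> A` would now render its type parameter list explicitly:

```
fn <A>(A, A) -> A
```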
*/ -#include +#include +#include #include #include #include @@ -348,9 +349,6 @@ Expr AlterOpLayout(const Expr& expr) { return ForwardRewrite(expr, AlterOpLayoutRewrite, fcontext); } -TVM_REGISTER_API("relay._ir_pass.AlterOpLayout") -.set_body_typed(AlterOpLayout); - } // namespace alter_op_layout namespace transform { diff --git a/src/relay/pass/canonicalize_cast.cc b/src/relay/pass/canonicalize_cast.cc index 99f4a7f44e7e7..04fec248f81c9 100644 --- a/src/relay/pass/canonicalize_cast.cc +++ b/src/relay/pass/canonicalize_cast.cc @@ -22,7 +22,7 @@ * \file canonicalize_cast.cc * \brief Canonicalize cast expressions to make operator fusion more efficient. */ -#include +#include #include #include #include diff --git a/src/relay/pass/canonicalize_ops.cc b/src/relay/pass/canonicalize_ops.cc index ff9e2304a3bc3..fc0c43d200e5d 100644 --- a/src/relay/pass/canonicalize_ops.cc +++ b/src/relay/pass/canonicalize_ops.cc @@ -23,7 +23,7 @@ * \brief Canonicalize special operators to basic operators. This can simplify latter analysis. (e.g. Expand bias_add to expand_dims and broadcast_add.) */ -#include +#include #include #include #include @@ -61,9 +61,6 @@ Expr CanonicalizeOps(const Expr& e) { return BiasAddSimplifier().Mutate(e); } -TVM_REGISTER_API("relay._ir_pass.canonicalize_ops") -.set_body_typed(CanonicalizeOps); - namespace transform { Pass CanonicalizeOps() { diff --git a/src/relay/pass/combine_parallel_conv2d.cc b/src/relay/pass/combine_parallel_conv2d.cc index c95c1ddf8e160..d72705c8ce470 100644 --- a/src/relay/pass/combine_parallel_conv2d.cc +++ b/src/relay/pass/combine_parallel_conv2d.cc @@ -33,7 +33,7 @@ * convolution branches, such as Inception block. */ -#include +#include #include #include #include @@ -355,9 +355,6 @@ Expr CombineParallelConv2D(const Expr& expr, uint64_t min_num_branches) { return ParallelConv2DCombiner(min_num_branches).Combine(expr); } -TVM_REGISTER_API("relay._ir_pass.CombineParallelConv2D") -.set_body_typed(CombineParallelConv2D); - namespace transform { Pass CombineParallelConv2D(uint64_t min_num_branches) { diff --git a/src/relay/pass/de_duplicate.cc b/src/relay/pass/de_duplicate.cc new file mode 100644 index 0000000000000..d5d4f69606539 --- /dev/null +++ b/src/relay/pass/de_duplicate.cc @@ -0,0 +1,122 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +/*! + * Copyright (c) 2019 by Contributors + * + * \file de_duplicate.cc + * \brief Use a fresh Id for every Var to make the result well-formed. 
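With the direct `relay._ir_pass.*` registrations deleted in these hunks, the rewrites remain reachable through the pass objects the files keep. A sketch under that assumption, where `mod` is an existing `relay::Module` and the branch threshold is illustrative:

```cpp
// Run the kept transform-namespace passes over a module instead of the removed
// relay._ir_pass.* entry points.
mod = transform::CanonicalizeOps()(mod);
mod = transform::CombineParallelConv2D(3)(mod);  // min_num_branches = 3 is illustrative
```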
+ */ + +#include +#include +#include +#include "../ir/type_functor.h" + +namespace tvm { +namespace relay { + +Expr DeDup(const Expr& e) { + class DeDupMutator : public TypeMutator, + public ExprMutator, + public PatternMutator { + public: + TypeVar Fresh(const TypeVar& tv) { + TypeVar ret = TypeVarNode::make(tv->var->name_hint, tv->kind); + type_rename_[tv] = ret; + return ret; + } + + Var Fresh(const Var& v) { + Var ret = VarNode::make(v->name_hint(), VisitType(v->type_annotation)); + rename_[v] = ret; + return ret; + } + + Expr VisitExpr(const Expr& e) final { + return ExprMutator::VisitExpr(e); + } + + Expr VisitExpr_(const VarNode* op) final { + Var v = GetRef(op); + return rename_.count(v) != 0 ? rename_.at(v) : v; + } + + Expr VisitExpr_(const LetNode* op) final { + Var v = Fresh(op->var); + return LetNode::make(v, VisitExpr(op->value), VisitExpr(op->body)); + } + + Type VisitType(const Type& t) final { + return t.defined() ? TypeMutator::VisitType(t) : t; + } + + Expr VisitExpr_(const FunctionNode* op) final { + tvm::Array type_params; + for (const TypeVar& type_param : op->type_params) { + type_params.push_back(Fresh(type_param)); + } + tvm::Array params; + for (const Var& param : op->params) { + params.push_back(Fresh(param)); + } + return FunctionNode::make(params, + VisitExpr(op->body), + VisitType(op->ret_type), + type_params, + op->attrs); + } + + Pattern VisitPattern(const Pattern& p) final { + return PatternMutator::VisitPattern(p); + } + + Pattern VisitPattern_(const PatternVarNode* op) final { + return PatternVarNode::make(Fresh(op->var)); + } + + Clause VisitClause(const Clause& c) final { + Pattern pat = VisitPattern(c->lhs); + return ClauseNode::make(pat, VisitExpr(c->rhs)); + } + + Type VisitType_(const TypeVarNode* op) final { + TypeVar v = GetRef(op); + return type_rename_.count(v) != 0 ? type_rename_.at(v) : v; + } + + Var VisitVar(const Var& v) final { + return Fresh(v); + } + + private: + std::unordered_map rename_; + std::unordered_map type_rename_; + }; + + Expr ret = DeDupMutator().VisitExpr(e); + CHECK_EQ(FreeVars(ret).size(), FreeVars(e).size()); + return ret; +} + +TVM_REGISTER_API("relay._transform.dedup") +.set_body_typed(DeDup); + +} // namespace relay +} // namespace tvm diff --git a/src/relay/pass/dead_code.cc b/src/relay/pass/dead_code.cc index 7e186f80df929..54075f0699e6f 100644 --- a/src/relay/pass/dead_code.cc +++ b/src/relay/pass/dead_code.cc @@ -28,8 +28,9 @@ * CalcDep turn an expr into a dependency graph of expr, * GenLet turn the dependency graph into a let list, taking only the used value. */ -#include +#include #include +#include #include "let_list.h" namespace tvm { @@ -156,9 +157,6 @@ Expr DeadCodeElimination(const Expr& e, bool inline_once) { return CalcDep::Eliminate(e, inline_once); } -TVM_REGISTER_API("relay._ir_pass.dead_code_elimination") -.set_body_typed(DeadCodeElimination); - namespace transform { Pass DeadCodeElimination(bool inline_once) { diff --git a/src/relay/pass/dependency_graph.h b/src/relay/pass/dependency_graph.h index 7f53918ebcb7f..5e2b08c352f09 100644 --- a/src/relay/pass/dependency_graph.h +++ b/src/relay/pass/dependency_graph.h @@ -20,7 +20,7 @@ /*! * Copyright (c) 2019 by Contributors. * \file tvm/relay/pass/dependency_graph.h - * \brief + * \brief create a dependency graph. 
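A minimal sketch of how the new pass is meant to be used, mirroring the `DeDup` call added to `ModuleNode::Add` earlier in this patch; `f`, `gv`, and `mod` are assumed to exist.

```cpp
// Fresh Ids for every Var/TypeVar, so the same body can be added to a module twice
// without aliasing binders; DeDup itself asserts the set of free vars is preserved.
Function fresh = Downcast<Function>(DeDup(f));
CHECK_EQ(FreeVars(fresh).size(), FreeVars(f).size());
mod->Add(gv, fresh);
```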
*/ #ifndef TVM_RELAY_PASS_DEPENDENCY_GRAPH_H_ #define TVM_RELAY_PASS_DEPENDENCY_GRAPH_H_ diff --git a/src/relay/pass/device_annotation.cc b/src/relay/pass/device_annotation.cc index 8eeb493f1feba..aec974b184d3f 100644 --- a/src/relay/pass/device_annotation.cc +++ b/src/relay/pass/device_annotation.cc @@ -34,7 +34,6 @@ #include #include #include -#include #include #include @@ -559,13 +558,13 @@ Map CollectDeviceAnnotationOps(const Expr& expr) { return AnnotatationVisitor::GetAnnotations(expr); } -TVM_REGISTER_API("relay._ir_pass.CollectDeviceInfo") +TVM_REGISTER_API("relay._analysis.CollectDeviceInfo") .set_body_typed(CollectDeviceInfo); -TVM_REGISTER_API("relay._ir_pass.RewriteDeviceAnnotation") +TVM_REGISTER_API("relay._analysis.RewriteDeviceAnnotation") .set_body_typed(RewriteAnnotatedOps); -TVM_REGISTER_API("relay._ir_pass.CollectDeviceAnnotationOps") +TVM_REGISTER_API("relay._analysis.CollectDeviceAnnotationOps") .set_body_typed(CollectDeviceAnnotationOps); namespace transform { diff --git a/src/relay/pass/eliminate_common_subexpr.cc b/src/relay/pass/eliminate_common_subexpr.cc index 883681adcaf45..33a791b2bd996 100644 --- a/src/relay/pass/eliminate_common_subexpr.cc +++ b/src/relay/pass/eliminate_common_subexpr.cc @@ -27,7 +27,7 @@ * to replace an expression with a previously appeared expression with the same input and * attributes. The fskip callback argument allows us to skip specific expressions. */ -#include +#include #include #include #include @@ -85,9 +85,6 @@ Expr EliminateCommonSubexpr(const Expr& expr, PackedFunc callback) { return CommonSubexprEliminator(callback)(expr); } -TVM_REGISTER_API("relay._ir_pass.eliminate_common_subexpr") -.set_body_typed(EliminateCommonSubexpr); - namespace transform { Pass EliminateCommonSubexpr(PackedFunc fskip) { diff --git a/src/relay/pass/eta_expand.cc b/src/relay/pass/eta_expand.cc index 3139d41d63937..e73e3778395e9 100644 --- a/src/relay/pass/eta_expand.cc +++ b/src/relay/pass/eta_expand.cc @@ -25,7 +25,8 @@ * \brief Add abstraction over a function. For example, abs will become (fun x -> abs x). 
* */ -#include +#include +#include namespace tvm { namespace relay { @@ -44,10 +45,8 @@ Expr EtaExpand(const Expr& e, const Module& mod) { original_type_params = func->type_params; ret_type = func->ret_type; } else { - auto inferred = InferType(e, mod); - CHECK(inferred->is_type()); - - auto func = GetRef(inferred.as_derived()); + CHECK(e->is_type()); + auto func = GetRef(e.as_derived()); original_params = func->params; original_type_params = func->type_params; ret_type = func->ret_type; @@ -62,19 +61,18 @@ Expr EtaExpand(const Expr& e, const Module& mod) { auto new_func = FunctionNode::make(args, CallNode::make(e, params), ret_type, original_type_params); - return InferType(new_func, mod); + return new_func; } -TVM_REGISTER_API("relay._ir_pass.eta_expand").set_body_typed(EtaExpand); - namespace transform { Pass EtaExpand() { runtime::TypedPackedFunc pass_func = [=](Function f, Module m, PassContext pc) { - return Downcast(EtaExpand(f, m)); - }; - return CreateFunctionPass(pass_func, 1, "EtaExpand", {}); + return Downcast(EtaExpand(f, m)); + }; + Pass expanded = CreateFunctionPass(pass_func, 1, "EtaExpand", {}); + return Sequential({expanded, InferType()}); } TVM_REGISTER_API("relay._transform.EtaExpand") diff --git a/src/relay/pass/feature.cc b/src/relay/pass/feature.cc index e86ca06211126..df3a5d7ecec52 100644 --- a/src/relay/pass/feature.cc +++ b/src/relay/pass/feature.cc @@ -23,7 +23,7 @@ * \brief Detect features used in Expr/Module */ #include -#include +#include #include #include #include @@ -97,7 +97,7 @@ Array PyDetectFeature(const Expr& expr, const Module& mod) { return static_cast>(fs); } -TVM_REGISTER_API("relay._ir_pass.detect_feature") +TVM_REGISTER_API("relay._analysis.detect_feature") .set_body_typed(PyDetectFeature); } // namespace relay diff --git a/src/relay/pass/fold_constant.cc b/src/relay/pass/fold_constant.cc index 815407038b082..7b896a8d0f7fe 100644 --- a/src/relay/pass/fold_constant.cc +++ b/src/relay/pass/fold_constant.cc @@ -21,7 +21,7 @@ * Copyright (c) 2018 by Contributors * \file constant_folding.cc */ -#include +#include #include #include #include @@ -156,9 +156,13 @@ class ConstantFolder : public ExprMutator { } // Constant evaluate a expression. Expr ConstEvaluate(Expr expr) { - expr = InferType(expr, Module(nullptr)); - expr = FuseOps(expr, 0, Module(nullptr)); - expr = InferType(expr, Module(nullptr)); + std::vector passes = {transform::FuseOps(0), + transform::InferType()}; + auto mod = ModuleNode::FromExpr(expr); + auto seq = transform::Sequential(passes); + mod = seq(mod); + auto entry_func = mod->Lookup("main"); + expr = expr.as() == nullptr ? entry_func->body : entry_func; return ValueToExpr(executor_(expr)); } // Evaluate shape_of op @@ -213,9 +217,6 @@ Expr FoldConstant(const Expr& expr) { Module(nullptr), ctx, target)).Mutate(expr); } -TVM_REGISTER_API("relay._ir_pass.FoldConstant") -.set_body_typed(FoldConstant); - namespace transform { Pass FoldConstant() { diff --git a/src/relay/pass/fold_scale_axis.cc b/src/relay/pass/fold_scale_axis.cc index 53089807ace5f..868a08f8b5769 100644 --- a/src/relay/pass/fold_scale_axis.cc +++ b/src/relay/pass/fold_scale_axis.cc @@ -26,7 +26,7 @@ * conv/dense operators. 
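Restated as a standalone sketch for readability (names as in the `ConstEvaluate` hunk above): the expression is wrapped in a fresh module, a `Sequential` of `FuseOps(0)` and `InferType` runs over it, and the checked result is read back from "main".

```cpp
auto mod = ModuleNode::FromExpr(expr);  // `expr` is the expression being folded
auto seq = transform::Sequential({transform::FuseOps(0), transform::InferType()});
mod = seq(mod);
auto entry_func = mod->Lookup("main");
// A bare expression becomes the body of "main"; a function is returned whole.
Expr evaluated = expr.as<FunctionNode>() == nullptr ? entry_func->body : entry_func;
```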
*/ #include -#include +#include #include #include #include @@ -545,10 +545,6 @@ Expr ForwardFoldScaleAxis(const Expr& data) { data, "FScaleAxisForwardRewrite", fcontext); } -// Expose the FoldScaleAxisFoward -TVM_REGISTER_API("relay._ir_pass.forward_fold_scale_axis") -.set_body_typed(ForwardFoldScaleAxis); - //---------------------------------------- // Implement backward transformations. //---------------------------------------- @@ -947,9 +943,6 @@ Expr BackwardFoldScaleAxis(const Expr& data) { return make_node()->Fold(data); } -TVM_REGISTER_API("relay._ir_pass.backward_fold_scale_axis") -.set_body_typed(BackwardFoldScaleAxis); - } // namespace fold_scale_axis namespace transform { @@ -964,6 +957,9 @@ Pass ForwardFoldScaleAxis() { {ir::StringImm::make("InferType")}); } +TVM_REGISTER_API("relay._transform.ForwardFoldScaleAxis") +.set_body_typed(ForwardFoldScaleAxis); + Pass BackwardFoldScaleAxis() { runtime::TypedPackedFunc pass_func = [=](Function f, Module m, PassContext pc) { @@ -974,6 +970,9 @@ Pass BackwardFoldScaleAxis() { {ir::StringImm::make("InferType")}); } +TVM_REGISTER_API("relay._transform.BackwardFoldScaleAxis") +.set_body_typed(BackwardFoldScaleAxis); + Pass FoldScaleAxis() { // FoldScaleAxis pass contains the following three passes. Therefore, we can // register it as a sequential pass. diff --git a/src/relay/pass/forward_rewrite.cc b/src/relay/pass/forward_rewrite.cc index 8ad61270e33a8..6c66d6e982a71 100644 --- a/src/relay/pass/forward_rewrite.cc +++ b/src/relay/pass/forward_rewrite.cc @@ -23,9 +23,9 @@ * \file forward_rewrite.cc * \brief Apply rewriting rules in a forward fashion. */ -#include #include #include +#include #include "pass_util.h" namespace tvm { @@ -206,37 +206,5 @@ Expr ForwardRewrite(const Expr& expr, return ForwardRewriter(&rewrite_func, fcontext, fmulti_ref_trigger).Rewrite(expr); } -namespace transform { - -using std::function; - -Pass ForwardRewrite(const std::string& rewrite_map_attr_name, - function fcontext, - function fmulti_ref_trigger) { - runtime::TypedPackedFunc pass_func = - [=](Function f, Module m, PassContext pc) { - return Downcast(ForwardRewrite(f, - rewrite_map_attr_name, - fcontext, - fmulti_ref_trigger)); - }; - return CreateFunctionPass(pass_func, 1, "ForwardRewrite", {}); -} - -Pass ForwardRewrite(const FForwardRewrite& rewrite_func, - function fcontext, - function fmulti_ref_trigger) { - runtime::TypedPackedFunc pass_func = - [=](Function f, Module m, PassContext pc) { - return Downcast(ForwardRewrite(f, - rewrite_func, - fcontext, - fmulti_ref_trigger)); - }; - return CreateFunctionPass(pass_func, 1, "ForwardRewriteFunc", {}); -} - -} // namespace transform - } // namespace relay } // namespace tvm diff --git a/src/relay/pass/fuse_ops.cc b/src/relay/pass/fuse_ops.cc index 9f940e54953b9..cdd2837463659 100644 --- a/src/relay/pass/fuse_ops.cc +++ b/src/relay/pass/fuse_ops.cc @@ -26,7 +26,7 @@ * Fuse necessary ops into a single one. 
*/ #include -#include +#include #include #include #include @@ -963,9 +963,6 @@ Expr FuseOps(const Expr& expr, int fuse_opt_level, const Module& module) { } } -TVM_REGISTER_API("relay._ir_pass.FuseOps") -.set_body_typed(FuseOps); - namespace transform { Pass FuseOps(int fuse_opt_level) { diff --git a/src/relay/pass/gradient.cc b/src/relay/pass/gradient.cc index 5d26f7adcff77..1abe7a94b621f 100644 --- a/src/relay/pass/gradient.cc +++ b/src/relay/pass/gradient.cc @@ -26,7 +26,8 @@ #include #include #include -#include +#include +#include #include "pattern_util.h" #include "let_list.h" #include "../ir/type_functor.h" @@ -246,7 +247,7 @@ Expr FirstOrderGradient(const Expr& re, const Module& mod) { return FunctionNode::make(f->params, body, GradRetType(GetRef(f)), {}); } -TVM_REGISTER_API("relay._ir_pass.first_order_gradient") +TVM_REGISTER_API("relay._analysis.first_order_gradient") .set_body_typed(FirstOrderGradient); struct ReverseADType : TypeMutator { @@ -351,7 +352,7 @@ Expr Gradient(const Expr& re, const Module& mod) { return FunctionNode::make(f->params, body, GradRetType(GetRef(f)), {}); } -TVM_REGISTER_API("relay._ir_pass.gradient") +TVM_REGISTER_API("relay._transform.gradient") .set_body_typed(Gradient); } // namespace relay diff --git a/src/relay/pass/kind_check.cc b/src/relay/pass/kind_check.cc index 976a2ef8ec54d..c0f4a7c5967d1 100644 --- a/src/relay/pass/kind_check.cc +++ b/src/relay/pass/kind_check.cc @@ -32,7 +32,7 @@ * We check this by ensuring the `dtype` field of a Tensor always * contains a data type such as `int`, `float`, `uint`. */ -#include +#include #include #include "../ir/type_functor.h" @@ -183,7 +183,7 @@ Kind KindCheck(const Type& t, const Module& mod) { return kc.Check(t); } -TVM_REGISTER_API("relay._ir_pass.check_kind") +TVM_REGISTER_API("relay._analysis.check_kind") .set_body([](TVMArgs args, TVMRetValue* ret) { if (args.size() == 1) { *ret = KindCheck(args[0], ModuleNode::make({}, {})); diff --git a/src/relay/pass/let_list.h b/src/relay/pass/let_list.h index 9f56b22fc13e9..73c5fe3abc22c 100644 --- a/src/relay/pass/let_list.h +++ b/src/relay/pass/let_list.h @@ -6,9 +6,9 @@ * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at - * + * * http://www.apache.org/licenses/LICENSE-2.0 - * + * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY @@ -18,7 +18,7 @@ */ /*! - * Copyright (c) 2018 by Contributors + * Copyright (c) 2019 by Contributors * \file let_list.h * \brief LetList record let binding and insert let expression implicitly. * using it, one can treat AST as value instead of expression, @@ -46,6 +46,11 @@ namespace relay { */ class LetList { public: + ~LetList() { + if (lets_.size() > 0 && !used_) { + LOG(WARNING) << "letlist not used"; + } + } /*! * \brief insert a binding. * @@ -64,13 +69,13 @@ class LetList { /*! * \brief insert a binding. * - * \param ty the type of the binding. - * * \param expr the value of the binding. * + * \param ty the type of the binding. + * * \return a Var that hold the inserted expr. */ - Var Push(Type ty, Expr expr) { + Var Push(Expr expr, Type ty) { return Push(VarNode::make("x", ty), expr); } @@ -82,7 +87,7 @@ class LetList { * \return a Var that hold the inserted expr. */ Var Push(Expr expr) { - return Push(Type(), expr); + return Push(expr, Type()); } /*! 
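The `Push` overload swap above only changes argument order; a sketch of the new call shape, with `ll`, `value`, and `ty` standing in for an existing `LetList`, `Expr`, and `Type`:

```cpp
Var x = ll.Push(value, ty);  // annotated binding, was ll.Push(ty, value)
Var y = ll.Push(value);      // the single-argument overload is unchanged
```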
@@ -129,6 +134,12 @@ class LetList { return ll.Get(f(&ll)); } + static Expr Let(const Expr& e, const std::function& f) { + return With([&](LetList* ll) { + return f(ll->Push(e)); + }); + } + private: std::vector > lets_; bool used_ = false; diff --git a/src/relay/pass/mac_count.cc b/src/relay/pass/mac_count.cc index 3d77fabe6fe91..48a0dfb847466 100644 --- a/src/relay/pass/mac_count.cc +++ b/src/relay/pass/mac_count.cc @@ -30,7 +30,7 @@ #include #include #include -#include +#include #include #include "pattern_util.h" @@ -88,11 +88,44 @@ int64_t ConvMacCount(const Call& call_node) { << "The dimension of the output tensor in Conv 2D should be 4 or 5."; int64_t count = GetCartesianProd(output_tensor) * GetCartesianProd(kernel_size); CHECK_EQ(input_channel % conv_2d_attr->groups, 0) - << "The number of input channels is not divisble by groups."; + << "The number of input channels is not divisble by groups."; count *= input_channel/conv_2d_attr->groups; return count; } +int64_t Conv2dTransposeMacCount(const Call& call_node) { + if (!call_node->checked_type_.defined()) { + LOG(WARNING) << "The infer type pass should be called before the mac count pass"; + return 0; + } + Array args = call_node->args; + CHECK(args.size() == 2) + << "The number of input arguments of a CONV 2D Transpose node should be 2."; + const auto* conv_2d_transpose_attr = call_node->attrs.as(); + const auto* data_type = args[0]->checked_type().as(); + Array data_shape = data_type->shape; + std::string data_layout = conv_2d_transpose_attr->data_layout; + int32_t C_ind = Layout(data_layout).IndexOf(LayoutAxis::Get('C')); + int32_t c_ind = Layout(data_layout).IndexOf(LayoutAxis::Get('c')); + CHECK(C_ind != -1) + << "There is no input channel dimension."; + int64_t input_channel = static_cast(data_shape[C_ind].as()->value); + if (c_ind != -1) + input_channel *= static_cast(data_shape[c_ind].as()->value); + Array kernel_size = conv_2d_transpose_attr->kernel_size; + CHECK(kernel_size.size() == 2) + << "The dimension of the kernel in Conv 2D Transpose should be 2."; + const auto* expr = call_node->checked_type().as(); + Array output_tensor = expr->shape; + CHECK(output_tensor.size() == 4 || output_tensor.size() == 5) + << "The dimension of the output tensor in Conv 2D Transpose should be 4 or 5."; + int64_t count = GetCartesianProd(output_tensor) * GetCartesianProd(kernel_size); + CHECK_EQ(input_channel % conv_2d_transpose_attr->groups, 0) + << "The number of input channels is not divisble by groups."; + count *= input_channel/conv_2d_transpose_attr->groups; + return count; +} + int64_t DenseMacCount(const Call& call_node) { if (!call_node->checked_type_.defined()) { LOG(WARNING) << "The infer type pass should be called before the mac count pass"; @@ -106,13 +139,13 @@ int64_t DenseMacCount(const Call& call_node) { Array data_shape = data_type->shape; Array weight_shape = weight_type->shape; CHECK(data_shape.size() == 2 && weight_shape.size() == 2) - << "The dimension of an input tensor to Dense node should be 2."; + << "The dimension of an input tensor to Dense node should be 2."; int64_t d1 = static_cast(data_shape[0].as()->value); int64_t d2 = static_cast(data_shape[1].as()->value); int64_t d3 = static_cast(weight_shape[0].as()->value); int64_t d4 = static_cast(weight_shape[1].as()->value); CHECK(d2 == d4) - << "The dimensions of input arguments do not match."; + << "The dimensions of input arguments do not match."; int64_t count = d1 * d2 * d3; return count; } @@ -120,6 +153,9 @@ int64_t DenseMacCount(const Call& call_node) { 
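A sketch of the new `LetList::Let` convenience added above: it binds the expression once and lets the callback build the remainder from the resulting `Var`. The `add` call is illustrative, not from the patch.

```cpp
// Bind `e` to a fresh var, then use that var twice in the generated body.
Expr doubled = LetList::Let(e, [](const Var& v) -> Expr {
  return CallNode::make(Op::Get("add"), {v, v}, Attrs(), {});
});
```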
RELAY_REGISTER_OP("nn.conv2d") .set_attr("FMacCount", ConvMacCount); +RELAY_REGISTER_OP("nn.conv2d_transpose") +.set_attr("FMacCount", Conv2dTransposeMacCount); + RELAY_REGISTER_OP("nn.dense") .set_attr("FMacCount", DenseMacCount); @@ -129,7 +165,8 @@ class MacCounter : private ExprVisitor { count_ = 0; } static int64_t GetTotalMacNumber(const Expr& expr) { - LOG(INFO) << "This pass only counts MACs in direct CONV 2D and Dense ops"; + LOG(INFO) << "This pass only counts MACs in direct CONV 2D, " + << "CONV 2D Transpose and Dense ops"; MacCounter counter; counter(expr); return counter.count_; @@ -151,7 +188,7 @@ int64_t GetTotalMacNumber(const Expr& expr) { return MacCounter::GetTotalMacNumber(expr); } -TVM_REGISTER_API("relay._ir_pass.GetTotalMacNumber") +TVM_REGISTER_API("relay._analysis.GetTotalMacNumber") .set_body_typed(GetTotalMacNumber); } // namespace mac_count diff --git a/src/relay/pass/match_exhaustion.cc b/src/relay/pass/match_exhaustion.cc index 173d6eacf528f..cc00a54cde0ab 100644 --- a/src/relay/pass/match_exhaustion.cc +++ b/src/relay/pass/match_exhaustion.cc @@ -32,7 +32,6 @@ #include #include #include -#include #include namespace tvm { @@ -236,15 +235,15 @@ Array UnmatchedCases(const Match& match, const Module& mod) { } // expose for testing only -TVM_REGISTER_API("relay._ir_pass.unmatched_cases") -.set_body_typed(const Match&, - const Module&)>([](const Match& match, - const Module& mod_ref) { - Module call_mod = mod_ref; - if (!call_mod.defined()) { - call_mod = ModuleNode::make({}, {}); - } - return UnmatchedCases(match, call_mod); - }); +TVM_REGISTER_API("relay._analysis.unmatched_cases") +.set_body_typed(const Match&, const Module&)>( + [](const Match& match, const Module& mod_ref) { + Module call_mod = mod_ref; + if (!call_mod.defined()) { + call_mod = ModuleNode::make({}, {}); + } + return UnmatchedCases(match, call_mod); + }); + } // namespace relay } // namespace tvm diff --git a/src/relay/pass/partial_eval.cc b/src/relay/pass/partial_eval.cc index b95c5844f8a40..3b7628a10789c 100644 --- a/src/relay/pass/partial_eval.cc +++ b/src/relay/pass/partial_eval.cc @@ -18,7 +18,7 @@ */ /*! - * Copyright (c) 2018 by Contributors + * Copyright (c) 2019 by Contributors * * \file partial_eval.cc * * @@ -64,7 +64,7 @@ * 3: The generated code reuses bindings (although they are not shadowed), * so we have to deduplicate them. * - * 4: In the generated code, multiple VarNode might have same Id. + * 4: In the generated code, as it calls TypeSubst, multiple VarNode might have same Id. * While it is permitted, most pass use NodeHash for Var, * and having multiple VarNode for same Id break them. * Thus we remap them to a single Id for now. @@ -91,7 +91,8 @@ * * These assumptions do not affect the correctness of the algorithm, however. */ -#include +#include +#include #include #include #include @@ -215,9 +216,9 @@ Static MkSRef() { } using Func = std::function&, - const Attrs&, - const Array&, - LetList*)>; + const Attrs&, + const Array&, + LetList*)>; struct SFuncNode : StaticNode { Func func; @@ -255,6 +256,7 @@ class Environment { void Insert(const Var& v, const PStatic& ps) { CHECK(ps.defined()); + CHECK_EQ(env_.back().locals.count(v), 0); env_.back().locals[v] = ps; } @@ -286,12 +288,17 @@ class Environment { /*! * \brief As our store require rollback, we implement it as a frame. - * every time we need to copy the store, a new frame is insert. - * every time we roll back, a frame is popped. + * + * Every time we need to copy the store, a new frame is inserted.
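A quick sanity check of the `Conv2dTransposeMacCount` formula above, with illustrative shapes that are not from the patch's tests:

```cpp
// output tensor 1 x 64 x 56 x 56, kernel 3 x 3, 32 input channels, groups = 1:
//   GetCartesianProd(output) = 1 * 64 * 56 * 56 = 200704
//   GetCartesianProd(kernel) = 3 * 3            = 9
//   count = 200704 * 9 * (32 / 1)               = 57802752 MACs
```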
+ * Every time we roll back, a frame is popped. */ struct StoreFrame { std::unordered_map store; - /*! \brief on unknown effect, history_valid is set to true to signal above frame is outdated */ + /*! + * \brief On unknown effect, history_valid is set to true to signal above frame is outdated. + * + * It only outdate the frame above it, but not the current frame. + */ bool history_valid = true; explicit StoreFrame(const std::unordered_map& store) : store(store) { } StoreFrame() = default; @@ -309,6 +316,7 @@ class Store { } void Insert(const SRefNode* r, const PStatic& ps) { + CHECK(r); store_.back().store[r] = ps; } @@ -316,19 +324,21 @@ class Store { PStatic Lookup(const SRefNode* r) { auto rit = store_.rbegin(); while (rit != store_.rend()) { - if (!rit->history_valid) { - return PStatic(); - } if (rit->store.find(r) != rit->store.end()) { return rit->store.find(r)->second; } + if (!rit->history_valid) { + return PStatic(); + } ++rit; } return PStatic(); } void Invalidate() { - store_.back().history_valid = false; + StoreFrame sf; + sf.history_valid = false; + store_.push_back(sf); } private: @@ -340,6 +350,10 @@ class Store { store_->store_.push_back(StoreFrame()); } ~StoreFrameContext() { + // push one history valid frame off. + while (!store_->store_.back().history_valid) { + store_->store_.pop_back(); + } store_->store_.pop_back(); } }; @@ -425,8 +439,6 @@ TVM_ADD_FILELINE) Expr StripWithFuncId(const Expr& e); -Expr DeDup(const Expr& e); - Function AsFunc(const Expr& e) { if (e.as()) { return Downcast(e); @@ -443,13 +455,7 @@ Function AsFunc(const Expr& e) { class PartialEvaluator : public ExprFunctor, public PatternFunctor { public: - PartialEvaluator(const tvm::Array& free_vars, - const Module& mod) : - mod_(mod) { - for (const Var& v : free_vars) { - env_.Insert(v, NoStatic(v)); - } - } + PartialEvaluator(const Module& mod) : mod_(mod) { } PStatic VisitExpr(const Expr& e, LetList* ll) final { PStatic ret = ExprFunctor::VisitExpr(e, ll); @@ -485,23 +491,23 @@ class PartialEvaluator : public ExprFunctor return env_.Lookup(GetRef(op)); } - PStatic VisitExpr_(const GlobalVarNode* op, LetList* ll) final { - GlobalVar gv = GetRef(op); + PStatic VisitGlobalVar(const GlobalVar& gv) { + CHECK(mod_.defined()); if (gv_map_.count(gv) == 0) { - if (mod_.defined()) { - Function func = mod_->Lookup(gv); - InitializeFuncId(func); - Func f = VisitFuncStatic(func, gv); - gv_map_.insert({gv, HasStatic(MkSFunc(f), gv)}); - func = AsFunc(PostProcess(VisitFuncDynamic(func, f))); - mod_->Update(gv, func); - } else { - gv_map_.insert({gv, NoStatic(gv)}); - } + Function func = mod_->Lookup(gv); + InitializeFuncId(func); + Func f = VisitFuncStatic(func, gv); + gv_map_.insert({gv, HasStatic(MkSFunc(f), gv)}); + func = AsFunc(PostProcess(VisitFuncDynamic(func, f))); + mod_->Update(gv, func); } return gv_map_.at(gv); } + PStatic VisitExpr_(const GlobalVarNode* op, LetList* ll) final { + return VisitGlobalVar(GetRef(op)); + } + PStatic VisitExpr_(const LetNode* op, LetList* ll) final { env_.Insert(op->var, VisitExpr(op->value, ll)); return VisitExpr(op->body, ll); @@ -630,7 +636,7 @@ class PartialEvaluator : public ExprFunctor subst.Set(func->type_params[i], type_args[i]); } for (size_t i = type_args.size(); i < func->type_params.size(); ++i) { - subst.Set(func->type_params[i], Type()); + subst.Set(func->type_params[i], IncompleteTypeNode::make(kType)); } std::vector