[INFRASTRUCTURE] Migrate to json based config. Move gemm test to integration. (#28)

* Migrate to json based config. Move gemm test to integration. * temp checkin * checkin example json

[INFRASTRUCTURE] Migrate to json based config. Move gemm test to integration. (#28)
* Migrate to json based config. Move gemm test to integration. * temp checkin * checkin example json
5c5806ba · Tianqi Chen · 666f32d6 · 5c5806ba · 5c5806ba · 5c5806ba
Commit 5c5806ba authored Apr 14, 2018 by Tianqi Chen
12 changed files
--- a/vta/Makefile
+++ b/vta/Makefile
 ROOTDIR = $(CURDIR)
-ifndef config
-ifneq ("$(wildcard ./config.mk)", "")
-	config = config.mk
-else
-	config = make/config.mk
-endif
-endif
-include $(config)
 export LDFLAGS = -pthread -lm
 export CFLAGS = -std=c++11 -Wall -O2 -Iinclude -fPIC
-ifdef NNVM_PATH
+VTA_CONFIG = python make/vta_config.py
-	CFLAGS += -I$(NNVM_PATH)/include
+CFLAGS += `${VTA_CONFIG} --cflags`
-else
+LDFLAGS += `${VTA_CONFIG} --ldflags`
-	NNVM_PATH = $(ROOTDIR)/nnvm
+VTA_TARGET := $(shell ${VTA_CONFIG} --target)
-	CFLAGS += -I$(NNVM_PATH)/include
-endif
-ifdef TVM_PATH
-	CFLAGS += -I$(TVM_PATH)/include -I$(TVM_PATH)/dlpack/include -I$(TVM_PATH)/HalideIR/src
-else
-	TVM_PATH = $(NNVM_PATH)/tvm
-	CFLAGS += -I$(TVM_PATH)/include -I$(TVM_PATH)/dlpack/include -I$(TVM_PATH)/HalideIR/src
-endif
-ifdef DMLC_CORE_PATH
-  CFLAGS += -I$(DMLC_CORE_PATH)/include
-else
-  CFLAGS += -I$(NNVM_PATH)/dmlc-core/include
-endif
-ifneq ($(ADD_CFLAGS), NONE)
-	CFLAGS += $(ADD_CFLAGS)
-endif
-ifneq ($(ADD_LDFLAGS), NONE)
-	LDFLAGS += $(ADD_LDFLAGS)
-endif
 UNAME_S := $(shell uname -s)
@@ -53,29 +21,30 @@ else
 	NO_WHOLE_ARCH= --no-whole-archive
 endif
-VTA_LIB_SRC = $(wildcard src/*.cc src/tvm/*.cc)
-ifeq ($(VTA_TARGET), pynq)
+VTA_LIB_SRC = $(wildcard src/*.cc)
+ifeq (${VTA_TARGET}, pynq)
 	VTA_LIB_SRC += $(wildcard src/pynq/*.cc)
-	LDFLAGS += -L/usr/lib -lsds_lib
-	LDFLAGS += -L/opt/python3.6/lib/python3.6/site-packages/pynq/drivers/
-	LDFLAGS += -L/opt/python3.6/lib/python3.6/site-packages/pynq/lib/
-	LDFLAGS += -l:libdma.so
 endif
-ifeq ($(VTA_TARGET), sim)
+ifeq (${VTA_TARGET}, sim)
 	VTA_LIB_SRC += $(wildcard src/sim/*.cc)
 endif
 VTA_LIB_OBJ = $(patsubst src/%.cc, build/%.o, $(VTA_LIB_SRC))
-all: lib/libvta.so
+all: lib/libvta.so lib/libvta.so.json
 build/%.o: src/%.cc
 	@mkdir -p $(@D)
 	$(CXX) $(CFLAGS) -MM -MT build/$*.o $< >build/$*.d
 	$(CXX) -c $(CFLAGS) -c $< -o $@
+# Dump the configuration printed by the config tool next to the library.
+# The output goes to a temporary file that is renamed on success, so a
+# failing config script cannot leave an empty but up-to-date-looking target.
+lib/libvta.so.json: lib/libvta.so
+	@mkdir -p $(@D)
+	${VTA_CONFIG} --cfg-json > $@.tmp && mv -f $@.tmp $@
 lib/libvta.so: $(VTA_LIB_OBJ)
 	@mkdir -p $(@D)
 	$(CXX) $(CFLAGS) -shared -o $@ $(filter %.o, $^) $(LDFLAGS)

--- a/vta/make/README.md
+++ b/vta/make/README.md
+# VTA Configuration
+Each VTA runtime/hardware configuration is specified by a config.json file.
+You can copy make/config.json to the project root and modify the
+configuration before you type make.
+The config affects the behavior of the python package as well as
+the hardware runtime build.
\ No newline at end of file
--- a/vta/make/config.json
+++ b/vta/make/config.json
+{
+  "TARGET" : "pynq",
+  "LOG_INP_WIDTH" : 3,
+  "LOG_WGT_WIDTH" : 3,
+  "LOG_ACC_WIDTH" : 5,
+  "LOG_OUT_WIDTH" : 3,
+  "LOG_BATCH" : 0,
+  "LOG_BLOCK_IN" : 4,
+  "LOG_BLOCK_OUT" : 4,
+  "LOG_UOP_BUFF_SIZE" : 15,
+  "LOG_INP_BUFF_SIZE" : 15,
+  "LOG_WGT_BUFF_SIZE" : 15,
+  "LOG_ACC_BUFF_SIZE" : 17
+}
--- a/vta/make/config.mk
+++ b/vta/make/config.mk
-#-------------------------------------------------------------------------------
-#  Template configuration for compiling VTA runtime.
-#
-#  If you want to change the configuration, please use the following
-#  steps. Assume you are on the root directory of nnvm. First copy the this
-#  file so that any local changes will be ignored by git
-#
-#  $ cp make/config.mk .
-#
-#  Next modify the according entries, and then compile by
-#
-#  $ make
-#
-#  or build in parallel with 8 threads
-#
-#  $ make -j8
-#-------------------------------------------------------------------------------
-#---------------------
-# choice of compiler
-#--------------------
-# the additional link flags you want to add
-ADD_LDFLAGS=
-# the additional compile flags you want to add
-ADD_CFLAGS=
-# the hardware target, can be [sim, pynq]
-VTA_TARGET = pynq
-#---------------------
-# VTA hardware parameters
-#--------------------
-#  Log of input/activation width in bits (default 3 -> 8 bits)
-VTA_LOG_INP_WIDTH = 3
-#  Log of kernel weight width in bits (default 3 -> 8 bits)
-VTA_LOG_WGT_WIDTH = 3
-#  Log of accum width in bits (default 5 -> 32 bits)
-VTA_LOG_ACC_WIDTH = 5
-#  Log of tensor batch size (A in (A,B)x(B,C) matrix multiplication)
-VTA_LOG_BATCH = 0
-#  Log of tensor inner block size (B in (A,B)x(B,C) matrix multiplication)
-VTA_LOG_BLOCK_IN = 4
-#  Log of tensor outer block size (C in (A,B)x(B,C) matrix multiplication)
-VTA_LOG_BLOCK_OUT = 4
-#  Log of uop buffer size in Bytes
-VTA_LOG_UOP_BUFF_SIZE = 15
-#  Log of inp buffer size in Bytes
-VTA_LOG_INP_BUFF_SIZE = 15
-#  Log of wgt buffer size in Bytes
-VTA_LOG_WGT_BUFF_SIZE = 15
-#  Log of acc buffer size in Bytes
-VTA_LOG_ACC_BUFF_SIZE = 17
-#---------------------
-# Derived VTA hardware parameters
-#--------------------
-#  Input width in bits
-VTA_INP_WIDTH = $(shell echo "$$(( 1 << $(VTA_LOG_INP_WIDTH) ))" )
-#  Weight width in bits
-VTA_WGT_WIDTH = $(shell echo "$$(( 1 << $(VTA_LOG_WGT_WIDTH) ))" )
-#  Log of output width in bits
-VTA_LOG_OUT_WIDTH = $(VTA_LOG_INP_WIDTH)
-#  Output width in bits
-VTA_OUT_WIDTH = $(shell echo "$$(( 1 << $(VTA_LOG_OUT_WIDTH) ))" )
-#  Tensor batch size
-VTA_BATCH = $(shell echo "$$(( 1 << $(VTA_LOG_BATCH) ))" )
-#  Tensor outer block size
-VTA_IN_BLOCK = $(shell echo "$$(( 1 << $(VTA_LOG_BLOCK_IN) ))" )
-#  Tensor inner block size
-VTA_OUT_BLOCK = $(shell echo "$$(( 1 << $(VTA_LOG_BLOCK_OUT) ))" )
-#  Uop buffer size in Bytes
-VTA_UOP_BUFF_SIZE = $(shell echo "$$(( 1 << $(VTA_LOG_UOP_BUFF_SIZE) ))" )
-#  Inp buffer size in Bytes
-VTA_INP_BUFF_SIZE = $(shell echo "$$(( 1 << $(VTA_LOG_INP_BUFF_SIZE) ))" )
-#  Wgt buffer size in Bytes
-VTA_WGT_BUFF_SIZE = $(shell echo "$$(( 1 << $(VTA_LOG_WGT_BUFF_SIZE) ))" )
-#  Acc buffer size in Bytes
-VTA_ACC_BUFF_SIZE = $(shell echo "$$(( 1 << $(VTA_LOG_ACC_BUFF_SIZE) ))" )
-#  Log of out buffer size in Bytes
-VTA_LOG_OUT_BUFF_SIZE = \
-$(shell echo "$$(( $(VTA_LOG_ACC_BUFF_SIZE) + $(VTA_LOG_OUT_WIDTH) - $(VTA_LOG_ACC_WIDTH) ))" )
-#  Out buffer size in Bytes
-VTA_OUT_BUFF_SIZE = $(shell echo "$$(( 1 << $(VTA_LOG_OUT_BUFF_SIZE) ))" )
-# Update ADD_CFLAGS
-ADD_CFLAGS +=
-	-DVTA_TARGET=$(VTA_TARGET)\
-	-DVTA_LOG_WGT_WIDTH=$(VTA_LOG_WGT_WIDTH) -DVTA_LOG_INP_WIDTH=$(VTA_LOG_INP_WIDTH) \
-	-DVTA_LOG_ACC_WIDTH=$(VTA_LOG_ACC_WIDTH) -DVTA_LOG_OUT_WIDTH=$(VTA_LOG_OUT_WIDTH) \
-	-DVTA_LOG_BATCH=$(VTA_LOG_BATCH) \
-	-DVTA_LOG_BLOCK_IN=$(VTA_LOG_BLOCK_IN) -DVTA_LOG_BLOCK_OUT=$(VTA_LOG_BLOCK_OUT) \
-	-DVTA_LOG_UOP_BUFF_SIZE=$(VTA_LOG_UOP_BUFF_SIZE) -DVTA_LOG_INP_BUFF_SIZE=$(VTA_LOG_INP_BUFF_SIZE) \
-	-DVTA_LOG_WGT_BUFF_SIZE=$(VTA_LOG_WGT_BUFF_SIZE) -DVTA_LOG_ACC_BUFF_SIZE=$(VTA_LOG_ACC_BUFF_SIZE) \
-	-DVTA_LOG_OUT_BUFF_SIZE=$(VTA_LOG_OUT_BUFF_SIZE)
--- a/vta/make/vta_config.py
+++ b/vta/make/vta_config.py
+"""VTA config tool"""
+import os
+import sys
+import json
+import argparse
+def get_pkg_config(cfg):
+    """Get the pkg config object.
+    Parameters
+    ----------
+    cfg : dict
+        The config dictionary handed to PkgConfig.
+    Returns
+    -------
+    pkg : PkgConfig
+        PkgConfig built from cfg and the project root, i.e. the parent
+        directory of the directory that holds this script.
+    """
+    curr_path = os.path.dirname(os.path.abspath(os.path.expanduser(__file__)))
+    proj_root = os.path.abspath(os.path.join(curr_path, "../"))
+    pkg_config_py = os.path.join(proj_root, "python/vta/pkg_config.py")
+    # pkg_config.py is executed by path in a private namespace rather than
+    # imported (presumably so the vta package itself need not be importable
+    # at build time -- confirm).
+    libpkg = {"__file__": pkg_config_py}
+    # Read through a context manager so the file handle is closed right away.
+    with open(pkg_config_py, "rb") as source_file:
+        source = source_file.read()
+    exec(compile(source, pkg_config_py, "exec"), libpkg, libpkg)
+    PkgConfig = libpkg["PkgConfig"]
+    return PkgConfig(cfg, proj_root)
+def main():
+    """Main function: print the requested parts of the VTA configuration.
+    The configuration is loaded from the first existing file among
+    <proj_root>/config.json and <proj_root>/make/config.json, where
+    proj_root is the parent directory of the directory holding this script.
+    Prints the help text and returns when called without any argument.
+    Raises
+    ------
+    RuntimeError
+        If none of the candidate config files exists.
+    """
+    parser = argparse.ArgumentParser()
+    parser.add_argument("--cflags", action="store_true",
+                        help="print the cflags")
+    # NOTE(review): --update is parsed but never read below; it is kept so
+    # that invocations passing it keep working.
+    parser.add_argument("--update", action="store_true",
+                        help="Print out the json option.")
+    parser.add_argument("--ldflags", action="store_true",
+                        help="print the ldflags")
+    parser.add_argument("--cfg-json", action="store_true",
+                        help="print all the config json")
+    parser.add_argument("--target", action="store_true",
+                        help="print the target")
+    args = parser.parse_args()
+    if len(sys.argv) == 1:
+        parser.print_help()
+        return
+    curr_path = os.path.dirname(
+        os.path.abspath(os.path.expanduser(__file__)))
+    proj_root = os.path.abspath(os.path.join(curr_path, "../"))
+    # Candidates in priority order: a config in the project root wins over
+    # the one under make/.
+    path_list = [
+        os.path.join(proj_root, "config.json"),
+        os.path.join(proj_root, "make/config.json")
+    ]
+    ok_path_list = [p for p in path_list if os.path.exists(p)]
+    if not ok_path_list:
+        raise RuntimeError("Cannot find config in %s" % str(path_list))
+    # Close the config file as soon as it has been parsed.
+    with open(ok_path_list[0]) as cfg_file:
+        cfg = json.load(cfg_file)
+    # The output width always mirrors the input width; a LOG_OUT_WIDTH value
+    # present in the file is overwritten here.
+    cfg["LOG_OUT_WIDTH"] = cfg["LOG_INP_WIDTH"]
+    pkg = get_pkg_config(cfg)
+    if args.target:
+        print(pkg.target)
+    if args.cflags:
+        print(" ".join(pkg.cflags))
+    if args.ldflags:
+        print(" ".join(pkg.ldflags))
+    if args.cfg_json:
+        print(pkg.cfg_json)
+if __name__ == "__main__":
+    main()
--- a/vta/python/vta/__init__.py
+++ b/vta/python/vta/__init__.py
 """TVM-based VTA Compiler Toolchain"""
 from __future__ import absolute_import as _abs
-import sys
 from .environment import get_env, Environment
+from . import arm_conv2d, vta_conv2d
+from .build_module import build_config, lower, build
+from .rpc_client import reconfig_runtime, program_fpga
 try:
-    # allow optional import in config mode.
-    from . import arm_conv2d, vta_conv2d
-    from .build_module import build_config, lower, build
-    from .rpc_client import reconfig_runtime, program_fpga
    from . import graph
 except (ImportError, RuntimeError):
    pass
--- a/vta/python/vta/environment.py
+++ b/vta/python/vta/environment.py
@@ -3,10 +3,11 @@
 from __future__ import absolute_import as _abs
 import os
-import glob
+import json
 import copy
 import tvm
 from . import intrin
+from .pkg_config import PkgConfig
 class DevContext(object):
@@ -61,45 +62,6 @@ class DevContext(object):
        return 1 if self.DEBUG_NO_SYNC else qid
-class PkgConfig(object):
-    """Simple package config tool for VTA.
-    This is used to provide runtime specific configurations.
-    """
-    def __init__(self, env):
-        curr_path = os.path.dirname(os.path.abspath(os.path.expanduser(__file__)))
-        proj_root = os.path.abspath(os.path.join(curr_path, "../../"))
-        # include path
-        self.include_path = [
-            "-I%s/include" % proj_root,
-            "-I%s/nnvm/tvm/include" % proj_root,
-            "-I%s/nnvm/tvm/dlpack/include" % proj_root,
-            "-I%s/nnvm/dmlc-core/include" % proj_root
-        ]
-        # List of source files that can be used to build standalone library.
-        self.lib_source = []
-        self.lib_source += glob.glob("%s/src/*.cc" % proj_root)
-        self.lib_source += glob.glob("%s/src/%s/*.cc" % (proj_root, env.TARGET))
-        # macro keys
-        self.macro_defs = []
-        for key in env.cfg_keys:
-            self.macro_defs.append("-DVTA_%s=%s" % (key, str(getattr(env, key))))
-        if env.TARGET == "pynq":
-            self.ldflags = [
-                "-L/usr/lib",
-                "-lsds_lib",
-                "-L/opt/python3.6/lib/python3.6/site-packages/pynq/drivers/",
-                "-L/opt/python3.6/lib/python3.6/site-packages/pynq/lib/",
-                "-l:libdma.so"]
-        else:
-            self.ldflags = []
-    @property
-    def cflags(self):
-        return self.include_path + self.macro_defs
 class Environment(object):
    """Hareware configuration object.
@@ -123,19 +85,6 @@ class Environment(object):
          env = vta.get_env()
    """
    current = None
-    cfg_keys = [
-        "TARGET",
-        "LOG_INP_WIDTH",
-        "LOG_WGT_WIDTH",
-        "LOG_ACC_WIDTH",
-        "LOG_BATCH",
-        "LOG_BLOCK_IN",
-        "LOG_BLOCK_OUT",
-        "LOG_UOP_BUFF_SIZE",
-        "LOG_INP_BUFF_SIZE",
-        "LOG_WGT_BUFF_SIZE",
-        "LOG_ACC_BUFF_SIZE",
-    ]
    # constants
    MAX_XFER = 1 << 22
    # debug flags
@@ -152,10 +101,9 @@ class Environment(object):
    def __init__(self, cfg):
        # Log of input/activation width in bits
        self.__dict__.update(cfg)
-        for key in self.cfg_keys:
+        for key in PkgConfig.cfg_keys:
            if key not in cfg:
                raise ValueError("Expect key %s in cfg" % key)
-        self.LOG_OUT_WIDTH = self.LOG_INP_WIDTH
        self.LOG_OUT_BUFF_SIZE = (
            self.LOG_ACC_BUFF_SIZE +
            self.LOG_OUT_WIDTH -
@@ -195,7 +143,12 @@ class Environment(object):
        self.mock_mode = False
        self._mock_env = None
        self._dev_ctx = None
-        self._pkg_config = None
+    def pkg_config(self):
+        """Create a PkgConfig for this environment.
+        Returns
+        -------
+        pkg : PkgConfig
+            Built from this object's attribute dictionary and the directory
+            two levels above the directory holding this file.
+        """
+        this_file = os.path.abspath(os.path.expanduser(__file__))
+        root_dir = os.path.abspath(
+            os.path.join(os.path.dirname(this_file), "../../"))
+        return PkgConfig(self.__dict__, root_dir)
    @property
    def dev(self):
@@ -205,13 +158,6 @@ class Environment(object):
        return self._dev_ctx
    @property
-    def pkg_config(self):
-        """PkgConfig instance"""
-        if self._pkg_config is None:
-            self._pkg_config = PkgConfig(self)
-        return self._pkg_config
-    @property
    def mock(self):
        """A mock version of the Environment
@@ -327,30 +273,19 @@ def coproc_dep_pop(op):
 def _init_env():
    """Iniitalize the default global env"""
-    python_vta_dir = os.path.dirname(__file__)
+    curr_path = os.path.dirname(
-    filename = os.path.join(python_vta_dir, '../../config.mk')
+        os.path.abspath(os.path.expanduser(__file__)))
-    keys = set()
+    proj_root = os.path.abspath(os.path.join(curr_path, "../../"))
+    # Candidate config files in priority order; the first existing one is used.
+    path_list = [
-    for k in Environment.cfg_keys:
+        os.path.join(curr_path, "config.json"),
-        keys.add("VTA_" + k)
+        os.path.join(proj_root, "config.json"),
+        os.path.join(proj_root, "make/config.json")
-    if not os.path.isfile(filename):
+    ]
+    # Keep the full candidate list intact so the error below can report
+    # every location that was searched.
+    ok_path_list = [p for p in path_list if os.path.exists(p)]
+    if not ok_path_list:
        raise RuntimeError(
-            "Error: {} not found.make sure you have config.mk in your vta root"
+            "Error: {} not found.make sure you have config.json in your vta root"
-            .format(filename))
+            .format(path_list))
+    # Close the config file as soon as it has been parsed.
+    with open(ok_path_list[0]) as cfg_file:
+        return Environment(json.load(cfg_file))
-    cfg = {}
-    with open(filename) as f:
-        for line in f:
-            for k in keys:
-                if k  +" =" in line:
-                    val = line.split("=")[1].strip()
-                    if k.startswith("VTA_"):
-                        k = k[4:]
-                    try:
-                        cfg[k] = int(val)
-                    except ValueError:
-                        cfg[k] = val
-    return Environment(cfg)
 Environment.current = _init_env()
--- a/vta/python/vta/exec/rpc_server.py
+++ b/vta/python/vta/exec/rpc_server.py
@@ -8,11 +8,13 @@ import logging
 import argparse
 import os
 import ctypes
+import json
 import tvm
 from tvm._ffi.base import c_str
 from tvm.contrib import rpc, cc
 from ..environment import get_env
+from ..pkg_config import PkgConfig
 @tvm.register_func("tvm.contrib.rpc.server.start", override=True)
@@ -21,8 +23,9 @@ def server_start():
    # pylint: disable=unused-variable
    curr_path = os.path.dirname(
        os.path.abspath(os.path.expanduser(__file__)))
-    dll_path = os.path.abspath(
+    proj_root = os.path.abspath(os.path.join(curr_path, "../../.."))
-        os.path.join(curr_path, "../../../lib/libvta.so"))
+    dll_path = os.path.abspath(os.path.join(proj_root, "lib/libvta.so"))
+    cfg_path = os.path.abspath(os.path.join(proj_root, "lib/libvta.so.json"))
    runtime_dll = []
    _load_module = tvm.get_global_func("tvm.contrib.rpc.server.load_module")
@@ -56,7 +59,7 @@ def server_start():
            runtime_dll.pop()
    @tvm.register_func("tvm.contrib.vta.reconfig_runtime", override=True)
-    def reconfig_runtime(cflags):
+    def reconfig_runtime(cfg_json):
        """Rebuild and reload runtime with new configuration.
        Parameters
@@ -66,16 +69,26 @@ def server_start():
        """
        if runtime_dll:
            raise RuntimeError("Can only reconfig in the beginning of session...")
-        cflags = cflags.split()
        env = get_env()
+        cfg = json.loads(cfg_json)
+        # The target always comes from the local environment, not the request.
+        cfg["TARGET"] = env.TARGET
+        pkg = PkgConfig(cfg, proj_root)
+        # check if the configuration is already the same
+        if os.path.isfile(cfg_path):
+            with open(cfg_path) as cfg_file:
+                old_cfg = json.load(cfg_file)
+            if pkg.same_config(old_cfg):
+                logging.info("Skip reconfiguration because runtime config is the same")
+                return
-        cflags += ["-O2", "-std=c++11"]
+        # cflags is no longer a parameter, so start a fresh list here.
+        cflags = ["-O2", "-std=c++11"]
-        cflags += env.pkg_config.include_path
+        cflags += pkg.cflags
-        ldflags = env.pkg_config.ldflags
+        ldflags = pkg.ldflags
        lib_name = dll_path
-        source = env.pkg_config.lib_source
+        # Take the sources from the same PkgConfig that supplies the flags.
+        source = pkg.lib_source
        logging.info("Rebuild runtime: output=%s, cflags=%s, source=%s, ldflags=%s",
                     dll_path, str(cflags), str(source), str(ldflags))
        cc.create_shared(lib_name, source, cflags + ldflags)
+        # pkg.cfg_json is already a serialized JSON string; write it verbatim
+        # so that json.load on this file yields a dict for same_config.
+        with open(cfg_path, "w") as outputfile:
+            outputfile.write(pkg.cfg_json)
 def main():

--- a/vta/python/vta/pkg_config.py
+++ b/vta/python/vta/pkg_config.py
+"""VTA Package configuration module
+This module is dependency free and can be used to configure package.
+"""
+from __future__ import absolute_import as _abs
+import json
+import glob
+class PkgConfig(object):
+    """Package configuration helper for VTA.
+    Derives include paths, macro definitions, linker flags and the list of
+    runtime source files from a configuration dictionary.
+    Parameters
+    ----------
+    cfg : dict
+        The config dictionary; every key listed in cfg_keys is read from it.
+    proj_root : str
+        Path to the project root
+    """
+    # Keys copied from cfg into cfg_dict and emitted as -DVTA_<key> macros.
+    cfg_keys = [
+        "TARGET",
+        "LOG_INP_WIDTH",
+        "LOG_WGT_WIDTH",
+        "LOG_ACC_WIDTH",
+        "LOG_OUT_WIDTH",
+        "LOG_BATCH",
+        "LOG_BLOCK_IN",
+        "LOG_BLOCK_OUT",
+        "LOG_UOP_BUFF_SIZE",
+        "LOG_INP_BUFF_SIZE",
+        "LOG_WGT_BUFF_SIZE",
+        "LOG_ACC_BUFF_SIZE",
+    ]
+    def __init__(self, cfg, proj_root):
+        self.target = cfg["TARGET"]
+        # Include directories, all relative to the project root.
+        include_dirs = (
+            "include",
+            "nnvm/tvm/include",
+            "nnvm/tvm/dlpack/include",
+            "nnvm/dmlc-core/include",
+        )
+        self.include_path = ["-I%s/%s" % (proj_root, d) for d in include_dirs]
+        # Sources for a standalone library: the common files plus the
+        # target specific ones.
+        common_src = glob.glob("%s/src/*.cc" % proj_root)
+        target_src = glob.glob("%s/src/%s/*.cc" % (proj_root, self.target))
+        self.lib_source = common_src + target_src
+        # One macro definition per config key, in cfg_keys order.
+        self.cfg_dict = {key: cfg[key] for key in self.cfg_keys}
+        self.macro_defs = [
+            "-DVTA_%s=%s" % (key, str(cfg[key])) for key in self.cfg_keys]
+        # Only the pynq target links against extra libraries.
+        pynq_ldflags = [
+            "-L/usr/lib",
+            "-lsds_lib",
+            "-L/opt/python3.6/lib/python3.6/site-packages/pynq/drivers/",
+            "-L/opt/python3.6/lib/python3.6/site-packages/pynq/lib/",
+            "-l:libdma.so"]
+        self.ldflags = pynq_ldflags if self.target == "pynq" else []
+    @property
+    def cflags(self):
+        """Include paths followed by the macro definitions."""
+        flags = list(self.include_path)
+        flags.extend(self.macro_defs)
+        return flags
+    @property
+    def cfg_json(self):
+        """The selected config entries serialized as an indented JSON string."""
+        return json.dumps(self.cfg_dict, indent=2)
+    def same_config(self, cfg):
+        """Check whether cfg agrees with the current config.
+        Parameters
+        ----------
+        cfg : dict
+            The configuration to compare against.
+        Returns
+        -------
+        equal : bool
+            True when every entry of the current config is present in cfg
+            with the same value; extra keys in cfg are ignored.
+        """
+        return not any(
+            key not in cfg or cfg[key] != value
+            for key, value in self.cfg_dict.items())
--- a/vta/python/vta/rpc_client.py
+++ b/vta/python/vta/rpc_client.py
@@ -12,23 +12,8 @@ def reconfig_runtime(remote):
        The TVM RPC session
    """
    env = get_env()
-    keys = ["VTA_LOG_WGT_WIDTH",
-            "VTA_LOG_INP_WIDTH",
-            "VTA_LOG_ACC_WIDTH",
-            "VTA_LOG_OUT_WIDTH",
-            "VTA_LOG_BATCH",
-            "VTA_LOG_BLOCK_IN",
-            "VTA_LOG_BLOCK_OUT",
-            "VTA_LOG_UOP_BUFF_SIZE",
-            "VTA_LOG_INP_BUFF_SIZE",
-            "VTA_LOG_WGT_BUFF_SIZE",
-            "VTA_LOG_ACC_BUFF_SIZE",
-            "VTA_LOG_OUT_BUFF_SIZE"]
-    cflags = []
-    for k in keys:
-        cflags += ["-D%s=%s" % (k, str(getattr(env, k[4:])))]
    freconfig = remote.get_function("tvm.contrib.vta.reconfig_runtime")
-    freconfig(" ".join(cflags))
+    freconfig(env.pkg_config().cfg_json)
 def program_fpga(remote, bitstream):

--- a/vta/src/sim/sim_driver.cc
+++ b/vta/src/sim/sim_driver.cc
@@ -109,9 +109,12 @@ class DRAM {
   * \return The true virtual address;
   */
  void* GetAddr(uint64_t phy_addr) {
+    CHECK_NE(phy_addr, 0)
+        << "trying to get address that is nullptr";
    std::lock_guard<std::mutex> lock(mutex_);
    uint64_t loc = (phy_addr >> kPageBits) - 1;
-    CHECK_LT(loc, ptable_.size());
+    CHECK_LT(loc, ptable_.size())
+        << "phy_addr=" << phy_addr;
    Page* p = ptable_[loc];
    CHECK(p != nullptr);
    size_t offset = (loc - p->ptable_begin) << kPageBits;
@@ -173,7 +176,7 @@ class DRAM {
 private:
  // The bits in page table
-  static constexpr vta_phy_addr_t kPageBits = 16;
+  static constexpr vta_phy_addr_t kPageBits = 12;
-  // page size, also the maximum allocable size 16 K
+  // page size, also the maximum allocable size 4 K
  static constexpr vta_phy_addr_t kPageSize = 1 << kPageBits;
  /*! \brief A page in the DRAM */
@@ -388,6 +391,7 @@ class Device {
  }
  void RunStore(const VTAMemInsn* op) {
+    if (op->x_size == 0) return;
    if (op->memory_type == VTA_MEM_ID_ACC ||
        op->memory_type == VTA_MEM_ID_UOP) {
      prof_->out_store_nbytes += (

--- a/vta/tests/python/pynq/test_benchmark_gemm.py
+++ b/vta/tests/python/pynq/test_benchmark_gemm.py
-import os
 import tvm
-import vta
 import numpy as np
-import time
+from tvm.contrib import util
-from tvm.contrib import rpc, util
+import vta.testing
-host = "pynq"
-port = 9091
-target = "llvm -target=armv7-none-linux-gnueabihf"
+def test_gemm():
-def test_gemm_packed(batch_size, channel, block):
+    def run_gemm_packed(env, remote, batch_size, channel, block):
-    env = vta.get_env()
        data_shape = (batch_size // env.BATCH,
                      channel // env.BLOCK_IN,
                      env.BATCH,
@@ -61,9 +55,9 @@ def test_gemm_packed(batch_size, channel, block):
                          name="res")
        def verify(s, check_correctness=True):
-        mod = vta.build(s, [data, weight, res], "ext_dev", target, name="gemm")
+            mod = vta.build(s, [data, weight, res],
+                            "ext_dev", env.target_host, name="gemm")
            temp = util.tempdir()
-        remote = rpc.connect(host, port)
            mod.save(temp.relpath("gemm.o"))
            remote.upload(temp.relpath("gemm.o"))
            f = remote.load_module("gemm.o")
@@ -156,6 +150,7 @@ def test_gemm_packed(batch_size, channel, block):
                s[res_max].pragma(s[res_max].op.axis[0], alu)
                s[res].pragma(s[res].op.axis[0], store_out)
            if print_ir:
                print(tvm.lower(s, [data, weight, res], simple_mode=True))
            return verify(s, check_correctness)
@@ -173,8 +168,6 @@ def test_gemm_packed(batch_size, channel, block):
            with vta.build_config():
                run_test("NORMAL", print_ir, True)
-        print("")
        def gevm_unittest(print_ir):
            mock = env.mock
            print("----- GEMM Unit Test-------")
@@ -187,7 +180,6 @@ def test_gemm_packed(batch_size, channel, block):
                print("\tTime cost = %g sec/op, %g GFLOPS" % (cost.mean, gops))
            with vta.build_config():
                run_test("NORMAL", print_ir)
-        print("")
        def alu_unittest(print_ir):
            mock = env.mock
@@ -249,18 +241,17 @@ def test_gemm_packed(batch_size, channel, block):
                run_test("NORMAL", print_ir)
            print("")
        gemm_normal(False)
        gevm_unittest(False)
        alu_unittest(False)
-    # FIXME: report time that is too short
-    # load_inp_unittest(False)
-    # load_wgt_unittest(False)
-    # store_out_unittest(False)
+    def _run(env, remote):
+        print("========GEMM 128=========")
+        run_gemm_packed(env, remote, 128, 128, 128)
-print("========GEMM 128=========")
+    vta.testing.run(_run)
-test_gemm_packed(128, 128, 128)
-# FIXME: hanging run
+if __name__ == "__main__":
-# print("========GEMM 1024========")
+    test_gemm()
-# test_gemm_packed(1024, 1024, 128)