Review comments addressed

apache · Jul 19, 2018 · a454b24 · a454b24
1 parent 6e5ba73
commit a454b24
Showing 1 changed file with 71 additions and 84 deletions.
diff --git a/tutorials/nnvm/nlp/from_darknet_rnn.py b/tutorials/nnvm/nlp/from_darknet_rnn.py
@@ -1,6 +1,8 @@
 """
 Compile Darknet Models for RNN
 ==============================
+**Author**: `Siju Samuel <https://siju-samuel.github.io/>`_
+
 This article is an introductory tutorial to deploy darknet rnn models with NNVM.
 
 This script will run a character prediction model
@@ -19,81 +21,55 @@
 by the script.
 """
 import random
-import os
-import sys
-import time
-import urllib
-import requests
 import numpy as np
-import urllib.request as urllib2
+from mxnet.gluon.utils import download
 import tvm
 from tvm.contrib import graph_runtime
 from nnvm.testing.darknet import __darknetffi__
 import nnvm
 import nnvm.frontend.darknet
 
-MODEL_NAME = 'rnn' #Model name
-seed = 'Thus' #Seed value
-num = 1000 #Number of characters to predict
+# Set the parameters
+# -----------------------
+# Set the seed value and the number of characters to predict
+
+# Model name
+MODEL_NAME = 'rnn'
+# Seed value
+seed = 'Thus'
+# Number of characters to predict
+num = 1000
 
+# Download required files
+# -----------------------
 # Download cfg and weights file if first time.
 CFG_NAME = MODEL_NAME + '.cfg'
 WEIGHTS_NAME = MODEL_NAME + '.weights'
 REPO_URL = 'https://github.com/dmlc/web-data/blob/master/darknet/'
 CFG_URL = REPO_URL + 'cfg/' + CFG_NAME + '?raw=true'
 WEIGHTS_URL = REPO_URL + 'weights/' + WEIGHTS_NAME + '?raw=true'
 
-def _dl_progress(count, block_size, total_size):
-    """Show the download progress."""
-    global start_time
-    if count == 0:
-        start_time = time.time()
-        return
-    duration = time.time() - start_time
-    progress_size = int(count * block_size)
-    speed = int(progress_size / (1024 * duration))
-    percent = int(count * block_size * 100 / total_size)
-    sys.stdout.write("\r...%d%%, %d MB, %d KB/s, %d seconds passed" %
-                     (percent, progress_size / (1024 * 1024), speed, duration))
-    sys.stdout.flush()
-
-def _download(url, path, overwrite=False, sizecompare=False):
-    """Downloads the file from the internet.
-    """
-    if os.path.isfile(path) and not overwrite:
-        if sizecompare:
-            file_size = os.path.getsize(path)
-            res_head = requests.head(url)
-            res_get = requests.get(url, stream=True)
-            if 'Content-Length' not in res_head.headers:
-                res_get = urllib2.urlopen(url)
-            url_file_size = int(res_get.headers['Content-Length'])
-            if url_file_size != file_size:
-                print("exist file got corrupted, downloading", path, " file freshly")
-                _download(url, path, True, False)
-                return
-        print('File {} exists, skip.'.format(path))
-        return
-    print('Downloading from url {} to {}'.format(url, path))
-    try:
-        urllib.request.urlretrieve(url, path, reporthook=_dl_progress)
-        print('')
-    except:
-        urllib.urlretrieve(url, path, reporthook=_dl_progress)
-
-_download(CFG_URL, CFG_NAME)
-_download(WEIGHTS_URL, WEIGHTS_NAME)
+download(CFG_URL, CFG_NAME)
+download(WEIGHTS_URL, WEIGHTS_NAME)
 
 # Download and Load darknet library
 DARKNET_LIB = 'libdarknet.so'
 DARKNET_URL = REPO_URL + 'lib/' + DARKNET_LIB + '?raw=true'
-_download(DARKNET_URL, DARKNET_LIB)
+download(DARKNET_URL, DARKNET_LIB)
 DARKNET_LIB = __darknetffi__.dlopen('./' + DARKNET_LIB)
 cfg = "./" + str(CFG_NAME)
 weights = "./" + str(WEIGHTS_NAME)
 net = DARKNET_LIB.load_network(cfg.encode('utf-8'), weights.encode('utf-8'), 0)
 dtype = 'float32'
 batch_size = 1
+
+# Import the graph to NNVM
+# ------------------------
+# Import darknet graph definition to nnvm.
+#
+# Results:
+#   sym: nnvm graph for rnn model
+#   params: params converted from darknet weights
 print("Converting darknet rnn model to nnvm symbols...")
 sym, params = nnvm.frontend.darknet.from_darknet(net, dtype)
 
@@ -110,45 +86,17 @@ def _download(url, path, overwrite=False, sizecompare=False):
 with nnvm.compiler.build_config(opt_level=2):
     graph, lib, params = nnvm.compiler.build(sym, target, shape_dict, dtype_dict, params)
 
-# Save the json
-def _save_lib():
-    '''Save the graph, params and .so to the current directory'''
-    print("Saving the compiled output...")
-    path_name = 'nnvm_darknet_' + MODEL_NAME
-    path_lib = path_name + '_deploy_lib.so'
-    lib.export_library(path_lib)
-    with open(path_name + "deploy_graph.json", "w") as fo:
-        fo.write(graph.json())
-    with open(path_name + "deploy_param.params", "wb") as fo:
-        fo.write(nnvm.compiler.save_param_dict(params))
-#_save_lib()
-
-# Execute on TVM
-ctx = tvm.cpu(0)
+# Execute the portable graph on TVM
+# ---------------------------------
+# Now we can try deploying the NNVM compiled model on cpu target.
 
+# Set the cpu context
+ctx = tvm.cpu(0)
 # Create graph runtime
 m = graph_runtime.create(graph, lib, ctx)
+# Set the params to runtime
 m.set_input(**params)
 
-print("RNN generaring text...")
-
-def _proc_rnn_output(out_data):
-    '''Generate the characters from the output array'''
-    sum_array = 0
-    n = out_data.size
-    r = random.uniform(0, 1)
-    for j in range(n):
-        if out_data[j] < .0001:
-            out_data[j] = 0
-        sum_array += out_data[j]
-
-    for j in range(n):
-        out_data[j] *= float(1.0) / sum_array
-        r = r - out_data[j]
-        if r <= 0:
-            return j
-    return n-1
-
 def _init_state_memory(rnn_cells_count, dtype):
     '''Initialize memory for states'''
     states = {}
@@ -171,26 +119,65 @@ def _get_state_output(runtime, states):
         states[state] = runtime.get_output((i), tvm.nd.empty(data.shape, data.dtype))
         i += 1
 
+def _proc_rnn_output(out_data):
+    '''Randomly pick the next character index, weighted by out_data (values < 0.0001 are dropped; out_data is modified in place)'''
+    sum_array = 0
+    n = out_data.size
+    r = random.uniform(0, 1)
+    for j in range(n):
+        if out_data[j] < 0.0001:
+            out_data[j] = 0
+        sum_array += out_data[j]
+
+    for j in range(n):
+        out_data[j] *= float(1.0) / sum_array
+        r = r - out_data[j]
+        if r <= 0:
+            return j
+    return n-1
+
+print("RNN generating text...")
+
 out_shape = (net.outputs,)
 rnn_cells_count = 3
 
+# Initialize state memory
+# -----------------------
 states = _init_state_memory(rnn_cells_count, dtype)
 
 len_seed = len(seed)
 count = len_seed + num
 out_txt = ""
+
+# Initialize random seed
 random.seed(0)
 c = ord(seed[0])
 inp_data = np.zeros([net.inputs], dtype)
+
+# Run the model
+# -------------
+
+# Feed the seed characters first, then predict character by character until `num` characters are generated
 for i in range(count):
     inp_data[c] = 1
+
+    # Set the input data
     m.set_input('data', tvm.nd.array(inp_data.astype(dtype)))
     inp_data[c] = 0
+
+    # Set the state inputs
     _set_state_input(m, states)
+
+    # Run the model
     m.run()
+
+    # Get the output
     tvm_out = m.get_output(0, tvm.nd.empty(out_shape, dtype)).asnumpy()
 
+    # Get the state outputs
     _get_state_output(m, states)
+
+    # Take the next seed character while priming, otherwise sample the predicted character, and buffer it
     c = ord(seed[i])  if i < len_seed else _proc_rnn_output(tvm_out)
     out_txt += chr(c)