From c24586064db8b6fcdcec0ef5e6ae67a62a0a2b0a Mon Sep 17 00:00:00 2001
From: kmader <kevinmader@4quant.com>
Date: Tue, 6 Sep 2016 21:46:34 +0200
Subject: [PATCH 1/4] change requirements to allow newer versions

---
 requirements.txt | 18 +++++++++---------
 1 file changed, 9 insertions(+), 9 deletions(-)

diff --git a/requirements.txt b/requirements.txt
index 5f3ff60..3620361 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -1,9 +1,9 @@
-h5py==2.6.0
-Keras==1.0.2
-numpy==1.11.0
-pydot-ng==1.0.0
-pyparsing==2.1.1
-PyYAML==3.11
-scipy==0.17.0
-six==1.10.0
-Theano==0.8.2
+h5py>=2.6.0
+Keras>=1.0.2
+numpy>=1.11.0
+pydot-ng>=1.0.0
+pyparsing>=2.1.1
+PyYAML>=3.11
+scipy>=0.17.0
+six>=1.10.0
+Theano>=0.8.2

From 8d400a8e8c564ef002199c37546aa14d13a9e34d Mon Sep 17 00:00:00 2001
From: kmader <kevinmader@4quant.com>
Date: Tue, 6 Sep 2016 21:52:45 +0200
Subject: [PATCH 2/4] first 3to2 run

---
 src/npi/__init__.py                 |   2 +-
 src/npi/add/__init__.py             |   2 +-
 src/npi/add/create_training_data.py |  19 ++--
 src/npi/add/lib.py                  |  91 +++++++++----------
 src/npi/add/model.py                | 135 ++++++++++++++--------------
 src/npi/add/test_model.py           |  14 +--
 src/npi/add/training_model.py       |  11 ++-
 src/npi/core.py                     |  53 +++++------
 src/npi/terminal_core.py            |  35 ++++----
 9 files changed, 189 insertions(+), 173 deletions(-)

diff --git a/src/npi/__init__.py b/src/npi/__init__.py
index b6cd2be..8a675c1 100644
--- a/src/npi/__init__.py
+++ b/src/npi/__init__.py
@@ -1,4 +1,4 @@
 #!/usr/bin/env python
 # coding: utf-8
 
-__author__ = 'k_morishita'
+__author__ = u'k_morishita'
diff --git a/src/npi/add/__init__.py b/src/npi/add/__init__.py
index b6cd2be..8a675c1 100644
--- a/src/npi/add/__init__.py
+++ b/src/npi/add/__init__.py
@@ -1,4 +1,4 @@
 #!/usr/bin/env python
 # coding: utf-8
 
-__author__ = 'k_morishita'
+__author__ = u'k_morishita'
diff --git a/src/npi/add/create_training_data.py b/src/npi/add/create_training_data.py
index aeab650..bf8326a 100644
--- a/src/npi/add/create_training_data.py
+++ b/src/npi/add/create_training_data.py
@@ -1,4 +1,6 @@
 # coding: utf-8
+from __future__ import with_statement
+from __future__ import absolute_import
 import os
 import curses
 import pickle
@@ -8,9 +10,10 @@
 from npi.add.lib import AdditionEnv, AdditionProgramSet, AdditionTeacher, create_char_map, create_questions, run_npi
 from npi.core import ResultLogger
 from npi.terminal_core import TerminalNPIRunner, Terminal
+from io import open
 
 
-def main(stdscr, filename: str, num: int, result_logger: ResultLogger):
+def main(stdscr, filename, num, result_logger):
     terminal = Terminal(stdscr, create_char_map())
     terminal.init_window(FIELD_WIDTH, FIELD_ROW)
     program_set = AdditionProgramSet()
@@ -25,24 +28,24 @@ def main(stdscr, filename: str, num: int, result_logger: ResultLogger):
         addition_env.reset()
         q = copy(data)
         run_npi(addition_env, npi_runner, program_set.ADD, data)
-        steps_list.append({"q": q, "steps": npi_runner.step_list})
+        steps_list.append({u"q": q, u"steps": npi_runner.step_list})
         result_logger.write(data)
         terminal.add_log(data)
 
     if filename:
-        with open(filename, 'wb') as f:
+        with open(filename, u'wb') as f:
             pickle.dump(steps_list, f, protocol=pickle.HIGHEST_PROTOCOL)
 
-if __name__ == '__main__':
+if __name__ == u'__main__':
     import sys
-    DEBUG_MODE = os.environ.get('DEBUG')
+    DEBUG_MODE = os.environ.get(u'DEBUG')
     if DEBUG_MODE:
         output_filename = None
         num_data = 3
-        log_filename = 'result.log'
+        log_filename = u'result.log'
     else:
         output_filename = sys.argv[1] if len(sys.argv) > 1 else None
         num_data = int(sys.argv[2]) if len(sys.argv) > 2 else 1000
-        log_filename = sys.argv[3] if len(sys.argv) > 3 else 'result.log'
+        log_filename = sys.argv[3] if len(sys.argv) > 3 else u'result.log'
     curses.wrapper(main, output_filename, num_data, ResultLogger(log_filename))
-    print("create %d training data" % num_data)
+    print u"create %d training data" % num_data
diff --git a/src/npi/add/lib.py b/src/npi/add/lib.py
index 5aa21de..8e491a3 100644
--- a/src/npi/add/lib.py
+++ b/src/npi/add/lib.py
@@ -1,4 +1,5 @@
 # coding: utf-8
+from __future__ import absolute_import
 from random import random
 
 import numpy as np
@@ -6,11 +7,11 @@
 from npi.core import Program, IntegerArguments, StepOutput, NPIStep, PG_CONTINUE, PG_RETURN
 from npi.terminal_core import Screen, Terminal
 
-__author__ = 'k_morishita'
+__author__ = u'k_morishita'
 
 
-class AdditionEnv:
-    """
+class AdditionEnv(object):
+    u"""
     Environment of Addition
     """
     def __init__(self, height, width, num_chars):
@@ -23,9 +24,9 @@ def reset(self):
         self.screen.fill(0)
         self.pointers = [self.screen.width-1] * self.screen.height  # rightmost
 
-    def get_observation(self) -> np.ndarray:
+    def get_observation(self):
         value = []
-        for row in range(len(self.pointers)):
+        for row in xrange(len(self.pointers)):
             value.append(self.to_one_hot(self.screen[row, self.pointers[row]]))
         return np.array(value)  # shape of FIELD_ROW * FIELD_DEPTH
 
@@ -34,13 +35,13 @@ def to_one_hot(self, ch):
         if 0 <= ch < self.num_chars:
             ret[ch] = 1
         else:
-            raise IndexError("ch must be 0 <= ch < %s, but %s" % (self.num_chars, ch))
+            raise IndexError(u"ch must be 0 <= ch < %s, but %s" % (self.num_chars, ch))
         return ret
 
     def setup_problem(self, num1, num2):
-        for i, s in enumerate(reversed("%s" % num1)):
+        for i, s in enumerate(reversed(u"%s" % num1)):
             self.screen[0, -(i+1)] = int(s) + 1
-        for i, s in enumerate(reversed("%s" % num2)):
+        for i, s in enumerate(reversed(u"%s" % num2)):
             self.screen[1, -(i+1)] = int(s) + 1
 
     def move_pointer(self, row, left_or_right):
@@ -53,11 +54,11 @@ def write(self, row, ch):
             self.screen[row, self.pointers[row]] = ch
 
     def get_output(self):
-        s = ""
+        s = u""
         for ch in self.screen[3]:
             if ch > 0:
-                s += "%s" % (ch-1)
-        return int(s or "0")
+                s += u"%s" % (ch-1)
+        return int(s or u"0")
 
 
 class MovePtrProgram(Program):
@@ -70,7 +71,7 @@ class MovePtrProgram(Program):
     TO_LEFT = 0
     TO_RIGHT = 1
 
-    def do(self, env: AdditionEnv, args: IntegerArguments):
+    def do(self, env, args):
         ptr_kind = args.decode_at(0)
         left_or_right = args.decode_at(1)
         env.move_pointer(ptr_kind, left_or_right)
@@ -81,21 +82,21 @@ class WriteProgram(Program):
     WRITE_TO_CARRY = 0
     WRITE_TO_OUTPUT = 1
 
-    def do(self, env: AdditionEnv, args: IntegerArguments):
+    def do(self, env, args):
         row = 2 if args.decode_at(0) == self.WRITE_TO_CARRY else 3
         digit = args.decode_at(1)
         env.write(row, digit+1)
 
 
-class AdditionProgramSet:
-    NOP = Program('NOP')
-    MOVE_PTR = MovePtrProgram('MOVE_PTR', 4, 2)  # PTR_KIND(4), LEFT_OR_RIGHT(2)
-    WRITE = WriteProgram('WRITE', 2, 10)       # CARRY_OR_OUT(2), DIGITS(10)
-    ADD = Program('ADD')
-    ADD1 = Program('ADD1')
-    CARRY = Program('CARRY')
-    LSHIFT = Program('LSHIFT')
-    RSHIFT = Program('RSHIFT')
+class AdditionProgramSet(object):
+    NOP = Program(u'NOP')
+    MOVE_PTR = MovePtrProgram(u'MOVE_PTR', 4, 2)  # PTR_KIND(4), LEFT_OR_RIGHT(2)
+    WRITE = WriteProgram(u'WRITE', 2, 10)       # CARRY_OR_OUT(2), DIGITS(10)
+    ADD = Program(u'ADD')
+    ADD1 = Program(u'ADD1')
+    CARRY = Program(u'CARRY')
+    LSHIFT = Program(u'LSHIFT')
+    RSHIFT = Program(u'RSHIFT')
 
     def __init__(self):
         self.map = {}
@@ -109,17 +110,17 @@ def __init__(self):
         self.register(self.LSHIFT)
         self.register(self.RSHIFT)
 
-    def register(self, pg: Program):
+    def register(self, pg):
         pg.program_id = self.program_id
         self.map[pg.program_id] = pg
         self.program_id += 1
 
-    def get(self, i: int):
+    def get(self, i):
         return self.map.get(i)
 
 
 class AdditionTeacher(NPIStep):
-    def __init__(self, program_set: AdditionProgramSet):
+    def __init__(self, program_set):
         self.pg_set = program_set
         self.step_queue = None
         self.step_queue_stack = []
@@ -141,7 +142,7 @@ def register_subprogram(self, pg, method):
         self.sub_program[pg.program_id] = method
 
     @staticmethod
-    def decode_params(env_observation: np.ndarray, arguments: IntegerArguments):
+    def decode_params(env_observation, arguments):
         return env_observation.argmax(axis=1), arguments.decode_all()
 
     def enter_function(self):
@@ -151,7 +152,7 @@ def enter_function(self):
     def exit_function(self):
         self.step_queue = self.step_queue_stack.pop()
 
-    def step(self, env_observation: np.ndarray, pg: Program, arguments: IntegerArguments) -> StepOutput:
+    def step(self, env_observation, pg, arguments):
         if not self.step_queue:
             self.step_queue = self.sub_program[pg.program_id](env_observation, arguments)
         if self.step_queue:
@@ -162,17 +163,17 @@ def step(self, env_observation: np.ndarray, pg: Program, arguments: IntegerArgum
         return ret
 
     @staticmethod
-    def convert_for_step_return(step_values: tuple) -> StepOutput:
+    def convert_for_step_return(step_values):
         if len(step_values) == 2:
             return StepOutput(PG_CONTINUE, step_values[0], IntegerArguments(step_values[1]))
         else:
             return StepOutput(step_values[0], step_values[1], IntegerArguments(step_values[2]))
 
     @staticmethod
-    def pg_primitive(env_observation: np.ndarray, arguments: IntegerArguments):
+    def pg_primitive(env_observation, arguments):
         return None
 
-    def pg_add(self, env_observation: np.ndarray, arguments: IntegerArguments):
+    def pg_add(self, env_observation, arguments):
         ret = []
         (in1, in2, carry, output), (a1, a2, a3) = self.decode_params(env_observation, arguments)
         if in1 == 0 and in2 == 0 and carry == 0:
@@ -181,7 +182,7 @@ def pg_add(self, env_observation: np.ndarray, arguments: IntegerArguments):
         ret.append((self.pg_set.LSHIFT, None))
         return ret
 
-    def pg_add1(self, env_observation: np.ndarray, arguments: IntegerArguments):
+    def pg_add1(self, env_observation, arguments):
         ret = []
         p = self.pg_set
         (in1, in2, carry, output), (a1, a2, a3) = self.decode_params(env_observation, arguments)
@@ -200,7 +201,7 @@ def sum_ch_list(ch_list):
                 ret += ch - 1
         return ret
 
-    def pg_carry(self, env_observation: np.ndarray, arguments: IntegerArguments):
+    def pg_carry(self, env_observation, arguments):
         ret = []
         p = self.pg_set
         ret.append((p.MOVE_PTR, (p.MOVE_PTR.PTR_CARRY, p.MOVE_PTR.TO_LEFT)))
@@ -208,7 +209,7 @@ def pg_carry(self, env_observation: np.ndarray, arguments: IntegerArguments):
         ret.append((PG_RETURN, p.MOVE_PTR, (p.MOVE_PTR.PTR_CARRY, p.MOVE_PTR.TO_RIGHT)))
         return ret
 
-    def pg_lshift(self, env_observation: np.ndarray, arguments: IntegerArguments):
+    def pg_lshift(self, env_observation, arguments):
         ret = []
         p = self.pg_set
         ret.append((p.MOVE_PTR, (p.MOVE_PTR.PTR_IN1, p.MOVE_PTR.TO_LEFT)))
@@ -217,7 +218,7 @@ def pg_lshift(self, env_observation: np.ndarray, arguments: IntegerArguments):
         ret.append((PG_RETURN, p.MOVE_PTR, (p.MOVE_PTR.PTR_OUT, p.MOVE_PTR.TO_LEFT)))
         return ret
 
-    def pg_rshift(self, env_observation: np.ndarray, arguments: IntegerArguments):
+    def pg_rshift(self, env_observation, arguments):
         ret = []
         p = self.pg_set
         ret.append((p.MOVE_PTR, (p.MOVE_PTR.PTR_IN1, p.MOVE_PTR.TO_RIGHT)))
@@ -228,21 +229,21 @@ def pg_rshift(self, env_observation: np.ndarray, arguments: IntegerArguments):
 
 
 def create_char_map():
-    char_map = dict((i+1, "%s" % i) for i in range(10))
-    char_map[0] = ' '
+    char_map = dict((i+1, u"%s" % i) for i in xrange(10))
+    char_map[0] = u' '
     return char_map
 
 
 def create_questions(num=100, max_number=10000):
     questions = []
-    for in1 in range(10):
-        for in2 in range(10):
+    for in1 in xrange(10):
+        for in2 in xrange(10):
             questions.append(dict(in1=in1, in2=in2))
 
-    for _ in range(100):
+    for _ in xrange(100):
         questions.append(dict(in1=int(random() * 100), in2=int(random() * 100)))
 
-    for _ in range(100):
+    for _ in xrange(100):
         questions.append(dict(in1=int(random() * 1000), in2=int(random() * 1000)))
 
     questions += [
@@ -255,19 +256,19 @@ def create_questions(num=100, max_number=10000):
 
 def create_random_questions(num=100, max_number=10000):
     questions = []
-    for _ in range(num):
+    for _ in xrange(num):
         questions.append(dict(in1=int(random() * max_number), in2=int(random() * max_number)))
     return questions
 
 
 def run_npi(addition_env, npi_runner, program, data):
-    data['expect'] = data['in1'] + data['in2']
+    data[u'expect'] = data[u'in1'] + data[u'in2']
 
-    addition_env.setup_problem(data['in1'], data['in2'])
+    addition_env.setup_problem(data[u'in1'], data[u'in2'])
 
     npi_runner.reset()
     npi_runner.display_env(addition_env, force=True)
     npi_runner.npi_program_interface(addition_env, program, IntegerArguments())
 
-    data['result'] = addition_env.get_output()
-    data['correct'] = data['result'] == data['expect']
+    data[u'result'] = addition_env.get_output()
+    data[u'correct'] = data[u'result'] == data[u'expect']
diff --git a/src/npi/add/model.py b/src/npi/add/model.py
index 42a8e4c..794d2ff 100644
--- a/src/npi/add/model.py
+++ b/src/npi/add/model.py
@@ -1,5 +1,7 @@
 #!/usr/bin/env python
 # coding: utf-8
+from __future__ import division
+from __future__ import absolute_import
 import os
 from collections import Counter
 from copy import copy
@@ -22,15 +24,16 @@
 from npi.core import NPIStep, Program, IntegerArguments, StepOutput, RuntimeSystem, PG_RETURN, StepInOut, StepInput, \
     to_one_hot_array
 from npi.terminal_core import TerminalNPIRunner
+from itertools import izip
 
-__author__ = 'k_morishita'
+__author__ = u'k_morishita'
 
 
 class AdditionNPIModel(NPIStep):
     model = None
     f_enc = None
 
-    def __init__(self, system: RuntimeSystem, model_path: str=None, program_set: AdditionProgramSet=None):
+    def __init__(self, system, model_path=None, program_set=None):
         self.system = system
         self.model_path = model_path
         self.program_set = program_set
@@ -42,58 +45,58 @@ def __init__(self, system: RuntimeSystem, model_path: str=None, program_set: Add
     def build(self):
         enc_size = self.size_of_env_observation()
         argument_size = IntegerArguments.size_of_arguments
-        input_enc = InputLayer(batch_input_shape=(self.batch_size, enc_size), name='input_enc')
-        input_arg = InputLayer(batch_input_shape=(self.batch_size, argument_size), name='input_arg')
+        input_enc = InputLayer(batch_input_shape=(self.batch_size, enc_size), name=u'input_enc')
+        input_arg = InputLayer(batch_input_shape=(self.batch_size, argument_size), name=u'input_arg')
         input_prg = Embedding(input_dim=PROGRAM_VEC_SIZE, output_dim=PROGRAM_KEY_VEC_SIZE, input_length=1,
                               batch_input_shape=(self.batch_size, 1))
 
-        f_enc = Sequential(name='f_enc')
-        f_enc.add(Merge([input_enc, input_arg], mode='concat'))
+        f_enc = Sequential(name=u'f_enc')
+        f_enc.add(Merge([input_enc, input_arg], mode=u'concat'))
         f_enc.add(MaxoutDense(128, nb_feature=4))
         self.f_enc = f_enc
 
-        program_embedding = Sequential(name='program_embedding')
+        program_embedding = Sequential(name=u'program_embedding')
         program_embedding.add(input_prg)
 
-        f_enc_convert = Sequential(name='f_enc_convert')
+        f_enc_convert = Sequential(name=u'f_enc_convert')
         f_enc_convert.add(f_enc)
         f_enc_convert.add(RepeatVector(1))
 
-        f_lstm = Sequential(name='f_lstm')
-        f_lstm.add(Merge([f_enc_convert, program_embedding], mode='concat'))
+        f_lstm = Sequential(name=u'f_lstm')
+        f_lstm.add(Merge([f_enc_convert, program_embedding], mode=u'concat'))
         f_lstm.add(LSTM(256, return_sequences=False, stateful=True, W_regularizer=l2(0.0000001)))
-        f_lstm.add(Activation('relu', name='relu_lstm_1'))
+        f_lstm.add(Activation(u'relu', name=u'relu_lstm_1'))
         f_lstm.add(RepeatVector(1))
         f_lstm.add(LSTM(256, return_sequences=False, stateful=True, W_regularizer=l2(0.0000001)))
-        f_lstm.add(Activation('relu', name='relu_lstm_2'))
+        f_lstm.add(Activation(u'relu', name=u'relu_lstm_2'))
         # plot(f_lstm, to_file='f_lstm.png', show_shapes=True)
 
-        f_end = Sequential(name='f_end')
+        f_end = Sequential(name=u'f_end')
         f_end.add(f_lstm)
         f_end.add(Dense(1, W_regularizer=l2(0.001)))
-        f_end.add(Activation('sigmoid', name='sigmoid_end'))
+        f_end.add(Activation(u'sigmoid', name=u'sigmoid_end'))
 
-        f_prog = Sequential(name='f_prog')
+        f_prog = Sequential(name=u'f_prog')
         f_prog.add(f_lstm)
-        f_prog.add(Dense(PROGRAM_KEY_VEC_SIZE, activation="relu"))
+        f_prog.add(Dense(PROGRAM_KEY_VEC_SIZE, activation=u"relu"))
         f_prog.add(Dense(PROGRAM_VEC_SIZE, W_regularizer=l2(0.0001)))
-        f_prog.add(Activation('softmax', name='softmax_prog'))
+        f_prog.add(Activation(u'softmax', name=u'softmax_prog'))
         # plot(f_prog, to_file='f_prog.png', show_shapes=True)
 
         f_args = []
-        for ai in range(1, IntegerArguments.max_arg_num+1):
-            f_arg = Sequential(name='f_arg%s' % ai)
+        for ai in xrange(1, IntegerArguments.max_arg_num+1):
+            f_arg = Sequential(name=u'f_arg%s' % ai)
             f_arg.add(f_lstm)
             f_arg.add(Dense(IntegerArguments.depth, W_regularizer=l2(0.0001)))
-            f_arg.add(Activation('softmax', name='softmax_arg%s' % ai))
+            f_arg.add(Activation(u'softmax', name=u'softmax_arg%s' % ai))
             f_args.append(f_arg)
         # plot(f_arg, to_file='f_arg.png', show_shapes=True)
 
         self.model = Model([input_enc.input, input_arg.input, input_prg.input],
                            [f_end.output, f_prog.output] + [fa.output for fa in f_args],
-                           name="npi")
+                           name=u"npi")
         self.compile_model()
-        plot(self.model, to_file='model.png', show_shapes=True)
+        plot(self.model, to_file=u'model.png', show_shapes=True)
 
     def reset(self):
         super(AdditionNPIModel, self).reset()
@@ -104,11 +107,11 @@ def reset(self):
     def compile_model(self, lr=0.0001, arg_weight=1.):
         arg_num = IntegerArguments.max_arg_num
         optimizer = Adam(lr=lr)
-        loss = ['binary_crossentropy', 'categorical_crossentropy'] + ['categorical_crossentropy'] * arg_num
+        loss = [u'binary_crossentropy', u'categorical_crossentropy'] + [u'categorical_crossentropy'] * arg_num
         self.model.compile(optimizer=optimizer, loss=loss, loss_weights=[0.25, 0.25] + [arg_weight] * arg_num)
 
     def fit(self, steps_list, epoch=3000):
-        """
+        u"""
 
         :param int epoch:
         :param typing.List[typing.Dict[q=dict, steps=typing.List[StepInOut]]] steps_list:
@@ -118,8 +121,8 @@ def fit(self, steps_list, epoch=3000):
         def filter_question(condition_func):
             sub_steps_list = []
             for steps_dict in steps_list:
-                question = steps_dict['q']
-                if condition_func(question['in1'], question['in2']):
+                question = steps_dict[u'q']
+                if condition_func(question[u'in1'], question[u'in2']):
                     sub_steps_list.append(steps_dict)
             return sub_steps_list
 
@@ -148,18 +151,18 @@ def filter_question(condition_func):
         # all_ok = self.fit_to_subset(filter_question(lambda a, b: a < 10 and b < 10), pass_rate=pr)
         # print("%s is pass_rate >= %s: %s" % (q_type, pr, all_ok))
 
-        q_type = "training questions of a<100 and b<100"
-        print(q_type)
+        q_type = u"training questions of a<100 and b<100"
+        print q_type
         pr = 0.8
         all_ok = self.fit_to_subset(filter_question(lambda a, b: a < 100 and b < 100), pass_rate=pr)
-        print("%s is pass_rate >= %s: %s" % (q_type, pr, all_ok))
+        print u"%s is pass_rate >= %s: %s" % (q_type, pr, all_ok)
 
         while True:
             if self.test_and_learn([10, 100, 1000]):
                 break
 
-            q_type = "training questions of ALL"
-            print(q_type)
+            q_type = u"training questions of ALL"
+            print q_type
 
             q_num = 100
             skip_correct = False
@@ -168,10 +171,10 @@ def filter_question(condition_func):
             np.random.shuffle(questions)
             questions = questions[:q_num]
             all_ok = self.fit_to_subset(questions, pass_rate=pr, skip_correct=skip_correct)
-            print("%s is pass_rate >= %s: %s" % (q_type, pr, all_ok))
+            print u"%s is pass_rate >= %s: %s" % (q_type, pr, all_ok)
 
     def fit_to_subset(self, steps_list, pass_rate=1.0, skip_correct=False):
-        for i in range(10):
+        for i in xrange(10):
             all_ok = self.do_learn(steps_list, 100, pass_rate=pass_rate, skip_correct=skip_correct)
             if all_ok:
                 return True
@@ -179,10 +182,10 @@ def fit_to_subset(self, steps_list, pass_rate=1.0, skip_correct=False):
 
     def test_and_learn(self, num_questions):
         for num in num_questions:
-            print("test all type of %d questions" % num)
+            print u"test all type of %d questions" % num
             cc, wc, wrong_questions = self.test_to_subset(create_random_questions(num))
             acc_rate = cc/(cc+wc)
-            print("Accuracy %s(OK=%d, NG=%d)" % (acc_rate, cc, wc))
+            print u"Accuracy %s(OK=%d, NG=%d)" % (acc_rate, cc, wc)
             if wc > 0:
                 self.fit_to_subset(wrong_questions, pass_rate=1.0, skip_correct=False)
                 return False
@@ -201,13 +204,13 @@ def test_to_subset(self, questions):
                 correct_count += 1
             else:
                 self.question_test(addition_env, teacher_runner, question)
-                wrong_steps_list.append({"q": question, "steps": teacher_runner.step_list})
+                wrong_steps_list.append({u"q": question, u"steps": teacher_runner.step_list})
                 wrong_count += 1
         return correct_count, wrong_count, wrong_steps_list
 
     @staticmethod
     def dict_to_str(d):
-        return str(tuple([(k, d[k]) for k in sorted(d)]))
+        return unicode(tuple([(k, d[k]) for k in sorted(d)]))
 
     def do_learn(self, steps_list, epoch, pass_rate=1.0, skip_correct=False):
         addition_env = AdditionEnv(FIELD_ROW, FIELD_WIDTH, FIELD_DEPTH)
@@ -216,19 +219,19 @@ def do_learn(self, steps_list, epoch, pass_rate=1.0, skip_correct=False):
         correct_count = Counter()
         no_change_count = 0
         last_loss = 1000
-        for ep in range(1, epoch+1):
+        for ep in xrange(1, epoch+1):
             correct_new = wrong_new = 0
             losses = []
             ok_rate = []
             np.random.shuffle(steps_list)
             for idx, steps_dict in enumerate(steps_list):
-                question = copy(steps_dict['q'])
+                question = copy(steps_dict[u'q'])
                 question_key = self.dict_to_str(question)
                 if self.question_test(addition_env, npi_runner, question):
                     if correct_count[question_key] == 0:
                         correct_new += 1
                     correct_count[question_key] += 1
-                    print("GOOD!: ep=%2d idx=%3d :%s CorrectCount=%s" % (ep, idx, self.dict_to_str(question), correct_count[question_key]))
+                    print u"GOOD!: ep=%2d idx=%3d :%s CorrectCount=%s" % (ep, idx, self.dict_to_str(question), correct_count[question_key])
                     ok_rate.append(1)
                     cc = correct_count[question_key]
                     if skip_correct or int(math.sqrt(cc)) ** 2 != cc:
@@ -236,11 +239,11 @@ def do_learn(self, steps_list, epoch, pass_rate=1.0, skip_correct=False):
                 else:
                     ok_rate.append(0)
                     if correct_count[question_key] > 0:
-                        print("Degraded: ep=%2d idx=%3d :%s CorrectCount=%s -> 0" % (ep, idx, self.dict_to_str(question), correct_count[question_key]))
+                        print u"Degraded: ep=%2d idx=%3d :%s CorrectCount=%s -> 0" % (ep, idx, self.dict_to_str(question), correct_count[question_key])
                         correct_count[question_key] = 0
                         wrong_new += 1
 
-                steps = steps_dict['steps']
+                steps = steps_dict[u'steps']
                 xs = []
                 ys = []
                 ws = []
@@ -252,18 +255,18 @@ def do_learn(self, steps_list, epoch, pass_rate=1.0, skip_correct=False):
 
                 self.reset()
 
-                for i, (x, y, w) in enumerate(zip(xs, ys, ws)):
+                for i, (x, y, w) in enumerate(izip(xs, ys, ws)):
                     loss = self.model.train_on_batch(x, y, sample_weight=w)
                     if not np.isfinite(loss):
-                        print("Loss is not finite!, Last Input=%s" % ([i, (x, y, w)]))
+                        print u"Loss is not finite!, Last Input=%s" % ([i, (x, y, w)])
                         self.print_weights(last_weights, detail=True)
-                        raise RuntimeError("Loss is not finite!")
+                        raise RuntimeError(u"Loss is not finite!")
                     losses.append(loss)
                     last_weights = self.model.get_weights()
             if losses:
                 cur_loss = np.average(losses)
-                print("ep=%2d: ok_rate=%.2f%% (+%s -%s): ave loss %s (%s samples)" %
-                      (ep, np.average(ok_rate)*100, correct_new, wrong_new, cur_loss, len(steps_list)))
+                print(u"ep=%2d: ok_rate=%.2f%% (+%s -%s): ave loss %s (%s samples)" %
+                      (ep, np.average(ok_rate)*100, correct_new, wrong_new, cur_loss, len(steps_list)))
                 # self.print_weights()
                 if correct_new + wrong_new == 0:
                     no_change_count += 1
@@ -271,39 +274,39 @@ def do_learn(self, steps_list, epoch, pass_rate=1.0, skip_correct=False):
                     no_change_count = 0
 
                 if math.fabs(1 - cur_loss/last_loss) < 0.001 and no_change_count > 5:
-                    print("math.fabs(1 - cur_loss/last_loss) < 0.001 and no_change_count > 5:")
+                    print u"math.fabs(1 - cur_loss/last_loss) < 0.001 and no_change_count > 5:"
                     return False
                 last_loss = cur_loss
-                print("=" * 80)
+                print u"=" * 80
             self.save()
             if np.average(ok_rate) >= pass_rate:
                 return True
         return False
 
     def update_learning_rate(self, learning_rate, arg_weight=1.):
-        print("Re-Compile Model lr=%s aw=%s" % (learning_rate, arg_weight))
+        print u"Re-Compile Model lr=%s aw=%s" % (learning_rate, arg_weight)
         self.compile_model(learning_rate, arg_weight=arg_weight)
 
     def train_f_enc(self, steps_list, epoch=50):
-        print("training f_enc")
-        f_add0 = Sequential(name='f_add0')
+        print u"training f_enc"
+        f_add0 = Sequential(name=u'f_add0')
         f_add0.add(self.f_enc)
         f_add0.add(Dense(FIELD_DEPTH))
-        f_add0.add(Activation('softmax', name='softmax_add0'))
+        f_add0.add(Activation(u'softmax', name=u'softmax_add0'))
 
-        f_add1 = Sequential(name='f_add1')
+        f_add1 = Sequential(name=u'f_add1')
         f_add1.add(self.f_enc)
         f_add1.add(Dense(FIELD_DEPTH))
-        f_add1.add(Activation('softmax', name='softmax_add1'))
+        f_add1.add(Activation(u'softmax', name=u'softmax_add1'))
 
-        env_model = Model(self.f_enc.inputs, [f_add0.output, f_add1.output], name="env_model")
-        env_model.compile(optimizer='adam', loss=['categorical_crossentropy']*2)
+        env_model = Model(self.f_enc.inputs, [f_add0.output, f_add1.output], name=u"env_model")
+        env_model.compile(optimizer=u'adam', loss=[u'categorical_crossentropy']*2)
 
-        for ep in range(epoch):
+        for ep in xrange(epoch):
             losses = []
             for idx, steps_dict in enumerate(steps_list):
                 prev = None
-                for step in steps_dict['steps']:
+                for step in steps_dict[u'steps']:
                     x = self.convert_input(step.input)[:2]
                     env_values = step.input.env.reshape((4, -1))
                     in1 = np.clip(env_values[0].argmax() - 1, 0, 9)
@@ -319,7 +322,7 @@ def train_f_enc(self, steps_list, epoch=50):
                     y = [yy.reshape((self.batch_size, -1)) for yy in [y0, y1]]
                     loss = env_model.train_on_batch(x, y)
                     losses.append(loss)
-            print("ep %3d: loss=%s" % (ep, np.average(losses)))
+            print u"ep %3d: loss=%s" % (ep, np.average(losses))
             if np.average(losses) < 1e-06:
                 break
 
@@ -328,18 +331,18 @@ def question_test(self, addition_env, npi_runner, question):
         self.reset()
         try:
             run_npi(addition_env, npi_runner, self.program_set.ADD, question)
-            if question['correct']:
+            if question[u'correct']:
                 return True
         except StopIteration:
             pass
         return False
 
-    def convert_input(self, p_in: StepInput):
+    def convert_input(self, p_in):
         x_pg = np.array((p_in.program.program_id,))
         x = [xx.reshape((self.batch_size, -1)) for xx in (p_in.env, p_in.arguments.values, x_pg)]
         return x
 
-    def convert_output(self, p_out: StepOutput):
+    def convert_output(self, p_out):
         y = [np.array((p_out.r,))]
         weights = [[1.]]
         if p_out.program:
@@ -359,7 +362,7 @@ def convert_output(self, p_out: StepOutput):
         weights = [np.array(w) for w in weights]
         return [yy.reshape((self.batch_size, -1)) for yy in y], weights
 
-    def step(self, env_observation: np.ndarray, pg: Program, arguments: IntegerArguments) -> StepOutput:
+    def step(self, env_observation, pg, arguments):
         x = self.convert_input(StepInput(env_observation, pg, arguments))
         results = self.model.predict(x, batch_size=1)  # if batch_size==1, returns single row
 
@@ -379,10 +382,10 @@ def load_weights(self):
     def print_weights(self, weights=None, detail=False):
         weights = weights or self.model.get_weights()
         for w in weights:
-            print("w%s: sum(w)=%s, ave(w)=%s" % (w.shape, np.sum(w), np.average(w)))
+            print u"w%s: sum(w)=%s, ave(w)=%s" % (w.shape, np.sum(w), np.average(w))
         if detail:
             for w in weights:
-                print("%s: %s" % (w.shape, w))
+                print u"%s: %s" % (w.shape, w)
 
     @staticmethod
     def size_of_env_observation():
diff --git a/src/npi/add/test_model.py b/src/npi/add/test_model.py
index c456c4c..ad9eb3a 100644
--- a/src/npi/add/test_model.py
+++ b/src/npi/add/test_model.py
@@ -1,4 +1,6 @@
 # coding: utf-8
+from __future__ import division
+from __future__ import absolute_import
 import curses
 import os
 import pickle
@@ -10,7 +12,7 @@
 from npi.terminal_core import TerminalNPIRunner, Terminal
 
 
-def main(stdscr, model_path: str, num: int, result_logger: ResultLogger):
+def main(stdscr, model_path, num, result_logger):
     terminal = Terminal(stdscr, create_char_map())
     terminal.init_window(FIELD_WIDTH, FIELD_ROW)
     program_set = AdditionProgramSet()
@@ -29,18 +31,18 @@ def main(stdscr, model_path: str, num: int, result_logger: ResultLogger):
         run_npi(addition_env, npi_runner, program_set.ADD, data)
         result_logger.write(data)
         terminal.add_log(data)
-        if data['correct']:
+        if data[u'correct']:
             correct_count += 1
         else:
             wrong_count += 1
     return correct_count, wrong_count
 
 
-if __name__ == '__main__':
+if __name__ == u'__main__':
     import sys
-    DEBUG_MODE = os.environ.get('DEBUG')
+    DEBUG_MODE = os.environ.get(u'DEBUG')
     model_path_ = sys.argv[1]
     num_data = int(sys.argv[2]) if len(sys.argv) > 2 else 1000
-    log_filename = sys.argv[3] if len(sys.argv) > 3 else 'result.log'
+    log_filename = sys.argv[3] if len(sys.argv) > 3 else u'result.log'
     cc, wc = curses.wrapper(main, model_path_, num_data, ResultLogger(log_filename))
-    print("Accuracy %s(OK=%d, NG=%d)" % (cc/(cc+wc), cc, wc))
+    print u"Accuracy %s(OK=%d, NG=%d)" % (cc/(cc+wc), cc, wc)
diff --git a/src/npi/add/training_model.py b/src/npi/add/training_model.py
index 6fdf8cb..3bb64c7 100644
--- a/src/npi/add/training_model.py
+++ b/src/npi/add/training_model.py
@@ -1,4 +1,6 @@
 # coding: utf-8
+from __future__ import with_statement
+from __future__ import absolute_import
 import os
 import pickle
 
@@ -7,22 +9,23 @@
 from npi.add.model import AdditionNPIModel
 from npi.core import ResultLogger, RuntimeSystem
 from npi.terminal_core import TerminalNPIRunner, Terminal
+from io import open
 
 
-def main(filename: str, model_path: str):
+def main(filename, model_path):
     system = RuntimeSystem()
     program_set = AdditionProgramSet()
 
-    with open(filename, 'rb') as f:
+    with open(filename, u'rb') as f:
         steps_list = pickle.load(f)
 
     npi_model = AdditionNPIModel(system, model_path, program_set)
     npi_model.fit(steps_list)
 
 
-if __name__ == '__main__':
+if __name__ == u'__main__':
     import sys
-    DEBUG_MODE = os.environ.get('DEBUG')
+    DEBUG_MODE = os.environ.get(u'DEBUG')
     train_filename = sys.argv[1]
     model_output = sys.argv[2]
     main(train_filename, model_output)
diff --git a/src/npi/core.py b/src/npi/core.py
index 3d63a13..c418de0 100644
--- a/src/npi/core.py
+++ b/src/npi/core.py
@@ -1,9 +1,12 @@
 # coding: utf-8
 
+from __future__ import with_statement
+from __future__ import absolute_import
 import json
 from copy import copy
 
 import numpy as np
+from io import open
 
 MAX_ARG_NUM = 3
 ARG_DEPTH = 10   # 0~9 digit. one-hot.
@@ -12,12 +15,12 @@
 PG_RETURN = 1
 
 
-class IntegerArguments:
+class IntegerArguments(object):
     depth = ARG_DEPTH
     max_arg_num = MAX_ARG_NUM
     size_of_arguments = depth * max_arg_num
 
-    def __init__(self, args: list=None, values: np.ndarray=None):
+    def __init__(self, args=None, values=None):
         if values is not None:
             self.values = values.reshape((self.max_arg_num, self.depth))
         else:
@@ -33,20 +36,20 @@ def copy(self):
         return obj
 
     def decode_all(self):
-        return [self.decode_at(i) for i in range(len(self.values))]
+        return [self.decode_at(i) for i in xrange(len(self.values))]
 
-    def decode_at(self, index: int) -> int:
+    def decode_at(self, index):
         return self.values[index].argmax()
 
-    def update_to(self, index: int, integer: int):
+    def update_to(self, index, integer):
         self.values[index] = 0
         self.values[index, int(np.clip(integer, 0, self.depth-1))] = 1
 
     def __str__(self):
-        return "<IA: %s>" % self.decode_all()
+        return u"<IA: %s>" % self.decode_all()
 
 
-class Program:
+class Program(object):
     output_to_env = False
 
     def __init__(self, name, *args):
@@ -54,56 +57,56 @@ def __init__(self, name, *args):
         self.args = args
         self.program_id = None
 
-    def description_with_args(self, args: IntegerArguments) -> str:
+    def description_with_args(self, args):
         int_args = args.decode_all()
-        return "%s(%s)" % (self.name, ", ".join([str(x) for x in int_args]))
+        return u"%s(%s)" % (self.name, u", ".join([unicode(x) for x in int_args]))
 
     def to_one_hot(self, size, dtype=np.float):
         ret = np.zeros((size,), dtype=dtype)
         ret[self.program_id] = 1
         return ret
 
-    def do(self, env, args: IntegerArguments):
+    def do(self, env, args):
         raise NotImplementedError()
 
     def __str__(self):
-        return "<Program: name=%s>" % self.name
+        return u"<Program: name=%s>" % self.name
 
 
-class StepInput:
-    def __init__(self, env: np.ndarray, program: Program, arguments: IntegerArguments):
+class StepInput(object):
+    def __init__(self, env, program, arguments):
         self.env = env
         self.program = program
         self.arguments = arguments
 
 
-class StepOutput:
-    def __init__(self, r: float, program: Program=None, arguments: IntegerArguments=None):
+class StepOutput(object):
+    def __init__(self, r, program=None, arguments=None):
         self.r = r
         self.program = program
         self.arguments = arguments
 
     def __str__(self):
-        return "<StepOutput: r=%s pg=%s arg=%s>" % (self.r, self.program, self.arguments)
+        return u"<StepOutput: r=%s pg=%s arg=%s>" % (self.r, self.program, self.arguments)
 
 
-class StepInOut:
-    def __init__(self, input: StepInput, output: StepOutput):
+class StepInOut(object):
+    def __init__(self, input, output):
         self.input = input
         self.output = output
 
 
-class ResultLogger:
+class ResultLogger(object):
     def __init__(self, filename):
         self.filename = filename
 
     def write(self, obj):
-        with open(self.filename, "a") as f:
+        with open(self.filename, u"a") as f:
             json.dump(obj, f)
-            f.write("\n")
+            f.write(u"\n")
 
 
-class NPIStep:
+class NPIStep(object):
     def reset(self):
         pass
 
@@ -113,11 +116,11 @@ def enter_function(self):
     def exit_function(self):
         pass
 
-    def step(self, env_observation: np.ndarray, pg: Program, arguments: IntegerArguments) -> StepOutput:
+    def step(self, env_observation, pg, arguments):
         raise NotImplementedError()
 
 
-class RuntimeSystem:
+class RuntimeSystem(object):
     def __init__(self, terminal=None):
         self.terminal = terminal
 
@@ -125,7 +128,7 @@ def logging(self, message):
         if self.terminal:
             self.terminal.add_log(message)
         else:
-            print(message)
+            print message
 
 
 def to_one_hot_array(idx, size, dtype=np.int8):
diff --git a/src/npi/terminal_core.py b/src/npi/terminal_core.py
index 670fdbf..c65e408 100644
--- a/src/npi/terminal_core.py
+++ b/src/npi/terminal_core.py
@@ -1,14 +1,15 @@
 #!/usr/bin/env python
 # coding: utf-8
+from __future__ import absolute_import
 import curses
 import numpy as np
 
 from npi.core import Program, IntegerArguments, NPIStep, StepOutput, StepInput, StepInOut
 
-__author__ = 'k_morishita'
+__author__ = u'k_morishita'
 
 
-class Screen:
+class Screen(object):
     data = None
 
     def __init__(self, height, width):
@@ -32,7 +33,7 @@ def __getitem__(self, item):
         return self.data[item]
 
 
-class Terminal:
+class Terminal(object):
     W_TOP = 1
     W_LEFT = 1
     LOG_WINDOW_HEIGHT = 10
@@ -45,9 +46,9 @@ class Terminal:
     log_window = None
 
     def __init__(self, stdscr, char_map=None):
-        print(type(stdscr))
+        print type(stdscr)
         self.stdscr = stdscr
-        self.char_map = char_map or dict((ch, chr(ch)) for ch in range(128))
+        self.char_map = char_map or dict((ch, unichr(ch)) for ch in xrange(128))
         self.log_list = []
 
     def init_window(self, width, height):
@@ -69,8 +70,8 @@ def wait_for_key(self):
         self.stdscr.getch()
 
     def update_main_screen(self, screen):
-        for y in range(screen.height):
-            line = "".join([self.char_map[ch] for ch in screen[y]])
+        for y in xrange(screen.height):
+            line = u"".join([self.char_map[ch] for ch in screen[y]])
             self.ignore_error_add_str(self.main_window, y, 0, line)
 
     def update_main_window_attr(self, screen, y, x, attr):
@@ -87,17 +88,17 @@ def update_info_screen(self, info_list):
         self.info_window.refresh()
 
     def add_log(self, line):
-        self.log_list.insert(0, str(line)[:self.LOG_WINDOW_WIDTH])
+        self.log_list.insert(0, unicode(line)[:self.LOG_WINDOW_WIDTH])
         self.log_list = self.log_list[:self.LOG_WINDOW_HEIGHT-1]
         self.log_window.clear()
         for i, line in enumerate(self.log_list):
-            line = str(line) + " " * (self.LOG_WINDOW_WIDTH - len(str(line)))
+            line = unicode(line) + u" " * (self.LOG_WINDOW_WIDTH - len(unicode(line)))
             self.log_window.addstr(i, 0, line)
         self.log_window.refresh()
 
     @staticmethod
     def ignore_error_add_str(win, y, x, s, attr=curses.A_NORMAL):
-        """一番右下に書き込むと例外が飛んでくるけど、漢は黙って無視するのがお作法らしい？"""
+        u"""一番右下に書き込むと例外が飛んでくるけど、漢は黙って無視するのがお作法らしい？"""
         try:
             win.addstr(y, x, s, attr)
         except curses.error:
@@ -111,8 +112,8 @@ def show_env_to_terminal(terminal, env):
     terminal.refresh_main_window()
 
 
-class TerminalNPIRunner:
-    def __init__(self, terminal: Terminal, model: NPIStep=None, recording=True, max_depth=10, max_step=1000):
+class TerminalNPIRunner(object):
+    def __init__(self, terminal, model=None, recording=True, max_depth=10, max_step=1000):
         self.terminal = terminal
         self.model = model
         self.steps = 0
@@ -132,19 +133,19 @@ def display_env(self, env, force=False):
         if (self.verbose or force) and self.terminal:
             show_env_to_terminal(self.terminal, env)
 
-    def display_information(self, program: Program, arguments: IntegerArguments, result: StepOutput, depth: int):
+    def display_information(self, program, arguments, result, depth):
         if self.verbose and self.terminal:
             information = [
-                "Step %2d Depth: %2d" % (self.steps, depth),
+                u"Step %2d Depth: %2d" % (self.steps, depth),
                 program.description_with_args(arguments),
-                'r=%.2f' % result.r,
+                u'r=%.2f' % result.r,
             ]
             if result.program:
-                information.append("-> %s" % result.program.description_with_args(result.arguments))
+                information.append(u"-> %s" % result.program.description_with_args(result.arguments))
             self.terminal.update_info_screen(information)
             self.wait()
 
-    def npi_program_interface(self, env, program: Program, arguments: IntegerArguments, depth=0):
+    def npi_program_interface(self, env, program, arguments, depth=0):
         if self.max_depth < depth or self.max_step < self.steps:
             raise StopIteration()
 

From f2921cb92d49920ac48d54b0211219d631bde217 Mon Sep 17 00:00:00 2001
From: kmader <kevinmader@4quant.com>
Date: Tue, 6 Sep 2016 22:32:47 +0200
Subject: [PATCH 3/4] fixing unicode text

---
 src/npi/__init__.py                 |   2 +-
 src/npi/add/__init__.py             |   2 +-
 src/npi/add/create_training_data.py |  14 ++--
 src/npi/add/lib.py                  |  44 ++++++------
 src/npi/add/model.py                | 106 ++++++++++++++--------------
 src/npi/add/test_model.py           |  10 +--
 src/npi/add/training_model.py       |   6 +-
 src/npi/core.py                     |  15 ++--
 src/npi/terminal_core.py            |  14 ++--
 9 files changed, 107 insertions(+), 106 deletions(-)

diff --git a/src/npi/__init__.py b/src/npi/__init__.py
index 8a675c1..b6cd2be 100644
--- a/src/npi/__init__.py
+++ b/src/npi/__init__.py
@@ -1,4 +1,4 @@
 #!/usr/bin/env python
 # coding: utf-8
 
-__author__ = u'k_morishita'
+__author__ = 'k_morishita'
diff --git a/src/npi/add/__init__.py b/src/npi/add/__init__.py
index 8a675c1..b6cd2be 100644
--- a/src/npi/add/__init__.py
+++ b/src/npi/add/__init__.py
@@ -1,4 +1,4 @@
 #!/usr/bin/env python
 # coding: utf-8
 
-__author__ = u'k_morishita'
+__author__ = 'k_morishita'
diff --git a/src/npi/add/create_training_data.py b/src/npi/add/create_training_data.py
index bf8326a..08d7143 100644
--- a/src/npi/add/create_training_data.py
+++ b/src/npi/add/create_training_data.py
@@ -28,24 +28,24 @@ def main(stdscr, filename, num, result_logger):
         addition_env.reset()
         q = copy(data)
         run_npi(addition_env, npi_runner, program_set.ADD, data)
-        steps_list.append({u"q": q, u"steps": npi_runner.step_list})
+        steps_list.append({"q": q, "steps": npi_runner.step_list})
         result_logger.write(data)
         terminal.add_log(data)
 
     if filename:
-        with open(filename, u'wb') as f:
+        with open(filename, 'wb') as f:
             pickle.dump(steps_list, f, protocol=pickle.HIGHEST_PROTOCOL)
 
-if __name__ == u'__main__':
+if __name__ == '__main__':
     import sys
-    DEBUG_MODE = os.environ.get(u'DEBUG')
+    DEBUG_MODE = os.environ.get('DEBUG')
     if DEBUG_MODE:
         output_filename = None
         num_data = 3
-        log_filename = u'result.log'
+        log_filename = 'result.log'
     else:
         output_filename = sys.argv[1] if len(sys.argv) > 1 else None
         num_data = int(sys.argv[2]) if len(sys.argv) > 2 else 1000
-        log_filename = sys.argv[3] if len(sys.argv) > 3 else u'result.log'
+        log_filename = sys.argv[3] if len(sys.argv) > 3 else 'result.log'
     curses.wrapper(main, output_filename, num_data, ResultLogger(log_filename))
-    print u"create %d training data" % num_data
+    print "create %d training data" % num_data
diff --git a/src/npi/add/lib.py b/src/npi/add/lib.py
index 8e491a3..5f083fe 100644
--- a/src/npi/add/lib.py
+++ b/src/npi/add/lib.py
@@ -7,11 +7,11 @@
 from npi.core import Program, IntegerArguments, StepOutput, NPIStep, PG_CONTINUE, PG_RETURN
 from npi.terminal_core import Screen, Terminal
 
-__author__ = u'k_morishita'
+__author__ = 'k_morishita'
 
 
 class AdditionEnv(object):
-    u"""
+    """
     Environment of Addition
     """
     def __init__(self, height, width, num_chars):
@@ -35,13 +35,13 @@ def to_one_hot(self, ch):
         if 0 <= ch < self.num_chars:
             ret[ch] = 1
         else:
-            raise IndexError(u"ch must be 0 <= ch < %s, but %s" % (self.num_chars, ch))
+            raise IndexError("ch must be 0 <= ch < %s, but %s" % (self.num_chars, ch))
         return ret
 
     def setup_problem(self, num1, num2):
-        for i, s in enumerate(reversed(u"%s" % num1)):
+        for i, s in enumerate(reversed("%s" % num1)):
             self.screen[0, -(i+1)] = int(s) + 1
-        for i, s in enumerate(reversed(u"%s" % num2)):
+        for i, s in enumerate(reversed("%s" % num2)):
             self.screen[1, -(i+1)] = int(s) + 1
 
     def move_pointer(self, row, left_or_right):
@@ -54,11 +54,11 @@ def write(self, row, ch):
             self.screen[row, self.pointers[row]] = ch
 
     def get_output(self):
-        s = u""
+        s = ""
         for ch in self.screen[3]:
             if ch > 0:
-                s += u"%s" % (ch-1)
-        return int(s or u"0")
+                s += "%s" % (ch-1)
+        return int(s or "0")
 
 
 class MovePtrProgram(Program):
@@ -89,14 +89,14 @@ def do(self, env, args):
 
 
 class AdditionProgramSet(object):
-    NOP = Program(u'NOP')
-    MOVE_PTR = MovePtrProgram(u'MOVE_PTR', 4, 2)  # PTR_KIND(4), LEFT_OR_RIGHT(2)
-    WRITE = WriteProgram(u'WRITE', 2, 10)       # CARRY_OR_OUT(2), DIGITS(10)
-    ADD = Program(u'ADD')
-    ADD1 = Program(u'ADD1')
-    CARRY = Program(u'CARRY')
-    LSHIFT = Program(u'LSHIFT')
-    RSHIFT = Program(u'RSHIFT')
+    NOP = Program('NOP')
+    MOVE_PTR = MovePtrProgram('MOVE_PTR', 4, 2)  # PTR_KIND(4), LEFT_OR_RIGHT(2)
+    WRITE = WriteProgram('WRITE', 2, 10)       # CARRY_OR_OUT(2), DIGITS(10)
+    ADD = Program('ADD')
+    ADD1 = Program('ADD1')
+    CARRY = Program('CARRY')
+    LSHIFT = Program('LSHIFT')
+    RSHIFT = Program('RSHIFT')
 
     def __init__(self):
         self.map = {}
@@ -229,8 +229,8 @@ def pg_rshift(self, env_observation, arguments):
 
 
 def create_char_map():
-    char_map = dict((i+1, u"%s" % i) for i in xrange(10))
-    char_map[0] = u' '
+    char_map = dict((i+1, "%s" % i) for i in xrange(10))
+    char_map[0] = ' '
     return char_map
 
 
@@ -262,13 +262,13 @@ def create_random_questions(num=100, max_number=10000):
 
 
 def run_npi(addition_env, npi_runner, program, data):
-    data[u'expect'] = data[u'in1'] + data[u'in2']
+    data['expect'] = data['in1'] + data['in2']
 
-    addition_env.setup_problem(data[u'in1'], data[u'in2'])
+    addition_env.setup_problem(data['in1'], data['in2'])
 
     npi_runner.reset()
     npi_runner.display_env(addition_env, force=True)
     npi_runner.npi_program_interface(addition_env, program, IntegerArguments())
 
-    data[u'result'] = addition_env.get_output()
-    data[u'correct'] = data[u'result'] == data[u'expect']
+    data['result'] = addition_env.get_output()
+    data['correct'] = data['result'] == data['expect']
diff --git a/src/npi/add/model.py b/src/npi/add/model.py
index 794d2ff..32e70bd 100644
--- a/src/npi/add/model.py
+++ b/src/npi/add/model.py
@@ -26,7 +26,7 @@
 from npi.terminal_core import TerminalNPIRunner
 from itertools import izip
 
-__author__ = u'k_morishita'
+__author__ = 'k_morishita'
 
 
 class AdditionNPIModel(NPIStep):
@@ -45,58 +45,58 @@ def __init__(self, system, model_path=None, program_set=None):
     def build(self):
         enc_size = self.size_of_env_observation()
         argument_size = IntegerArguments.size_of_arguments
-        input_enc = InputLayer(batch_input_shape=(self.batch_size, enc_size), name=u'input_enc')
-        input_arg = InputLayer(batch_input_shape=(self.batch_size, argument_size), name=u'input_arg')
+        input_enc = InputLayer(batch_input_shape=(self.batch_size, enc_size), name='input_enc')
+        input_arg = InputLayer(batch_input_shape=(self.batch_size, argument_size), name='input_arg')
         input_prg = Embedding(input_dim=PROGRAM_VEC_SIZE, output_dim=PROGRAM_KEY_VEC_SIZE, input_length=1,
                               batch_input_shape=(self.batch_size, 1))
 
-        f_enc = Sequential(name=u'f_enc')
-        f_enc.add(Merge([input_enc, input_arg], mode=u'concat'))
+        f_enc = Sequential(name='f_enc')
+        f_enc.add(Merge([input_enc, input_arg], mode='concat'))
         f_enc.add(MaxoutDense(128, nb_feature=4))
         self.f_enc = f_enc
 
-        program_embedding = Sequential(name=u'program_embedding')
+        program_embedding = Sequential(name='program_embedding')
         program_embedding.add(input_prg)
 
-        f_enc_convert = Sequential(name=u'f_enc_convert')
+        f_enc_convert = Sequential(name='f_enc_convert')
         f_enc_convert.add(f_enc)
         f_enc_convert.add(RepeatVector(1))
 
-        f_lstm = Sequential(name=u'f_lstm')
-        f_lstm.add(Merge([f_enc_convert, program_embedding], mode=u'concat'))
+        f_lstm = Sequential(name='f_lstm')
+        f_lstm.add(Merge([f_enc_convert, program_embedding], mode='concat'))
         f_lstm.add(LSTM(256, return_sequences=False, stateful=True, W_regularizer=l2(0.0000001)))
-        f_lstm.add(Activation(u'relu', name=u'relu_lstm_1'))
+        f_lstm.add(Activation('relu', name='relu_lstm_1'))
         f_lstm.add(RepeatVector(1))
         f_lstm.add(LSTM(256, return_sequences=False, stateful=True, W_regularizer=l2(0.0000001)))
-        f_lstm.add(Activation(u'relu', name=u'relu_lstm_2'))
+        f_lstm.add(Activation('relu', name='relu_lstm_2'))
         # plot(f_lstm, to_file='f_lstm.png', show_shapes=True)
 
-        f_end = Sequential(name=u'f_end')
+        f_end = Sequential(name='f_end')
         f_end.add(f_lstm)
         f_end.add(Dense(1, W_regularizer=l2(0.001)))
-        f_end.add(Activation(u'sigmoid', name=u'sigmoid_end'))
+        f_end.add(Activation('sigmoid', name='sigmoid_end'))
 
-        f_prog = Sequential(name=u'f_prog')
+        f_prog = Sequential(name='f_prog')
         f_prog.add(f_lstm)
-        f_prog.add(Dense(PROGRAM_KEY_VEC_SIZE, activation=u"relu"))
+        f_prog.add(Dense(PROGRAM_KEY_VEC_SIZE, activation="relu"))
         f_prog.add(Dense(PROGRAM_VEC_SIZE, W_regularizer=l2(0.0001)))
-        f_prog.add(Activation(u'softmax', name=u'softmax_prog'))
+        f_prog.add(Activation('softmax', name='softmax_prog'))
         # plot(f_prog, to_file='f_prog.png', show_shapes=True)
 
         f_args = []
         for ai in xrange(1, IntegerArguments.max_arg_num+1):
-            f_arg = Sequential(name=u'f_arg%s' % ai)
+            f_arg = Sequential(name='f_arg%s' % ai)
             f_arg.add(f_lstm)
             f_arg.add(Dense(IntegerArguments.depth, W_regularizer=l2(0.0001)))
-            f_arg.add(Activation(u'softmax', name=u'softmax_arg%s' % ai))
+            f_arg.add(Activation('softmax', name='softmax_arg%s' % ai))
             f_args.append(f_arg)
         # plot(f_arg, to_file='f_arg.png', show_shapes=True)
 
         self.model = Model([input_enc.input, input_arg.input, input_prg.input],
                            [f_end.output, f_prog.output] + [fa.output for fa in f_args],
-                           name=u"npi")
+                           name="npi")
         self.compile_model()
-        plot(self.model, to_file=u'model.png', show_shapes=True)
+        plot(self.model, to_file='model.png', show_shapes=True)
 
     def reset(self):
         super(AdditionNPIModel, self).reset()
@@ -107,11 +107,11 @@ def reset(self):
     def compile_model(self, lr=0.0001, arg_weight=1.):
         arg_num = IntegerArguments.max_arg_num
         optimizer = Adam(lr=lr)
-        loss = [u'binary_crossentropy', u'categorical_crossentropy'] + [u'categorical_crossentropy'] * arg_num
+        loss = ['binary_crossentropy', 'categorical_crossentropy'] + ['categorical_crossentropy'] * arg_num
         self.model.compile(optimizer=optimizer, loss=loss, loss_weights=[0.25, 0.25] + [arg_weight] * arg_num)
 
     def fit(self, steps_list, epoch=3000):
-        u"""
+        """
 
         :param int epoch:
         :param typing.List[typing.Dict[q=dict, steps=typing.List[StepInOut]]] steps_list:
@@ -121,8 +121,8 @@ def fit(self, steps_list, epoch=3000):
         def filter_question(condition_func):
             sub_steps_list = []
             for steps_dict in steps_list:
-                question = steps_dict[u'q']
-                if condition_func(question[u'in1'], question[u'in2']):
+                question = steps_dict['q']
+                if condition_func(question['in1'], question['in2']):
                     sub_steps_list.append(steps_dict)
             return sub_steps_list
 
@@ -151,17 +151,17 @@ def filter_question(condition_func):
         # all_ok = self.fit_to_subset(filter_question(lambda a, b: a < 10 and b < 10), pass_rate=pr)
         # print("%s is pass_rate >= %s: %s" % (q_type, pr, all_ok))
 
-        q_type = u"training questions of a<100 and b<100"
+        q_type = "training questions of a<100 and b<100"
         print q_type
         pr = 0.8
         all_ok = self.fit_to_subset(filter_question(lambda a, b: a < 100 and b < 100), pass_rate=pr)
-        print u"%s is pass_rate >= %s: %s" % (q_type, pr, all_ok)
+        print "%s is pass_rate >= %s: %s" % (q_type, pr, all_ok)
 
         while True:
             if self.test_and_learn([10, 100, 1000]):
                 break
 
-            q_type = u"training questions of ALL"
+            q_type = "training questions of ALL"
             print q_type
 
             q_num = 100
@@ -171,7 +171,7 @@ def filter_question(condition_func):
             np.random.shuffle(questions)
             questions = questions[:q_num]
             all_ok = self.fit_to_subset(questions, pass_rate=pr, skip_correct=skip_correct)
-            print u"%s is pass_rate >= %s: %s" % (q_type, pr, all_ok)
+            print "%s is pass_rate >= %s: %s" % (q_type, pr, all_ok)
 
     def fit_to_subset(self, steps_list, pass_rate=1.0, skip_correct=False):
         for i in xrange(10):
@@ -182,10 +182,10 @@ def fit_to_subset(self, steps_list, pass_rate=1.0, skip_correct=False):
 
     def test_and_learn(self, num_questions):
         for num in num_questions:
-            print u"test all type of %d questions" % num
+            print "test all type of %d questions" % num
             cc, wc, wrong_questions = self.test_to_subset(create_random_questions(num))
             acc_rate = cc/(cc+wc)
-            print u"Accuracy %s(OK=%d, NG=%d)" % (acc_rate, cc, wc)
+            print "Accuracy %s(OK=%d, NG=%d)" % (acc_rate, cc, wc)
             if wc > 0:
                 self.fit_to_subset(wrong_questions, pass_rate=1.0, skip_correct=False)
                 return False
@@ -204,7 +204,7 @@ def test_to_subset(self, questions):
                 correct_count += 1
             else:
                 self.question_test(addition_env, teacher_runner, question)
-                wrong_steps_list.append({u"q": question, u"steps": teacher_runner.step_list})
+                wrong_steps_list.append({"q": question, "steps": teacher_runner.step_list})
                 wrong_count += 1
         return correct_count, wrong_count, wrong_steps_list
 
@@ -225,13 +225,13 @@ def do_learn(self, steps_list, epoch, pass_rate=1.0, skip_correct=False):
             ok_rate = []
             np.random.shuffle(steps_list)
             for idx, steps_dict in enumerate(steps_list):
-                question = copy(steps_dict[u'q'])
+                question = copy(steps_dict['q'])
                 question_key = self.dict_to_str(question)
                 if self.question_test(addition_env, npi_runner, question):
                     if correct_count[question_key] == 0:
                         correct_new += 1
                     correct_count[question_key] += 1
-                    print u"GOOD!: ep=%2d idx=%3d :%s CorrectCount=%s" % (ep, idx, self.dict_to_str(question), correct_count[question_key])
+                    print "GOOD!: ep=%2d idx=%3d :%s CorrectCount=%s" % (ep, idx, self.dict_to_str(question), correct_count[question_key])
                     ok_rate.append(1)
                     cc = correct_count[question_key]
                     if skip_correct or int(math.sqrt(cc)) ** 2 != cc:
@@ -239,11 +239,11 @@ def do_learn(self, steps_list, epoch, pass_rate=1.0, skip_correct=False):
                 else:
                     ok_rate.append(0)
                     if correct_count[question_key] > 0:
-                        print u"Degraded: ep=%2d idx=%3d :%s CorrectCount=%s -> 0" % (ep, idx, self.dict_to_str(question), correct_count[question_key])
+                        print "Degraded: ep=%2d idx=%3d :%s CorrectCount=%s -> 0" % (ep, idx, self.dict_to_str(question), correct_count[question_key])
                         correct_count[question_key] = 0
                         wrong_new += 1
 
-                steps = steps_dict[u'steps']
+                steps = steps_dict['steps']
                 xs = []
                 ys = []
                 ws = []
@@ -258,14 +258,14 @@ def do_learn(self, steps_list, epoch, pass_rate=1.0, skip_correct=False):
                 for i, (x, y, w) in enumerate(izip(xs, ys, ws)):
                     loss = self.model.train_on_batch(x, y, sample_weight=w)
                     if not np.isfinite(loss):
-                        print u"Loss is not finite!, Last Input=%s" % ([i, (x, y, w)])
+                        print "Loss is not finite!, Last Input=%s" % ([i, (x, y, w)])
                         self.print_weights(last_weights, detail=True)
-                        raise RuntimeError(u"Loss is not finite!")
+                        raise RuntimeError("Loss is not finite!")
                     losses.append(loss)
                     last_weights = self.model.get_weights()
             if losses:
                 cur_loss = np.average(losses)
-                print u"ep=%2d: ok_rate=%.2f%% (+%s -%s): ave loss %s (%s samples)" %
+                print "ep=%2d: ok_rate=%.2f%% (+%s -%s): ave loss %s (%s samples)" % \
                       (ep, np.average(ok_rate)*100, correct_new, wrong_new, cur_loss, len(steps_list))
                 # self.print_weights()
                 if correct_new + wrong_new == 0:
@@ -274,39 +274,39 @@ def do_learn(self, steps_list, epoch, pass_rate=1.0, skip_correct=False):
                     no_change_count = 0
 
                 if math.fabs(1 - cur_loss/last_loss) < 0.001 and no_change_count > 5:
-                    print u"math.fabs(1 - cur_loss/last_loss) < 0.001 and no_change_count > 5:"
+                    print "math.fabs(1 - cur_loss/last_loss) < 0.001 and no_change_count > 5:"
                     return False
                 last_loss = cur_loss
-                print u"=" * 80
+                print "=" * 80
             self.save()
             if np.average(ok_rate) >= pass_rate:
                 return True
         return False
 
     def update_learning_rate(self, learning_rate, arg_weight=1.):
-        print u"Re-Compile Model lr=%s aw=%s" % (learning_rate, arg_weight)
+        print "Re-Compile Model lr=%s aw=%s" % (learning_rate, arg_weight)
         self.compile_model(learning_rate, arg_weight=arg_weight)
 
     def train_f_enc(self, steps_list, epoch=50):
-        print u"training f_enc"
-        f_add0 = Sequential(name=u'f_add0')
+        print "training f_enc"
+        f_add0 = Sequential(name='f_add0')
         f_add0.add(self.f_enc)
         f_add0.add(Dense(FIELD_DEPTH))
-        f_add0.add(Activation(u'softmax', name=u'softmax_add0'))
+        f_add0.add(Activation('softmax', name='softmax_add0'))
 
-        f_add1 = Sequential(name=u'f_add1')
+        f_add1 = Sequential(name='f_add1')
         f_add1.add(self.f_enc)
         f_add1.add(Dense(FIELD_DEPTH))
-        f_add1.add(Activation(u'softmax', name=u'softmax_add1'))
+        f_add1.add(Activation('softmax', name='softmax_add1'))
 
-        env_model = Model(self.f_enc.inputs, [f_add0.output, f_add1.output], name=u"env_model")
-        env_model.compile(optimizer=u'adam', loss=[u'categorical_crossentropy']*2)
+        env_model = Model(self.f_enc.inputs, [f_add0.output, f_add1.output], name="env_model")
+        env_model.compile(optimizer='adam', loss=['categorical_crossentropy']*2)
 
         for ep in xrange(epoch):
             losses = []
             for idx, steps_dict in enumerate(steps_list):
                 prev = None
-                for step in steps_dict[u'steps']:
+                for step in steps_dict['steps']:
                     x = self.convert_input(step.input)[:2]
                     env_values = step.input.env.reshape((4, -1))
                     in1 = np.clip(env_values[0].argmax() - 1, 0, 9)
@@ -322,7 +322,7 @@ def train_f_enc(self, steps_list, epoch=50):
                     y = [yy.reshape((self.batch_size, -1)) for yy in [y0, y1]]
                     loss = env_model.train_on_batch(x, y)
                     losses.append(loss)
-            print u"ep %3d: loss=%s" % (ep, np.average(losses))
+            print "ep %3d: loss=%s" % (ep, np.average(losses))
             if np.average(losses) < 1e-06:
                 break
 
@@ -331,7 +331,7 @@ def question_test(self, addition_env, npi_runner, question):
         self.reset()
         try:
             run_npi(addition_env, npi_runner, self.program_set.ADD, question)
-            if question[u'correct']:
+            if question['correct']:
                 return True
         except StopIteration:
             pass
@@ -382,10 +382,10 @@ def load_weights(self):
     def print_weights(self, weights=None, detail=False):
         weights = weights or self.model.get_weights()
         for w in weights:
-            print u"w%s: sum(w)=%s, ave(w)=%s" % (w.shape, np.sum(w), np.average(w))
+            print "w%s: sum(w)=%s, ave(w)=%s" % (w.shape, np.sum(w), np.average(w))
         if detail:
             for w in weights:
-                print u"%s: %s" % (w.shape, w)
+                print "%s: %s" % (w.shape, w)
 
     @staticmethod
     def size_of_env_observation():
diff --git a/src/npi/add/test_model.py b/src/npi/add/test_model.py
index ad9eb3a..5dd6c27 100644
--- a/src/npi/add/test_model.py
+++ b/src/npi/add/test_model.py
@@ -31,18 +31,18 @@ def main(stdscr, model_path, num, result_logger):
         run_npi(addition_env, npi_runner, program_set.ADD, data)
         result_logger.write(data)
         terminal.add_log(data)
-        if data[u'correct']:
+        if data['correct']:
             correct_count += 1
         else:
             wrong_count += 1
     return correct_count, wrong_count
 
 
-if __name__ == u'__main__':
+if __name__ == '__main__':
     import sys
-    DEBUG_MODE = os.environ.get(u'DEBUG')
+    DEBUG_MODE = os.environ.get('DEBUG')
     model_path_ = sys.argv[1]
     num_data = int(sys.argv[2]) if len(sys.argv) > 2 else 1000
-    log_filename = sys.argv[3] if len(sys.argv) > 3 else u'result.log'
+    log_filename = sys.argv[3] if len(sys.argv) > 3 else 'result.log'
     cc, wc = curses.wrapper(main, model_path_, num_data, ResultLogger(log_filename))
-    print u"Accuracy %s(OK=%d, NG=%d)" % (cc/(cc+wc), cc, wc)
+    print "Accuracy %s(OK=%d, NG=%d)" % (cc/(cc+wc), cc, wc)
diff --git a/src/npi/add/training_model.py b/src/npi/add/training_model.py
index 3bb64c7..f89f2e5 100644
--- a/src/npi/add/training_model.py
+++ b/src/npi/add/training_model.py
@@ -16,16 +16,16 @@ def main(filename, model_path):
     system = RuntimeSystem()
     program_set = AdditionProgramSet()
 
-    with open(filename, u'rb') as f:
+    with open(filename, 'rb') as f:
         steps_list = pickle.load(f)
 
     npi_model = AdditionNPIModel(system, model_path, program_set)
     npi_model.fit(steps_list)
 
 
-if __name__ == u'__main__':
+if __name__ == '__main__':
     import sys
-    DEBUG_MODE = os.environ.get(u'DEBUG')
+    DEBUG_MODE = os.environ.get('DEBUG')
     train_filename = sys.argv[1]
     model_output = sys.argv[2]
     main(train_filename, model_output)
diff --git a/src/npi/core.py b/src/npi/core.py
index c418de0..f06026b 100644
--- a/src/npi/core.py
+++ b/src/npi/core.py
@@ -46,7 +46,7 @@ def update_to(self, index, integer):
         self.values[index, int(np.clip(integer, 0, self.depth-1))] = 1
 
     def __str__(self):
-        return u"<IA: %s>" % self.decode_all()
+        return "<IA: %s>" % self.decode_all()
 
 
 class Program(object):
@@ -59,7 +59,7 @@ def __init__(self, name, *args):
 
     def description_with_args(self, args):
         int_args = args.decode_all()
-        return u"%s(%s)" % (self.name, u", ".join([unicode(x) for x in int_args]))
+        return "%s(%s)" % (self.name, ", ".join([unicode(x) for x in int_args]))
 
     def to_one_hot(self, size, dtype=np.float):
         ret = np.zeros((size,), dtype=dtype)
@@ -70,7 +70,7 @@ def do(self, env, args):
         raise NotImplementedError()
 
     def __str__(self):
-        return u"<Program: name=%s>" % self.name
+        return "<Program: name=%s>" % self.name
 
 
 class StepInput(object):
@@ -87,7 +87,7 @@ def __init__(self, r, program=None, arguments=None):
         self.arguments = arguments
 
     def __str__(self):
-        return u"<StepOutput: r=%s pg=%s arg=%s>" % (self.r, self.program, self.arguments)
+        return "<StepOutput: r=%s pg=%s arg=%s>" % (self.r, self.program, self.arguments)
 
 
 class StepInOut(object):
@@ -101,9 +101,10 @@ def __init__(self, filename):
         self.filename = filename
 
     def write(self, obj):
-        with open(self.filename, u"a") as f:
-            json.dump(obj, f)
-            f.write(u"\n")
+        with open(self.filename, "a") as f:
+            #json.dump(obj, f)
+            #f.write('\n')
+            pass
 
 
 class NPIStep(object):
diff --git a/src/npi/terminal_core.py b/src/npi/terminal_core.py
index c65e408..c5c22f9 100644
--- a/src/npi/terminal_core.py
+++ b/src/npi/terminal_core.py
@@ -6,7 +6,7 @@
 
 from npi.core import Program, IntegerArguments, NPIStep, StepOutput, StepInput, StepInOut
 
-__author__ = u'k_morishita'
+__author__ = 'k_morishita'
 
 
 class Screen(object):
@@ -71,7 +71,7 @@ def wait_for_key(self):
 
     def update_main_screen(self, screen):
         for y in xrange(screen.height):
-            line = u"".join([self.char_map[ch] for ch in screen[y]])
+            line = "".join([self.char_map[ch] for ch in screen[y]])
             self.ignore_error_add_str(self.main_window, y, 0, line)
 
     def update_main_window_attr(self, screen, y, x, attr):
@@ -92,13 +92,13 @@ def add_log(self, line):
         self.log_list = self.log_list[:self.LOG_WINDOW_HEIGHT-1]
         self.log_window.clear()
         for i, line in enumerate(self.log_list):
-            line = unicode(line) + u" " * (self.LOG_WINDOW_WIDTH - len(unicode(line)))
+            line = unicode(line) + " " * (self.LOG_WINDOW_WIDTH - len(unicode(line)))
             self.log_window.addstr(i, 0, line)
         self.log_window.refresh()
 
     @staticmethod
     def ignore_error_add_str(win, y, x, s, attr=curses.A_NORMAL):
-        u"""一番右下に書き込むと例外が飛んでくるけど、漢は黙って無視するのがお作法らしい？"""
+        """一番右下に書き込むと例外が飛んでくるけど、漢は黙って無視するのがお作法らしい？"""
         try:
             win.addstr(y, x, s, attr)
         except curses.error:
@@ -136,12 +136,12 @@ def display_env(self, env, force=False):
     def display_information(self, program, arguments, result, depth):
         if self.verbose and self.terminal:
             information = [
-                u"Step %2d Depth: %2d" % (self.steps, depth),
+                "Step %2d Depth: %2d" % (self.steps, depth),
                 program.description_with_args(arguments),
-                u'r=%.2f' % result.r,
+                'r=%.2f' % result.r,
             ]
             if result.program:
-                information.append(u"-> %s" % result.program.description_with_args(result.arguments))
+                information.append("-> %s" % result.program.description_with_args(result.arguments))
             self.terminal.update_info_screen(information)
             self.wait()
 

From 77898a16ed90437fe11c38c33a47099700ad8ba7 Mon Sep 17 00:00:00 2001
From: kmader <kevinmader@4quant.com>
Date: Tue, 6 Sep 2016 23:46:59 +0200
Subject: [PATCH 4/4] first working version with notebooks and model output

---
 README.md                  |   5 +-
 notebooks/TrainModel.ipynb | 947 +++++++++++++++++++++++++++++++++++++
 src/npi/add/model.py       |  23 +-
 3 files changed, 965 insertions(+), 10 deletions(-)
 create mode 100644 notebooks/TrainModel.ipynb

diff --git a/README.md b/README.md
index 7445a5d..da951f8 100644
--- a/README.md
+++ b/README.md
@@ -2,16 +2,19 @@ About
 =====
 
 Implementation of [Neural Programmer-Interpreters](http://arxiv.org/abs/1511.06279) with Keras.
+This fork is modified to run on Python2 instead of Python3 and adds example Jupyter notebooks (in the notebooks directory).
 
 How to Demo
 ===========
 
 [Demo Movie](https://youtu.be/s7PuBqwI2YA)
 
+[View the Notebook](notebooks/TrainModel.ipynb)
+
 requirement
 -----------
 
-* Python3
+* Python2
 
 setup
 -----
diff --git a/notebooks/TrainModel.ipynb b/notebooks/TrainModel.ipynb
new file mode 100644
index 0000000..0ade0ae
--- /dev/null
+++ b/notebooks/TrainModel.ipynb
@@ -0,0 +1,947 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Train the Model\n",
+    "This notebook is a copy of the training_model.py script, adapted for interactive use. Use it after you have already created the training data with the instructions below. To run those commands from inside Jupyter, add an extra ../ to the beginning of the script path.\n",
+    "\n",
+    "### create training dataset\n",
+    "```\n",
+    "sh src/run_create_addition_data.sh\n",
+    "```\n",
+    "\n",
+    "### create training dataset while showing steps on the terminal\n",
+    "```\n",
+    "DEBUG=1 sh src/run_create_addition_data.sh\n",
+    "```"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Using Theano backend.\n"
+     ]
+    }
+   ],
+   "source": [
+    "# coding: utf-8\n",
+    "import sys\n",
+    "\n",
+    "from __future__ import with_statement\n",
+    "from __future__ import absolute_import\n",
+    "import os\n",
+    "import pickle\n",
+    "sys.path.append('../src') # for the NPI tools\n",
+    "from npi.add.config import FIELD_ROW, FIELD_WIDTH, FIELD_DEPTH\n",
+    "from npi.add.lib import AdditionEnv, AdditionProgramSet, AdditionTeacher, create_char_map, create_questions, run_npi\n",
+    "from npi.add.model import AdditionNPIModel\n",
+    "from npi.core import ResultLogger, RuntimeSystem\n",
+    "from npi.terminal_core import TerminalNPIRunner, Terminal\n",
+    "from io import open\n",
+    "from glob import glob\n",
+    "from IPython.display import SVG"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "train_datasets = glob('../data/*.pkl')\n",
+    "assert len(train_datasets) > 0\n",
+    "model_path = '../data/addition.model'"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "DEBUG_MODE = os.environ.get('DEBUG')\n",
+    "system = RuntimeSystem()\n",
+    "program_set = AdditionProgramSet()\n",
+    "with open(train_datasets[0], 'rb') as f:\n",
+    "        steps_list = pickle.load(f)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "npi_model = AdditionNPIModel(system, model_path, program_set)\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "image/svg+xml": [
+       "<svg height=\"578pt\" viewBox=\"0.00 0.00 677.59 578.20\" width=\"678pt\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\">\n",
+       "<g class=\"graph\" id=\"graph0\" transform=\"scale(1 1) rotate(0) translate(4 574.2)\">\n",
+       "<title>G</title>\n",
+       "<polygon fill=\"white\" points=\"-4,4 -4,-574.2 673.587,-574.2 673.587,4 -4,4\" stroke=\"none\"/>\n",
+       "<!-- 4599299216 -->\n",
+       "<g class=\"node\" id=\"node1\"><title>4599299216</title>\n",
+       "<polygon fill=\"none\" points=\"0,-520.1 0,-569.7 330.625,-569.7 330.625,-520.1 0,-520.1\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"83.9948\" y=\"-540.7\">f_enc_convert (Sequential)</text>\n",
+       "<polyline fill=\"none\" points=\"167.99,-520.1 167.99,-569.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"195.825\" y=\"-553.1\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"167.99,-544.9 223.661,-544.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"195.825\" y=\"-528.3\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"223.661,-520.1 223.661,-569.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"277.143\" y=\"-553.1\">[(1, 44), (1, 30)]</text>\n",
+       "<polyline fill=\"none\" points=\"223.661,-544.9 330.625,-544.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"276.822\" y=\"-528.3\">(1, 1, 128)</text>\n",
+       "</g>\n",
+       "<!-- 5033807632 -->\n",
+       "<g class=\"node\" id=\"node3\"><title>5033807632</title>\n",
+       "<polygon fill=\"none\" points=\"184.827,-433.5 184.827,-483.1 489.798,-483.1 489.798,-433.5 184.827,-433.5\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"241.995\" y=\"-454.1\">merge_2 (Merge)</text>\n",
+       "<polyline fill=\"none\" points=\"299.163,-433.5 299.163,-483.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"326.999\" y=\"-466.5\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"299.163,-458.3 354.835,-458.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"326.999\" y=\"-441.7\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"354.835,-433.5 354.835,-483.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"422.316\" y=\"-466.5\">[(1, 1, 128), (1, 1, 5)]</text>\n",
+       "<polyline fill=\"none\" points=\"354.835,-458.3 489.798,-458.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"421.995\" y=\"-441.7\">(1, 1, 133)</text>\n",
+       "</g>\n",
+       "<!-- 4599299216&#45;&gt;5033807632 -->\n",
+       "<g class=\"edge\" id=\"edge1\"><title>4599299216-&gt;5033807632</title>\n",
+       "<path d=\"M214.141,-519.883C234.472,-509.883 258.235,-498.195 279.436,-487.767\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"281.232,-490.785 288.66,-483.23 278.142,-484.503 281.232,-490.785\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4625154448 -->\n",
+       "<g class=\"node\" id=\"node2\"><title>4625154448</title>\n",
+       "<polygon fill=\"none\" points=\"349.038,-520.1 349.038,-569.7 669.587,-569.7 669.587,-520.1 349.038,-520.1\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"451.316\" y=\"-540.7\">program_embedding (Sequential)</text>\n",
+       "<polyline fill=\"none\" points=\"553.594,-520.1 553.594,-569.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"581.43\" y=\"-553.1\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"553.594,-544.9 609.266,-544.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"581.43\" y=\"-528.3\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"609.266,-520.1 609.266,-569.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"639.427\" y=\"-553.1\">(1, 1)</text>\n",
+       "<polyline fill=\"none\" points=\"609.266,-544.9 669.587,-544.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"639.427\" y=\"-528.3\">(1, 1, 5)</text>\n",
+       "</g>\n",
+       "<!-- 4625154448&#45;&gt;5033807632 -->\n",
+       "<g class=\"edge\" id=\"edge2\"><title>4625154448-&gt;5033807632</title>\n",
+       "<path d=\"M460.484,-519.883C440.153,-509.883 416.39,-498.195 395.189,-487.767\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"396.483,-484.503 385.965,-483.23 393.393,-490.785 396.483,-484.503\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 5009279184 -->\n",
+       "<g class=\"node\" id=\"node4\"><title>5009279184</title>\n",
+       "<polygon fill=\"none\" points=\"220.181,-346.9 220.181,-396.5 454.444,-396.5 454.444,-346.9 220.181,-346.9\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"272.316\" y=\"-367.5\">lstm_1 (LSTM)</text>\n",
+       "<polyline fill=\"none\" points=\"324.451,-346.9 324.451,-396.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"352.287\" y=\"-379.9\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"324.451,-371.7 380.123,-371.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"352.287\" y=\"-355.1\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"380.123,-346.9 380.123,-396.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"417.283\" y=\"-379.9\">(1, 1, 133)</text>\n",
+       "<polyline fill=\"none\" points=\"380.123,-371.7 454.444,-371.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"417.283\" y=\"-355.1\">(1, 256)</text>\n",
+       "</g>\n",
+       "<!-- 5033807632&#45;&gt;5009279184 -->\n",
+       "<g class=\"edge\" id=\"edge3\"><title>5033807632-&gt;5009279184</title>\n",
+       "<path d=\"M337.312,-433.283C337.312,-425.067 337.312,-415.712 337.312,-406.852\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"340.813,-406.777 337.312,-396.777 333.813,-406.777 340.813,-406.777\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 5074307728 -->\n",
+       "<g class=\"node\" id=\"node5\"><title>5074307728</title>\n",
+       "<polygon fill=\"none\" points=\"201.915,-260.3 201.915,-309.9 472.71,-309.9 472.71,-260.3 201.915,-260.3\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"279.316\" y=\"-280.9\">relu_lstm_1 (Activation)</text>\n",
+       "<polyline fill=\"none\" points=\"356.717,-260.3 356.717,-309.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"384.553\" y=\"-293.3\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"356.717,-285.1 412.389,-285.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"384.553\" y=\"-268.5\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"412.389,-260.3 412.389,-309.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"442.549\" y=\"-293.3\">(1, 256)</text>\n",
+       "<polyline fill=\"none\" points=\"412.389,-285.1 472.71,-285.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"442.549\" y=\"-268.5\">(1, 256)</text>\n",
+       "</g>\n",
+       "<!-- 5009279184&#45;&gt;5074307728 -->\n",
+       "<g class=\"edge\" id=\"edge4\"><title>5009279184-&gt;5074307728</title>\n",
+       "<path d=\"M337.312,-346.683C337.312,-338.467 337.312,-329.112 337.312,-320.252\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"340.813,-320.177 337.312,-310.177 333.813,-320.177 340.813,-320.177\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4508958928 -->\n",
+       "<g class=\"node\" id=\"node6\"><title>4508958928</title>\n",
+       "<polygon fill=\"none\" points=\"177.839,-173.7 177.839,-223.3 496.786,-223.3 496.786,-173.7 177.839,-173.7\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"272.316\" y=\"-194.3\">repeatvector_2 (RepeatVector)</text>\n",
+       "<polyline fill=\"none\" points=\"366.793,-173.7 366.793,-223.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"394.629\" y=\"-206.7\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"366.793,-198.5 422.465,-198.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"394.629\" y=\"-181.9\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"422.465,-173.7 422.465,-223.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"459.626\" y=\"-206.7\">(1, 256)</text>\n",
+       "<polyline fill=\"none\" points=\"422.465,-198.5 496.786,-198.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"459.626\" y=\"-181.9\">(1, 1, 256)</text>\n",
+       "</g>\n",
+       "<!-- 5074307728&#45;&gt;4508958928 -->\n",
+       "<g class=\"edge\" id=\"edge5\"><title>5074307728-&gt;4508958928</title>\n",
+       "<path d=\"M337.312,-260.083C337.312,-251.867 337.312,-242.512 337.312,-233.652\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"340.813,-233.577 337.312,-223.577 333.813,-233.577 340.813,-233.577\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4738189776 -->\n",
+       "<g class=\"node\" id=\"node7\"><title>4738189776</title>\n",
+       "<polygon fill=\"none\" points=\"220.181,-87.1 220.181,-136.7 454.444,-136.7 454.444,-87.1 220.181,-87.1\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"272.316\" y=\"-107.7\">lstm_2 (LSTM)</text>\n",
+       "<polyline fill=\"none\" points=\"324.451,-87.1 324.451,-136.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"352.287\" y=\"-120.1\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"324.451,-111.9 380.123,-111.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"352.287\" y=\"-95.3\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"380.123,-87.1 380.123,-136.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"417.283\" y=\"-120.1\">(1, 1, 256)</text>\n",
+       "<polyline fill=\"none\" points=\"380.123,-111.9 454.444,-111.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"417.283\" y=\"-95.3\">(1, 256)</text>\n",
+       "</g>\n",
+       "<!-- 4508958928&#45;&gt;4738189776 -->\n",
+       "<g class=\"edge\" id=\"edge6\"><title>4508958928-&gt;4738189776</title>\n",
+       "<path d=\"M337.312,-173.483C337.312,-165.267 337.312,-155.912 337.312,-147.052\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"340.813,-146.977 337.312,-136.977 333.813,-146.977 340.813,-146.977\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4599983056 -->\n",
+       "<g class=\"node\" id=\"node8\"><title>4599983056</title>\n",
+       "<polygon fill=\"none\" points=\"201.915,-0.5 201.915,-50.1 472.71,-50.1 472.71,-0.5 201.915,-0.5\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"279.316\" y=\"-21.1\">relu_lstm_2 (Activation)</text>\n",
+       "<polyline fill=\"none\" points=\"356.717,-0.5 356.717,-50.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"384.553\" y=\"-33.5\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"356.717,-25.3 412.389,-25.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"384.553\" y=\"-8.7\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"412.389,-0.5 412.389,-50.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"442.549\" y=\"-33.5\">(1, 256)</text>\n",
+       "<polyline fill=\"none\" points=\"412.389,-25.3 472.71,-25.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"442.549\" y=\"-8.7\">(1, 256)</text>\n",
+       "</g>\n",
+       "<!-- 4738189776&#45;&gt;4599983056 -->\n",
+       "<g class=\"edge\" id=\"edge7\"><title>4738189776-&gt;4599983056</title>\n",
+       "<path d=\"M337.312,-86.8833C337.312,-78.6673 337.312,-69.3117 337.312,-60.4518\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"340.813,-60.3767 337.312,-50.3767 333.813,-60.3768 340.813,-60.3767\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "</g>\n",
+       "</svg>"
+      ],
+      "text/plain": [
+       "<IPython.core.display.SVG object>"
+      ]
+     },
+     "execution_count": 6,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "SVG('f_lstm.svg')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "image/svg+xml": [
+       "<svg height=\"838pt\" viewBox=\"0.00 0.00 677.59 838.00\" width=\"678pt\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\">\n",
+       "<g class=\"graph\" id=\"graph0\" transform=\"scale(1 1) rotate(0) translate(4 834)\">\n",
+       "<title>G</title>\n",
+       "<polygon fill=\"white\" points=\"-4,4 -4,-834 673.587,-834 673.587,4 -4,4\" stroke=\"none\"/>\n",
+       "<!-- 4599299216 -->\n",
+       "<g class=\"node\" id=\"node1\"><title>4599299216</title>\n",
+       "<polygon fill=\"none\" points=\"0,-779.9 0,-829.5 330.625,-829.5 330.625,-779.9 0,-779.9\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"83.9948\" y=\"-800.5\">f_enc_convert (Sequential)</text>\n",
+       "<polyline fill=\"none\" points=\"167.99,-779.9 167.99,-829.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"195.825\" y=\"-812.9\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"167.99,-804.7 223.661,-804.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"195.825\" y=\"-788.1\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"223.661,-779.9 223.661,-829.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"277.143\" y=\"-812.9\">[(1, 44), (1, 30)]</text>\n",
+       "<polyline fill=\"none\" points=\"223.661,-804.7 330.625,-804.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"276.822\" y=\"-788.1\">(1, 1, 128)</text>\n",
+       "</g>\n",
+       "<!-- 5033807632 -->\n",
+       "<g class=\"node\" id=\"node3\"><title>5033807632</title>\n",
+       "<polygon fill=\"none\" points=\"184.827,-693.3 184.827,-742.9 489.798,-742.9 489.798,-693.3 184.827,-693.3\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"241.995\" y=\"-713.9\">merge_2 (Merge)</text>\n",
+       "<polyline fill=\"none\" points=\"299.163,-693.3 299.163,-742.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"326.999\" y=\"-726.3\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"299.163,-718.1 354.835,-718.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"326.999\" y=\"-701.5\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"354.835,-693.3 354.835,-742.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"422.316\" y=\"-726.3\">[(1, 1, 128), (1, 1, 5)]</text>\n",
+       "<polyline fill=\"none\" points=\"354.835,-718.1 489.798,-718.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"421.995\" y=\"-701.5\">(1, 1, 133)</text>\n",
+       "</g>\n",
+       "<!-- 4599299216&#45;&gt;5033807632 -->\n",
+       "<g class=\"edge\" id=\"edge1\"><title>4599299216-&gt;5033807632</title>\n",
+       "<path d=\"M214.141,-779.683C234.472,-769.683 258.235,-757.995 279.436,-747.567\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"281.232,-750.585 288.66,-743.03 278.142,-744.303 281.232,-750.585\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4625154448 -->\n",
+       "<g class=\"node\" id=\"node2\"><title>4625154448</title>\n",
+       "<polygon fill=\"none\" points=\"349.038,-779.9 349.038,-829.5 669.587,-829.5 669.587,-779.9 349.038,-779.9\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"451.316\" y=\"-800.5\">program_embedding (Sequential)</text>\n",
+       "<polyline fill=\"none\" points=\"553.594,-779.9 553.594,-829.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"581.43\" y=\"-812.9\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"553.594,-804.7 609.266,-804.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"581.43\" y=\"-788.1\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"609.266,-779.9 609.266,-829.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"639.427\" y=\"-812.9\">(1, 1)</text>\n",
+       "<polyline fill=\"none\" points=\"609.266,-804.7 669.587,-804.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"639.427\" y=\"-788.1\">(1, 1, 5)</text>\n",
+       "</g>\n",
+       "<!-- 4625154448&#45;&gt;5033807632 -->\n",
+       "<g class=\"edge\" id=\"edge2\"><title>4625154448-&gt;5033807632</title>\n",
+       "<path d=\"M460.484,-779.683C440.153,-769.683 416.39,-757.995 395.189,-747.567\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"396.483,-744.303 385.965,-743.03 393.393,-750.585 396.483,-744.303\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 5009279184 -->\n",
+       "<g class=\"node\" id=\"node4\"><title>5009279184</title>\n",
+       "<polygon fill=\"none\" points=\"220.181,-606.7 220.181,-656.3 454.444,-656.3 454.444,-606.7 220.181,-606.7\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"272.316\" y=\"-627.3\">lstm_1 (LSTM)</text>\n",
+       "<polyline fill=\"none\" points=\"324.451,-606.7 324.451,-656.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"352.287\" y=\"-639.7\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"324.451,-631.5 380.123,-631.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"352.287\" y=\"-614.9\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"380.123,-606.7 380.123,-656.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"417.283\" y=\"-639.7\">(1, 1, 133)</text>\n",
+       "<polyline fill=\"none\" points=\"380.123,-631.5 454.444,-631.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"417.283\" y=\"-614.9\">(1, 256)</text>\n",
+       "</g>\n",
+       "<!-- 5033807632&#45;&gt;5009279184 -->\n",
+       "<g class=\"edge\" id=\"edge3\"><title>5033807632-&gt;5009279184</title>\n",
+       "<path d=\"M337.312,-693.083C337.312,-684.867 337.312,-675.512 337.312,-666.652\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"340.813,-666.577 337.312,-656.577 333.813,-666.577 340.813,-666.577\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 5074307728 -->\n",
+       "<g class=\"node\" id=\"node5\"><title>5074307728</title>\n",
+       "<polygon fill=\"none\" points=\"201.915,-520.1 201.915,-569.7 472.71,-569.7 472.71,-520.1 201.915,-520.1\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"279.316\" y=\"-540.7\">relu_lstm_1 (Activation)</text>\n",
+       "<polyline fill=\"none\" points=\"356.717,-520.1 356.717,-569.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"384.553\" y=\"-553.1\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"356.717,-544.9 412.389,-544.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"384.553\" y=\"-528.3\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"412.389,-520.1 412.389,-569.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"442.549\" y=\"-553.1\">(1, 256)</text>\n",
+       "<polyline fill=\"none\" points=\"412.389,-544.9 472.71,-544.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"442.549\" y=\"-528.3\">(1, 256)</text>\n",
+       "</g>\n",
+       "<!-- 5009279184&#45;&gt;5074307728 -->\n",
+       "<g class=\"edge\" id=\"edge4\"><title>5009279184-&gt;5074307728</title>\n",
+       "<path d=\"M337.312,-606.483C337.312,-598.267 337.312,-588.912 337.312,-580.052\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"340.813,-579.977 337.312,-569.977 333.813,-579.977 340.813,-579.977\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4508958928 -->\n",
+       "<g class=\"node\" id=\"node6\"><title>4508958928</title>\n",
+       "<polygon fill=\"none\" points=\"177.839,-433.5 177.839,-483.1 496.786,-483.1 496.786,-433.5 177.839,-433.5\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"272.316\" y=\"-454.1\">repeatvector_2 (RepeatVector)</text>\n",
+       "<polyline fill=\"none\" points=\"366.793,-433.5 366.793,-483.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"394.629\" y=\"-466.5\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"366.793,-458.3 422.465,-458.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"394.629\" y=\"-441.7\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"422.465,-433.5 422.465,-483.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"459.626\" y=\"-466.5\">(1, 256)</text>\n",
+       "<polyline fill=\"none\" points=\"422.465,-458.3 496.786,-458.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"459.626\" y=\"-441.7\">(1, 1, 256)</text>\n",
+       "</g>\n",
+       "<!-- 5074307728&#45;&gt;4508958928 -->\n",
+       "<g class=\"edge\" id=\"edge5\"><title>5074307728-&gt;4508958928</title>\n",
+       "<path d=\"M337.312,-519.883C337.312,-511.667 337.312,-502.312 337.312,-493.452\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"340.813,-493.377 337.312,-483.377 333.813,-493.377 340.813,-493.377\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4738189776 -->\n",
+       "<g class=\"node\" id=\"node7\"><title>4738189776</title>\n",
+       "<polygon fill=\"none\" points=\"220.181,-346.9 220.181,-396.5 454.444,-396.5 454.444,-346.9 220.181,-346.9\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"272.316\" y=\"-367.5\">lstm_2 (LSTM)</text>\n",
+       "<polyline fill=\"none\" points=\"324.451,-346.9 324.451,-396.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"352.287\" y=\"-379.9\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"324.451,-371.7 380.123,-371.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"352.287\" y=\"-355.1\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"380.123,-346.9 380.123,-396.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"417.283\" y=\"-379.9\">(1, 1, 256)</text>\n",
+       "<polyline fill=\"none\" points=\"380.123,-371.7 454.444,-371.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"417.283\" y=\"-355.1\">(1, 256)</text>\n",
+       "</g>\n",
+       "<!-- 4508958928&#45;&gt;4738189776 -->\n",
+       "<g class=\"edge\" id=\"edge6\"><title>4508958928-&gt;4738189776</title>\n",
+       "<path d=\"M337.312,-433.283C337.312,-425.067 337.312,-415.712 337.312,-406.852\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"340.813,-406.777 337.312,-396.777 333.813,-406.777 340.813,-406.777\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4599983056 -->\n",
+       "<g class=\"node\" id=\"node8\"><title>4599983056</title>\n",
+       "<polygon fill=\"none\" points=\"201.915,-260.3 201.915,-309.9 472.71,-309.9 472.71,-260.3 201.915,-260.3\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"279.316\" y=\"-280.9\">relu_lstm_2 (Activation)</text>\n",
+       "<polyline fill=\"none\" points=\"356.717,-260.3 356.717,-309.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"384.553\" y=\"-293.3\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"356.717,-285.1 412.389,-285.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"384.553\" y=\"-268.5\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"412.389,-260.3 412.389,-309.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"442.549\" y=\"-293.3\">(1, 256)</text>\n",
+       "<polyline fill=\"none\" points=\"412.389,-285.1 472.71,-285.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"442.549\" y=\"-268.5\">(1, 256)</text>\n",
+       "</g>\n",
+       "<!-- 4738189776&#45;&gt;4599983056 -->\n",
+       "<g class=\"edge\" id=\"edge7\"><title>4738189776-&gt;4599983056</title>\n",
+       "<path d=\"M337.312,-346.683C337.312,-338.467 337.312,-329.112 337.312,-320.252\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"340.813,-320.177 337.312,-310.177 333.813,-320.177 340.813,-320.177\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4495123344 -->\n",
+       "<g class=\"node\" id=\"node9\"><title>4495123344</title>\n",
+       "<polygon fill=\"none\" points=\"224.478,-173.7 224.478,-223.3 450.147,-223.3 450.147,-173.7 224.478,-173.7\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"279.316\" y=\"-194.3\">dense_2 (Dense)</text>\n",
+       "<polyline fill=\"none\" points=\"334.154,-173.7 334.154,-223.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"361.99\" y=\"-206.7\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"334.154,-198.5 389.826,-198.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"361.99\" y=\"-181.9\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"389.826,-173.7 389.826,-223.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"419.986\" y=\"-206.7\">(1, 256)</text>\n",
+       "<polyline fill=\"none\" points=\"389.826,-198.5 450.147,-198.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"419.986\" y=\"-181.9\">(1, 5)</text>\n",
+       "</g>\n",
+       "<!-- 4599983056&#45;&gt;4495123344 -->\n",
+       "<g class=\"edge\" id=\"edge8\"><title>4599983056-&gt;4495123344</title>\n",
+       "<path d=\"M337.312,-260.083C337.312,-251.867 337.312,-242.512 337.312,-233.652\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"340.813,-233.577 337.312,-223.577 333.813,-233.577 340.813,-233.577\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4743679824 -->\n",
+       "<g class=\"node\" id=\"node10\"><title>4743679824</title>\n",
+       "<polygon fill=\"none\" points=\"227.978,-87.1 227.978,-136.7 446.647,-136.7 446.647,-87.1 227.978,-87.1\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"282.816\" y=\"-107.7\">dense_3 (Dense)</text>\n",
+       "<polyline fill=\"none\" points=\"337.654,-87.1 337.654,-136.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"365.49\" y=\"-120.1\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"337.654,-111.9 393.326,-111.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"365.49\" y=\"-95.3\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"393.326,-87.1 393.326,-136.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"419.986\" y=\"-120.1\">(1, 5)</text>\n",
+       "<polyline fill=\"none\" points=\"393.326,-111.9 446.647,-111.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"419.986\" y=\"-95.3\">(1, 10)</text>\n",
+       "</g>\n",
+       "<!-- 4495123344&#45;&gt;4743679824 -->\n",
+       "<g class=\"edge\" id=\"edge9\"><title>4495123344-&gt;4743679824</title>\n",
+       "<path d=\"M337.312,-173.483C337.312,-165.267 337.312,-155.912 337.312,-147.052\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"340.813,-146.977 337.312,-136.977 333.813,-146.977 340.813,-146.977\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 5072433936 -->\n",
+       "<g class=\"node\" id=\"node11\"><title>5072433936</title>\n",
+       "<polygon fill=\"none\" points=\"199.975,-0.5 199.975,-50.1 474.649,-50.1 474.649,-0.5 199.975,-0.5\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"282.816\" y=\"-21.1\">softmax_prog (Activation)</text>\n",
+       "<polyline fill=\"none\" points=\"365.657,-0.5 365.657,-50.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"393.492\" y=\"-33.5\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"365.657,-25.3 421.328,-25.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"393.492\" y=\"-8.7\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"421.328,-0.5 421.328,-50.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"447.989\" y=\"-33.5\">(1, 10)</text>\n",
+       "<polyline fill=\"none\" points=\"421.328,-25.3 474.649,-25.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"447.989\" y=\"-8.7\">(1, 10)</text>\n",
+       "</g>\n",
+       "<!-- 4743679824&#45;&gt;5072433936 -->\n",
+       "<g class=\"edge\" id=\"edge10\"><title>4743679824-&gt;5072433936</title>\n",
+       "<path d=\"M337.312,-86.8833C337.312,-78.6673 337.312,-69.3117 337.312,-60.4518\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"340.813,-60.3767 337.312,-50.3767 333.813,-60.3768 340.813,-60.3767\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "</g>\n",
+       "</svg>"
+      ],
+      "text/plain": [
+       "<IPython.core.display.SVG object>"
+      ]
+     },
+     "execution_count": 7,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "SVG('f_prog.svg')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "data": {
+      "image/svg+xml": [
+       "<svg height=\"838pt\" viewBox=\"0.00 0.00 1410.28 838.00\" width=\"1410pt\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\">\n",
+       "<g class=\"graph\" id=\"graph0\" transform=\"scale(1 1) rotate(0) translate(4 834)\">\n",
+       "<title>G</title>\n",
+       "<polygon fill=\"white\" points=\"-4,4 -4,-834 1406.28,-834 1406.28,4 -4,4\" stroke=\"none\"/>\n",
+       "<!-- 4599299216 -->\n",
+       "<g class=\"node\" id=\"node1\"><title>4599299216</title>\n",
+       "<polygon fill=\"none\" points=\"344.024,-779.9 344.024,-829.5 674.649,-829.5 674.649,-779.9 344.024,-779.9\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"428.019\" y=\"-800.5\">f_enc_convert (Sequential)</text>\n",
+       "<polyline fill=\"none\" points=\"512.014,-779.9 512.014,-829.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"539.85\" y=\"-812.9\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"512.014,-804.7 567.686,-804.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"539.85\" y=\"-788.1\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"567.686,-779.9 567.686,-829.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"621.168\" y=\"-812.9\">[(1, 44), (1, 30)]</text>\n",
+       "<polyline fill=\"none\" points=\"567.686,-804.7 674.649,-804.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"620.846\" y=\"-788.1\">(1, 1, 128)</text>\n",
+       "</g>\n",
+       "<!-- 5033807632 -->\n",
+       "<g class=\"node\" id=\"node3\"><title>5033807632</title>\n",
+       "<polygon fill=\"none\" points=\"528.851,-693.3 528.851,-742.9 833.823,-742.9 833.823,-693.3 528.851,-693.3\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"586.019\" y=\"-713.9\">merge_2 (Merge)</text>\n",
+       "<polyline fill=\"none\" points=\"643.187,-693.3 643.187,-742.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"671.023\" y=\"-726.3\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"643.187,-718.1 698.859,-718.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"671.023\" y=\"-701.5\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"698.859,-693.3 698.859,-742.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"766.341\" y=\"-726.3\">[(1, 1, 128), (1, 1, 5)]</text>\n",
+       "<polyline fill=\"none\" points=\"698.859,-718.1 833.823,-718.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"766.02\" y=\"-701.5\">(1, 1, 133)</text>\n",
+       "</g>\n",
+       "<!-- 4599299216&#45;&gt;5033807632 -->\n",
+       "<g class=\"edge\" id=\"edge1\"><title>4599299216-&gt;5033807632</title>\n",
+       "<path d=\"M558.165,-779.683C578.496,-769.683 602.259,-757.995 623.46,-747.567\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"625.256,-750.585 632.685,-743.03 622.167,-744.303 625.256,-750.585\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4625154448 -->\n",
+       "<g class=\"node\" id=\"node2\"><title>4625154448</title>\n",
+       "<polygon fill=\"none\" points=\"693.062,-779.9 693.062,-829.5 1013.61,-829.5 1013.61,-779.9 693.062,-779.9\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"795.341\" y=\"-800.5\">program_embedding (Sequential)</text>\n",
+       "<polyline fill=\"none\" points=\"897.619,-779.9 897.619,-829.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"925.455\" y=\"-812.9\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"897.619,-804.7 953.29,-804.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"925.455\" y=\"-788.1\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"953.29,-779.9 953.29,-829.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"983.451\" y=\"-812.9\">(1, 1)</text>\n",
+       "<polyline fill=\"none\" points=\"953.29,-804.7 1013.61,-804.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"983.451\" y=\"-788.1\">(1, 1, 5)</text>\n",
+       "</g>\n",
+       "<!-- 4625154448&#45;&gt;5033807632 -->\n",
+       "<g class=\"edge\" id=\"edge2\"><title>4625154448-&gt;5033807632</title>\n",
+       "<path d=\"M804.509,-779.683C784.178,-769.683 760.415,-757.995 739.214,-747.567\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"740.507,-744.303 729.989,-743.03 737.418,-750.585 740.507,-744.303\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 5009279184 -->\n",
+       "<g class=\"node\" id=\"node4\"><title>5009279184</title>\n",
+       "<polygon fill=\"none\" points=\"564.206,-606.7 564.206,-656.3 798.468,-656.3 798.468,-606.7 564.206,-606.7\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"616.341\" y=\"-627.3\">lstm_1 (LSTM)</text>\n",
+       "<polyline fill=\"none\" points=\"668.476,-606.7 668.476,-656.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"696.311\" y=\"-639.7\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"668.476,-631.5 724.147,-631.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"696.311\" y=\"-614.9\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"724.147,-606.7 724.147,-656.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"761.308\" y=\"-639.7\">(1, 1, 133)</text>\n",
+       "<polyline fill=\"none\" points=\"724.147,-631.5 798.468,-631.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"761.308\" y=\"-614.9\">(1, 256)</text>\n",
+       "</g>\n",
+       "<!-- 5033807632&#45;&gt;5009279184 -->\n",
+       "<g class=\"edge\" id=\"edge3\"><title>5033807632-&gt;5009279184</title>\n",
+       "<path d=\"M681.337,-693.083C681.337,-684.867 681.337,-675.512 681.337,-666.652\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"684.837,-666.577 681.337,-656.577 677.837,-666.577 684.837,-666.577\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 5074307728 -->\n",
+       "<g class=\"node\" id=\"node5\"><title>5074307728</title>\n",
+       "<polygon fill=\"none\" points=\"545.94,-520.1 545.94,-569.7 816.734,-569.7 816.734,-520.1 545.94,-520.1\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"623.341\" y=\"-540.7\">relu_lstm_1 (Activation)</text>\n",
+       "<polyline fill=\"none\" points=\"700.741,-520.1 700.741,-569.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"728.577\" y=\"-553.1\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"700.741,-544.9 756.413,-544.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"728.577\" y=\"-528.3\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"756.413,-520.1 756.413,-569.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"786.574\" y=\"-553.1\">(1, 256)</text>\n",
+       "<polyline fill=\"none\" points=\"756.413,-544.9 816.734,-544.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"786.574\" y=\"-528.3\">(1, 256)</text>\n",
+       "</g>\n",
+       "<!-- 5009279184&#45;&gt;5074307728 -->\n",
+       "<g class=\"edge\" id=\"edge4\"><title>5009279184-&gt;5074307728</title>\n",
+       "<path d=\"M681.337,-606.483C681.337,-598.267 681.337,-588.912 681.337,-580.052\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"684.837,-579.977 681.337,-569.977 677.837,-579.977 684.837,-579.977\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4508958928 -->\n",
+       "<g class=\"node\" id=\"node6\"><title>4508958928</title>\n",
+       "<polygon fill=\"none\" points=\"521.863,-433.5 521.863,-483.1 840.811,-483.1 840.811,-433.5 521.863,-433.5\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"616.341\" y=\"-454.1\">repeatvector_2 (RepeatVector)</text>\n",
+       "<polyline fill=\"none\" points=\"710.818,-433.5 710.818,-483.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"738.654\" y=\"-466.5\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"710.818,-458.3 766.49,-458.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"738.654\" y=\"-441.7\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"766.49,-433.5 766.49,-483.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"803.65\" y=\"-466.5\">(1, 256)</text>\n",
+       "<polyline fill=\"none\" points=\"766.49,-458.3 840.811,-458.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"803.65\" y=\"-441.7\">(1, 1, 256)</text>\n",
+       "</g>\n",
+       "<!-- 5074307728&#45;&gt;4508958928 -->\n",
+       "<g class=\"edge\" id=\"edge5\"><title>5074307728-&gt;4508958928</title>\n",
+       "<path d=\"M681.337,-519.883C681.337,-511.667 681.337,-502.312 681.337,-493.452\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"684.837,-493.377 681.337,-483.377 677.837,-493.377 684.837,-493.377\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4738189776 -->\n",
+       "<g class=\"node\" id=\"node7\"><title>4738189776</title>\n",
+       "<polygon fill=\"none\" points=\"564.206,-346.9 564.206,-396.5 798.468,-396.5 798.468,-346.9 564.206,-346.9\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"616.341\" y=\"-367.5\">lstm_2 (LSTM)</text>\n",
+       "<polyline fill=\"none\" points=\"668.476,-346.9 668.476,-396.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"696.311\" y=\"-379.9\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"668.476,-371.7 724.147,-371.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"696.311\" y=\"-355.1\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"724.147,-346.9 724.147,-396.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"761.308\" y=\"-379.9\">(1, 1, 256)</text>\n",
+       "<polyline fill=\"none\" points=\"724.147,-371.7 798.468,-371.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"761.308\" y=\"-355.1\">(1, 256)</text>\n",
+       "</g>\n",
+       "<!-- 4508958928&#45;&gt;4738189776 -->\n",
+       "<g class=\"edge\" id=\"edge6\"><title>4508958928-&gt;4738189776</title>\n",
+       "<path d=\"M681.337,-433.283C681.337,-425.067 681.337,-415.712 681.337,-406.852\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"684.837,-406.777 681.337,-396.777 677.837,-406.777 684.837,-406.777\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4599983056 -->\n",
+       "<g class=\"node\" id=\"node8\"><title>4599983056</title>\n",
+       "<polygon fill=\"none\" points=\"545.94,-260.3 545.94,-309.9 816.734,-309.9 816.734,-260.3 545.94,-260.3\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"623.341\" y=\"-280.9\">relu_lstm_2 (Activation)</text>\n",
+       "<polyline fill=\"none\" points=\"700.741,-260.3 700.741,-309.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"728.577\" y=\"-293.3\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"700.741,-285.1 756.413,-285.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"728.577\" y=\"-268.5\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"756.413,-260.3 756.413,-309.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"786.574\" y=\"-293.3\">(1, 256)</text>\n",
+       "<polyline fill=\"none\" points=\"756.413,-285.1 816.734,-285.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"786.574\" y=\"-268.5\">(1, 256)</text>\n",
+       "</g>\n",
+       "<!-- 4738189776&#45;&gt;4599983056 -->\n",
+       "<g class=\"edge\" id=\"edge7\"><title>4738189776-&gt;4599983056</title>\n",
+       "<path d=\"M681.337,-346.683C681.337,-338.467 681.337,-329.112 681.337,-320.252\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"684.837,-320.177 681.337,-310.177 677.837,-320.177 684.837,-320.177\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4495123344 -->\n",
+       "<g class=\"node\" id=\"node9\"><title>4495123344</title>\n",
+       "<polygon fill=\"none\" points=\"41.5028,-173.7 41.5028,-223.3 267.171,-223.3 267.171,-173.7 41.5028,-173.7\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"96.3405\" y=\"-194.3\">dense_2 (Dense)</text>\n",
+       "<polyline fill=\"none\" points=\"151.178,-173.7 151.178,-223.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"179.014\" y=\"-206.7\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"151.178,-198.5 206.85,-198.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"179.014\" y=\"-181.9\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"206.85,-173.7 206.85,-223.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"237.011\" y=\"-206.7\">(1, 256)</text>\n",
+       "<polyline fill=\"none\" points=\"206.85,-198.5 267.171,-198.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"237.011\" y=\"-181.9\">(1, 5)</text>\n",
+       "</g>\n",
+       "<!-- 4599983056&#45;&gt;4495123344 -->\n",
+       "<g class=\"edge\" id=\"edge8\"><title>4599983056-&gt;4495123344</title>\n",
+       "<path d=\"M545.577,-263.534C471.308,-252.135 377.702,-237.529 294.337,-223.8 288.86,-222.898 283.265,-221.967 277.614,-221.019\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"277.838,-217.507 267.395,-219.296 276.674,-224.41 277.838,-217.507\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4968395088 -->\n",
+       "<g class=\"node\" id=\"node10\"><title>4968395088</title>\n",
+       "<polygon fill=\"none\" points=\"303.503,-173.7 303.503,-223.3 529.171,-223.3 529.171,-173.7 303.503,-173.7\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"358.341\" y=\"-194.3\">dense_1 (Dense)</text>\n",
+       "<polyline fill=\"none\" points=\"413.178,-173.7 413.178,-223.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"441.014\" y=\"-206.7\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"413.178,-198.5 468.85,-198.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"441.014\" y=\"-181.9\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"468.85,-173.7 468.85,-223.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"499.011\" y=\"-206.7\">(1, 256)</text>\n",
+       "<polyline fill=\"none\" points=\"468.85,-198.5 529.171,-198.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"499.011\" y=\"-181.9\">(1, 1)</text>\n",
+       "</g>\n",
+       "<!-- 4599983056&#45;&gt;4968395088 -->\n",
+       "<g class=\"edge\" id=\"edge9\"><title>4599983056-&gt;4968395088</title>\n",
+       "<path d=\"M606.461,-260.196C573.586,-249.701 534.832,-237.329 500.919,-226.502\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"501.619,-223.052 491.028,-223.345 499.49,-229.72 501.619,-223.052\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4602434768 -->\n",
+       "<g class=\"node\" id=\"node12\"><title>4602434768</title>\n",
+       "<polygon fill=\"none\" points=\"568.503,-173.7 568.503,-223.3 794.171,-223.3 794.171,-173.7 568.503,-173.7\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"623.341\" y=\"-194.3\">dense_4 (Dense)</text>\n",
+       "<polyline fill=\"none\" points=\"678.178,-173.7 678.178,-223.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"706.014\" y=\"-206.7\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"678.178,-198.5 733.85,-198.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"706.014\" y=\"-181.9\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"733.85,-173.7 733.85,-223.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"764.011\" y=\"-206.7\">(1, 256)</text>\n",
+       "<polyline fill=\"none\" points=\"733.85,-198.5 794.171,-198.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"764.011\" y=\"-181.9\">(1, 10)</text>\n",
+       "</g>\n",
+       "<!-- 4599983056&#45;&gt;4602434768 -->\n",
+       "<g class=\"edge\" id=\"edge11\"><title>4599983056-&gt;4602434768</title>\n",
+       "<path d=\"M681.337,-260.083C681.337,-251.867 681.337,-242.512 681.337,-233.652\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"684.837,-233.577 681.337,-223.577 677.837,-233.577 684.837,-233.577\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4971146064 -->\n",
+       "<g class=\"node\" id=\"node13\"><title>4971146064</title>\n",
+       "<polygon fill=\"none\" points=\"836.503,-173.7 836.503,-223.3 1062.17,-223.3 1062.17,-173.7 836.503,-173.7\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"891.341\" y=\"-194.3\">dense_5 (Dense)</text>\n",
+       "<polyline fill=\"none\" points=\"946.178,-173.7 946.178,-223.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"974.014\" y=\"-206.7\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"946.178,-198.5 1001.85,-198.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"974.014\" y=\"-181.9\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"1001.85,-173.7 1001.85,-223.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"1032.01\" y=\"-206.7\">(1, 256)</text>\n",
+       "<polyline fill=\"none\" points=\"1001.85,-198.5 1062.17,-198.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"1032.01\" y=\"-181.9\">(1, 10)</text>\n",
+       "</g>\n",
+       "<!-- 4599983056&#45;&gt;4971146064 -->\n",
+       "<g class=\"edge\" id=\"edge12\"><title>4599983056-&gt;4971146064</title>\n",
+       "<path d=\"M757.06,-260.196C790.451,-249.656 829.837,-237.223 864.239,-226.363\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"865.318,-229.693 873.801,-223.345 863.211,-223.017 865.318,-229.693\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4765728400 -->\n",
+       "<g class=\"node\" id=\"node14\"><title>4765728400</title>\n",
+       "<polygon fill=\"none\" points=\"1116.5,-173.7 1116.5,-223.3 1342.17,-223.3 1342.17,-173.7 1116.5,-173.7\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"1171.34\" y=\"-194.3\">dense_6 (Dense)</text>\n",
+       "<polyline fill=\"none\" points=\"1226.18,-173.7 1226.18,-223.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"1254.01\" y=\"-206.7\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"1226.18,-198.5 1281.85,-198.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"1254.01\" y=\"-181.9\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"1281.85,-173.7 1281.85,-223.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"1312.01\" y=\"-206.7\">(1, 256)</text>\n",
+       "<polyline fill=\"none\" points=\"1281.85,-198.5 1342.17,-198.5 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"1312.01\" y=\"-181.9\">(1, 10)</text>\n",
+       "</g>\n",
+       "<!-- 4599983056&#45;&gt;4765728400 -->\n",
+       "<g class=\"edge\" id=\"edge13\"><title>4599983056-&gt;4765728400</title>\n",
+       "<path d=\"M816.798,-263.188C905.365,-249.515 1020.14,-231.796 1106.13,-218.52\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"1106.86,-221.949 1116.21,-216.965 1105.79,-215.031 1106.86,-221.949\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4743679824 -->\n",
+       "<g class=\"node\" id=\"node11\"><title>4743679824</title>\n",
+       "<polygon fill=\"none\" points=\"28.0028,-87.1 28.0028,-136.7 246.671,-136.7 246.671,-87.1 28.0028,-87.1\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"82.8405\" y=\"-107.7\">dense_3 (Dense)</text>\n",
+       "<polyline fill=\"none\" points=\"137.678,-87.1 137.678,-136.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"165.514\" y=\"-120.1\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"137.678,-111.9 193.35,-111.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"165.514\" y=\"-95.3\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"193.35,-87.1 193.35,-136.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"220.011\" y=\"-120.1\">(1, 5)</text>\n",
+       "<polyline fill=\"none\" points=\"193.35,-111.9 246.671,-111.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"220.011\" y=\"-95.3\">(1, 10)</text>\n",
+       "</g>\n",
+       "<!-- 4495123344&#45;&gt;4743679824 -->\n",
+       "<g class=\"edge\" id=\"edge10\"><title>4495123344-&gt;4743679824</title>\n",
+       "<path d=\"M149.511,-173.483C147.86,-165.267 145.98,-155.912 144.2,-147.052\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"147.577,-146.091 142.175,-136.977 140.714,-147.47 147.577,-146.091\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4448914256 -->\n",
+       "<g class=\"node\" id=\"node15\"><title>4448914256</title>\n",
+       "<polygon fill=\"none\" points=\"264.215,-87.1 264.215,-136.7 526.459,-136.7 526.459,-87.1 264.215,-87.1\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"344.341\" y=\"-107.7\">sigmoid_end (Activation)</text>\n",
+       "<polyline fill=\"none\" points=\"424.466,-87.1 424.466,-136.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"452.302\" y=\"-120.1\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"424.466,-111.9 480.137,-111.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"452.302\" y=\"-95.3\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"480.137,-87.1 480.137,-136.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"503.298\" y=\"-120.1\">(1, 1)</text>\n",
+       "<polyline fill=\"none\" points=\"480.137,-111.9 526.459,-111.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"503.298\" y=\"-95.3\">(1, 1)</text>\n",
+       "</g>\n",
+       "<!-- 4968395088&#45;&gt;4448914256 -->\n",
+       "<g class=\"edge\" id=\"edge14\"><title>4968395088-&gt;4448914256</title>\n",
+       "<path d=\"M410.375,-173.483C408.314,-165.178 405.963,-155.708 403.743,-146.763\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"407.12,-145.839 401.313,-136.977 400.326,-147.525 407.12,-145.839\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 5072433936 -->\n",
+       "<g class=\"node\" id=\"node19\"><title>5072433936</title>\n",
+       "<polygon fill=\"none\" points=\"-2.84217e-14,-0.5 -2.84217e-14,-50.1 274.674,-50.1 274.674,-0.5 -2.84217e-14,-0.5\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"82.8405\" y=\"-21.1\">softmax_prog (Activation)</text>\n",
+       "<polyline fill=\"none\" points=\"165.681,-0.5 165.681,-50.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"193.517\" y=\"-33.5\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"165.681,-25.3 221.353,-25.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"193.517\" y=\"-8.7\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"221.353,-0.5 221.353,-50.1 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"248.013\" y=\"-33.5\">(1, 10)</text>\n",
+       "<polyline fill=\"none\" points=\"221.353,-25.3 274.674,-25.3 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"248.013\" y=\"-8.7\">(1, 10)</text>\n",
+       "</g>\n",
+       "<!-- 4743679824&#45;&gt;5072433936 -->\n",
+       "<g class=\"edge\" id=\"edge18\"><title>4743679824-&gt;5072433936</title>\n",
+       "<path d=\"M137.337,-86.8833C137.337,-78.6673 137.337,-69.3117 137.337,-60.4518\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"140.837,-60.3767 137.337,-50.3767 133.837,-60.3768 140.837,-60.3767\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4971145232 -->\n",
+       "<g class=\"node\" id=\"node16\"><title>4971145232</title>\n",
+       "<polygon fill=\"none\" points=\"544.393,-87.1 544.393,-136.7 818.281,-136.7 818.281,-87.1 544.393,-87.1\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"626.841\" y=\"-107.7\">softmax_arg1 (Activation)</text>\n",
+       "<polyline fill=\"none\" points=\"709.288,-87.1 709.288,-136.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"737.124\" y=\"-120.1\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"709.288,-111.9 764.96,-111.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"737.124\" y=\"-95.3\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"764.96,-87.1 764.96,-136.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"791.621\" y=\"-120.1\">(1, 10)</text>\n",
+       "<polyline fill=\"none\" points=\"764.96,-111.9 818.281,-111.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"791.621\" y=\"-95.3\">(1, 10)</text>\n",
+       "</g>\n",
+       "<!-- 4602434768&#45;&gt;4971145232 -->\n",
+       "<g class=\"edge\" id=\"edge15\"><title>4602434768-&gt;4971145232</title>\n",
+       "<path d=\"M681.337,-173.483C681.337,-165.267 681.337,-155.912 681.337,-147.052\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"684.837,-146.977 681.337,-136.977 677.837,-146.977 684.837,-146.977\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4823026000 -->\n",
+       "<g class=\"node\" id=\"node17\"><title>4823026000</title>\n",
+       "<polygon fill=\"none\" points=\"836.393,-87.1 836.393,-136.7 1110.28,-136.7 1110.28,-87.1 836.393,-87.1\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"918.841\" y=\"-107.7\">softmax_arg2 (Activation)</text>\n",
+       "<polyline fill=\"none\" points=\"1001.29,-87.1 1001.29,-136.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"1029.12\" y=\"-120.1\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"1001.29,-111.9 1056.96,-111.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"1029.12\" y=\"-95.3\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"1056.96,-87.1 1056.96,-136.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"1083.62\" y=\"-120.1\">(1, 10)</text>\n",
+       "<polyline fill=\"none\" points=\"1056.96,-111.9 1110.28,-111.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"1083.62\" y=\"-95.3\">(1, 10)</text>\n",
+       "</g>\n",
+       "<!-- 4971146064&#45;&gt;4823026000 -->\n",
+       "<g class=\"edge\" id=\"edge16\"><title>4971146064-&gt;4823026000</title>\n",
+       "<path d=\"M956.15,-173.483C958.506,-165.178 961.193,-155.708 963.73,-146.763\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"967.145,-147.552 966.507,-136.977 960.41,-145.642 967.145,-147.552\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "<!-- 4744310288 -->\n",
+       "<g class=\"node\" id=\"node18\"><title>4744310288</title>\n",
+       "<polygon fill=\"none\" points=\"1128.39,-87.1 1128.39,-136.7 1402.28,-136.7 1402.28,-87.1 1128.39,-87.1\" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"1210.84\" y=\"-107.7\">softmax_arg3 (Activation)</text>\n",
+       "<polyline fill=\"none\" points=\"1293.29,-87.1 1293.29,-136.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"1321.12\" y=\"-120.1\">input:</text>\n",
+       "<polyline fill=\"none\" points=\"1293.29,-111.9 1348.96,-111.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"1321.12\" y=\"-95.3\">output:</text>\n",
+       "<polyline fill=\"none\" points=\"1348.96,-87.1 1348.96,-136.7 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"1375.62\" y=\"-120.1\">(1, 10)</text>\n",
+       "<polyline fill=\"none\" points=\"1348.96,-111.9 1402.28,-111.9 \" stroke=\"black\"/>\n",
+       "<text font-family=\"Times,serif\" font-size=\"14.00\" text-anchor=\"middle\" x=\"1375.62\" y=\"-95.3\">(1, 10)</text>\n",
+       "</g>\n",
+       "<!-- 4765728400&#45;&gt;4744310288 -->\n",
+       "<g class=\"edge\" id=\"edge17\"><title>4765728400-&gt;4744310288</title>\n",
+       "<path d=\"M1239.56,-173.483C1243.17,-164.999 1247.29,-155.3 1251.17,-146.187\" fill=\"none\" stroke=\"black\"/>\n",
+       "<polygon fill=\"black\" points=\"1254.4,-147.549 1255.09,-136.977 1247.96,-144.808 1254.4,-147.549\" stroke=\"black\"/>\n",
+       "</g>\n",
+       "</g>\n",
+       "</svg>"
+      ],
+      "text/plain": [
+       "<IPython.core.display.SVG object>"
+      ]
+     },
+     "execution_count": 8,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "SVG('model.svg')"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Fitting\n",
+    "The actual code to fit the model with the training data"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "training f_enc\n",
+      "ep   0: loss=1.03819\n",
+      "ep   1: loss=0.242629\n",
+      "ep   2: loss=0.094752\n",
+      "ep   3: loss=0.0467588\n",
+      "ep   4: loss=0.0263074\n",
+      "ep   5: loss=0.0160311\n",
+      "ep   6: loss=0.0102503\n",
+      "ep   7: loss=0.00677445\n",
+      "ep   8: loss=0.00456079\n",
+      "ep   9: loss=0.00311668\n",
+      "ep  10: loss=0.00214863\n",
+      "ep  11: loss=0.00149294\n",
+      "ep  12: loss=0.00103956\n",
+      "ep  13: loss=0.000728405\n",
+      "ep  14: loss=0.000511663\n",
+      "ep  15: loss=0.000359279\n",
+      "ep  16: loss=0.000252763\n",
+      "ep  17: loss=0.000177881\n",
+      "ep  18: loss=0.000125569\n",
+      "ep  19: loss=8.86349e-05\n",
+      "ep  20: loss=6.25864e-05\n",
+      "ep  21: loss=4.4173e-05\n",
+      "ep  22: loss=3.12042e-05\n",
+      "ep  23: loss=2.20769e-05\n",
+      "ep  24: loss=1.56068e-05\n",
+      "ep  25: loss=1.10763e-05\n",
+      "ep  26: loss=7.82133e-06\n",
+      "ep  27: loss=5.57107e-06\n",
+      "ep  28: loss=3.95074e-06\n",
+      "ep  29: loss=2.81476e-06\n",
+      "ep  30: loss=2.01948e-06\n",
+      "ep  31: loss=1.45326e-06\n",
+      "ep  32: loss=1.0526e-06\n",
+      "ep  33: loss=7.7144e-07\n",
+      "Re-Compile Model lr=0.0001 aw=1.0\n",
+      "training questions of a<100 and b<100"
+     ]
+    }
+   ],
+   "source": [
+    "npi_model.fit(steps_list)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 2",
+   "language": "python",
+   "name": "python2"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 2
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython2",
+   "version": "2.7.12"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 0
+}
diff --git a/src/npi/add/model.py b/src/npi/add/model.py
index 32e70bd..7cb6dc3 100644
--- a/src/npi/add/model.py
+++ b/src/npi/add/model.py
@@ -16,7 +16,8 @@
 from keras.models import Sequential, model_from_yaml
 from keras.optimizers import Adam
 from keras.regularizers import l1, l2
-from keras.utils.visualize_util import plot
+from keras.utils.visualize_util import model_to_dot
+
 
 from npi.add.config import FIELD_ROW, FIELD_DEPTH, PROGRAM_VEC_SIZE, PROGRAM_KEY_VEC_SIZE, FIELD_WIDTH
 from npi.add.lib import AdditionProgramSet, AdditionEnv, run_npi, create_questions, AdditionTeacher, \
@@ -28,6 +29,11 @@
 
 __author__ = 'k_morishita'
 
+def plot(in_model, to_file, **kwargs):
+    """
+    An SVG-writing replacement for keras' plot(): renders in_model with model_to_dot and writes the SVG to to_file.
+    """
+    return model_to_dot(in_model, **kwargs).write_svg(to_file)
 
 class AdditionNPIModel(NPIStep):
     model = None
@@ -65,11 +71,11 @@ def build(self):
         f_lstm = Sequential(name='f_lstm')
         f_lstm.add(Merge([f_enc_convert, program_embedding], mode='concat'))
         f_lstm.add(LSTM(256, return_sequences=False, stateful=True, W_regularizer=l2(0.0000001)))
-        f_lstm.add(Activation('rel', name='relu_lstm_1'))
+        f_lstm.add(Activation('relu', name='relu_lstm_1'))
         f_lstm.add(RepeatVector(1))
         f_lstm.add(LSTM(256, return_sequences=False, stateful=True, W_regularizer=l2(0.0000001)))
-        f_lstm.add(Activation('rel', name='relu_lstm_2'))
-        # plot(f_lstm, to_file='f_lstm.png', show_shapes=True)
+        f_lstm.add(Activation('relu', name='relu_lstm_2'))
+        plot(f_lstm, to_file='f_lstm.svg', show_shapes=True)
 
         f_end = Sequential(name='f_end')
         f_end.add(f_lstm)
@@ -78,10 +84,10 @@ def build(self):
 
         f_prog = Sequential(name='f_prog')
         f_prog.add(f_lstm)
-        f_prog.add(Dense(PROGRAM_KEY_VEC_SIZE, activation="rel"))
+        f_prog.add(Dense(PROGRAM_KEY_VEC_SIZE, activation="relu"))
         f_prog.add(Dense(PROGRAM_VEC_SIZE, W_regularizer=l2(0.0001)))
         f_prog.add(Activation('softmax', name='softmax_prog'))
-        # plot(f_prog, to_file='f_prog.png', show_shapes=True)
+        plot(f_prog, to_file='f_prog.svg', show_shapes=True)
 
         f_args = []
         for ai in xrange(1, IntegerArguments.max_arg_num+1):
@@ -96,7 +102,7 @@ def build(self):
                            [f_end.output, f_prog.output] + [fa.output for fa in f_args],
                            name="npi")
         self.compile_model()
-        plot(self.model, to_file='model.png', show_shapes=True)
+        plot(self.model, to_file='model.svg', show_shapes=True)
 
     def reset(self):
         super(AdditionNPIModel, self).reset()
@@ -265,8 +271,7 @@ def do_learn(self, steps_list, epoch, pass_rate=1.0, skip_correct=False):
                     last_weights = self.model.get_weights()
             if losses:
                 cur_loss = np.average(losses)
-                print "ep=%2d: ok_rate=%.2f%% (+%s -%s): ave loss %s (%s samples)" %
-                      (ep, np.average(ok_rate)*100, correct_new, wrong_new, cur_loss, len(steps_list))
+                print "ep=%2d: ok_rate=%.2f%% (+%s -%s): ave loss %s (%s samples)" % (ep, np.average(ok_rate)*100, correct_new, wrong_new, cur_loss, len(steps_list))
                 # self.print_weights()
                 if correct_new + wrong_new == 0:
                     no_change_count += 1