This patch is for better numerical behaviors:

- Add alpha, get_scale function for binary and ternary quantizers. - Control the initial weight distribution with respect to fan-in of layers. PiperOrigin-RevId: 302736657 Change-Id: I296d8fe267f9fb47e45ad3bdddac1d7a332c155c
google · Mar 24, 2020 · 244ebe8 · 244ebe8
1 parent 01a61fb
commit 244ebe8
Show file tree

Hide file tree

Showing 21 changed files with 2,604 additions and 559 deletions.
diff --git a/CHANGELOG b/CHANGELOG
@@ -1,2 +1,3 @@
-v0.5, 07/18/2019 -- Initial release.
-v0.6, 12/03/2019 -- Support tensorflow 2.0 and tf.keras
+v0.5, 2019/07 -- Initial release.
+v0.6, 2020/03 -- Support tensorflow 2.0, tf.keras and python3.
+v0.7, 2020/03 -- Enhancemence of binary and ternary quantization.
diff --git a/README.md b/README.md
@@ -137,6 +137,7 @@ that accept an alpha parameter, we need to specify a range of alpha,
 and for po2 type of quantizers, we need to specify the range of
 max_value.
 
+
 ### Example
 
 Suppose you have the following network.

diff --git a/examples/example_ternary.py b/examples/example_ternary.py
@@ -0,0 +1,113 @@
+# Copyright 2020 Google LLC
+#
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+from __future__ import absolute_import  # Not necessary in a Python 3-only module
+from __future__ import division  # Not necessary in a Python 3-only module
+from __future__ import google_type_annotations  # Not necessary in a Python 3-only module
+from __future__ import print_function  # Not necessary in a Python 3-only module
+
+from absl import app
+from absl import flags
+import matplotlib
+import numpy as np
+
+matplotlib.use('TkAgg')
+import matplotlib.pyplot as plt
+
+
+FLAGS = flags.FLAGS
+
+
+def _stochastic_rounding(x, precision, resolution, delta):
+  """Stochastic_rounding for ternary.
+
+  Args:
+    x:
+    precision: A float. The area we want to make this stochastic rounding.
+       [delta-precision, delta] [delta, delta+precision]
+    resolution: control the quantization resolution.
+    delta: the undiscountinued point (positive number)
+
+  Return:
+    A tensor with stochastic rounding numbers.
+  """
+  delta_left = delta - precision
+  delta_right = delta + precision
+  scale = 1 / resolution
+  scale_delta_left = delta_left * scale
+  scale_delta_right = delta_right * scale
+  scale_2_delta = scale_delta_right - scale_delta_left
+  scale_x = x * scale
+  fraction = scale_x - scale_delta_left
+  # print(precision, scale, x[0], np.floor(scale_x[0]), scale_x[0], fraction[0])
+
+  # we use uniform distribution
+  random_selector = np.random.uniform(0, 1, size=x.shape) * scale_2_delta
+
+  # print(precision, scale, x[0], delta_left[0], delta_right[0])
+  # print('x', scale_x[0], fraction[0], random_selector[0], scale_2_delta[0])
+  # rounddown = fraction < random_selector
+  result = np.where(fraction < random_selector,
+                    scale_delta_left / scale,
+                    scale_delta_right / scale)
+  return result
+
+
+def _ternary(x, sto=False):
+  m = np.amax(np.abs(x), keepdims=True)
+  scale = 2 * m / 3.0
+  thres = scale / 2.0
+  ratio = 0.1
+
+  if sto:
+    sign_bit = np.sign(x)
+    x = np.abs(x)
+    prec = x / scale
+    x = (
+        sign_bit * scale * _stochastic_rounding(
+            x / scale,
+            precision=0.3, resolution=0.01, # those two are all normalized.
+            delta=thres / scale))
+    # prec + prec *ratio)
+    # mm = np.amax(np.abs(x), keepdims=True)
+  return np.where(np.abs(x) < thres, np.zeros_like(x), np.sign(x))
+
+
+def main(argv):
+  if len(argv) > 1:
+    raise app.UsageError('Too many command-line arguments.')
+
+  # x = np.arange(-3.0, 3.0, 0.01)
+  # x = np.random.uniform(-0.01, 0.01, size=1000)
+  x = np.random.uniform(-10.0, 10.0, size=1000)
+  # x = np.random.uniform(-1, 1, size=1000)
+  x = np.sort(x)
+  tr = np.zeros_like(x)
+  t = np.zeros_like(x)
+  iter_count = 500
+  for _ in range(iter_count):
+    y = _ternary(x)
+    yr = _ternary(x, sto=True)
+    t = t + y
+    tr = tr + yr
+
+  plt.plot(x, t/iter_count)
+  plt.plot(x, tr/iter_count)
+  plt.ylabel('mean (%s samples)' % iter_count)
+  plt.show()
+
+
+if __name__ == '__main__':
+  app.run(main)
diff --git a/notebook/QKerasTutorial.ipynb b/notebook/QKerasTutorial.ipynb
diff --git a/notebook/images/figure1.png b/notebook/images/figure1.png
diff --git a/notebook/images/figure2.png b/notebook/images/figure2.png
diff --git a/qkeras/__init__.py b/qkeras/__init__.py
@@ -27,4 +27,4 @@
 from .qpooling import *  # pylint: disable=wildcard-import
 from .safe_eval import *  # pylint: disable=wildcard-import
 
-__version__ = "0.6.0"
+__version__ = "0.7.0"