Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Add SPSA optimizer #653

Merged
merged 39 commits into from
Jan 20, 2022
Merged
Show file tree
Hide file tree
Changes from 37 commits
Commits
Show all changes
39 commits
Select commit Hold shift + click to select a range
9b0628b
Create spsa_minimizer.py
lockwo Jan 5, 2022
0486c45
Update spsa_minimizer.py
lockwo Jan 5, 2022
7b74ccb
Update __init__.py
lockwo Jan 5, 2022
833b8c8
Create spsa_minimizer_test.py
lockwo Jan 5, 2022
522bf08
Update __init__.py
lockwo Jan 6, 2022
33e607f
Update spsa_minimizer.py
lockwo Jan 6, 2022
ba92437
Update spsa_minimizer.py
lockwo Jan 6, 2022
363af00
Update spsa_minimizer.py
lockwo Jan 6, 2022
ba8668a
Update spsa_minimizer.py
lockwo Jan 6, 2022
a7471e6
Update spsa_minimizer.py
lockwo Jan 6, 2022
fc0e0ef
Update spsa_minimizer_test.py
lockwo Jan 6, 2022
0144889
Update spsa_minimizer.py
lockwo Jan 6, 2022
728d55e
Update spsa_minimizer.py
lockwo Jan 6, 2022
5d49981
Update spsa_minimizer_test.py
lockwo Jan 6, 2022
7daf326
Update spsa_minimizer.py
lockwo Jan 6, 2022
c2b9ebd
Update spsa_minimizer.py
lockwo Jan 6, 2022
d145b6a
Update spsa_minimizer.py
lockwo Jan 6, 2022
54f01ea
Update spsa_minimizer.py
lockwo Jan 6, 2022
5a2dd0f
Update spsa_minimizer.py
lockwo Jan 6, 2022
ad542c0
Update import_test.py
lockwo Jan 6, 2022
35558bb
Update BUILD
lockwo Jan 6, 2022
4707477
Update BUILD
lockwo Jan 6, 2022
64e5c9a
Update build_docs.py
lockwo Jan 6, 2022
09679ce
Update spsa_minimizer.py
lockwo Jan 13, 2022
3fdc0c3
Update spsa_minimizer_test.py
lockwo Jan 13, 2022
65b6b3b
Update spsa_minimizer_test.py
lockwo Jan 13, 2022
4a3edbf
Update spsa_minimizer.py
lockwo Jan 13, 2022
412adf4
Update spsa_minimizer.py
lockwo Jan 13, 2022
654f398
Update spsa_minimizer_test.py
lockwo Jan 13, 2022
14e9e04
Update spsa_minimizer.py
lockwo Jan 13, 2022
00d982f
Update spsa_minimizer_test.py
lockwo Jan 13, 2022
e71d8e2
Update spsa_minimizer.py
lockwo Jan 13, 2022
73f1e4f
Update rotosolve_minimizer_test.py
lockwo Jan 13, 2022
2663722
Update spsa_minimizer_test.py
lockwo Jan 13, 2022
d47a968
Update spsa_minimizer_test.py
lockwo Jan 13, 2022
490dd7a
Update rotosolve_minimizer_test.py
lockwo Jan 13, 2022
de57af9
Update spsa_minimizer_test.py
lockwo Jan 13, 2022
9bd74f0
Update spsa_minimizer.py
lockwo Jan 18, 2022
8997511
Merge branch 'master' into master
MichaelBroughton Jan 19, 2022
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions release/BUILD
Original file line number Diff line number Diff line change
Expand Up @@ -65,5 +65,6 @@ sh_binary(
"//tensorflow_quantum/python:quantum_context",
"//tensorflow_quantum/python:util",
"//tensorflow_quantum/python/optimizers:rotosolve_minimizer",
"//tensorflow_quantum/python/optimizers:spsa_minimizer",
],
)
2 changes: 1 addition & 1 deletion scripts/build_docs.py
Original file line number Diff line number Diff line change
Expand Up @@ -67,7 +67,7 @@ def main(unused_argv):
"parameter_shift_util", "adjoint"
],
"tfq.datasets": ["cluster_state"],
"tfq.optimizers": ["rotosolve_minimizer"],
"tfq.optimizers": ["rotosolve_minimizer", "spsa_minimizer"],
"tfq.util": [
"from_tensor", "convert_to_tensor", "exp_identity",
"check_commutability", "kwargs_cartesian_product",
Expand Down
1 change: 1 addition & 0 deletions scripts/import_test.py
Original file line number Diff line number Diff line change
Expand Up @@ -81,6 +81,7 @@ def test_imports():

#Optimizers
_ = tfq.optimizers.rotosolve_minimize
_ = tfq.optimizers.spsa_minimize


if __name__ == "__main__":
Expand Down
17 changes: 17 additions & 0 deletions tensorflow_quantum/python/optimizers/BUILD
Original file line number Diff line number Diff line change
Expand Up @@ -11,6 +11,7 @@ py_library(
srcs_version = "PY3",
deps = [
":rotosolve_minimizer",
":spsa_minimizer",
],
)

Expand All @@ -19,6 +20,11 @@ py_library(
srcs = ["rotosolve_minimizer.py"],
)

py_library(
name = "spsa_minimizer",
srcs = ["spsa_minimizer.py"],
)

py_test(
name = "rotosolve_minimizer_test",
srcs = ["rotosolve_minimizer_test.py"],
Expand All @@ -29,3 +35,14 @@ py_test(
"//tensorflow_quantum/python/layers/high_level:pqc",
],
)

py_test(
name = "spsa_minimizer_test",
srcs = ["spsa_minimizer_test.py"],
python_version = "PY3",
deps = [
":spsa_minimizer",
"//tensorflow_quantum/core/ops:tfq_ps_util_ops_py",
"//tensorflow_quantum/python/layers/high_level:pqc",
],
)
2 changes: 2 additions & 0 deletions tensorflow_quantum/python/optimizers/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -17,3 +17,5 @@
# Quantum circuit specific optimizers.
from tensorflow_quantum.python.optimizers.rotosolve_minimizer import (
minimize as rotosolve_minimize)
from tensorflow_quantum.python.optimizers.spsa_minimizer import (minimize as
spsa_minimize)
Original file line number Diff line number Diff line change
Expand Up @@ -35,13 +35,11 @@
def loss_function_with_model_parameters(model, loss, train_x, train_y):
"""Create a new function that assign the model parameter to the model
and evaluate its value.

Args:
model : an instance of `tf.keras.Model` or its subclasses.
loss : a function with signature loss_value = loss(pred_y, true_y).
train_x : the input part of training data.
train_y : the output part of training data.

Returns:
A function that has a signature of:
loss_value = f(model_parameters).
Expand All @@ -62,10 +60,8 @@ def loss_function_with_model_parameters(model, loss, train_x, train_y):
@tf.function
def func(params):
"""A function that can be used by tfq.optimizer.rotosolve_minimize.

Args:
params [in]: a 1D tf.Tensor.

Returns:
Loss function value
"""
Expand Down
276 changes: 276 additions & 0 deletions tensorflow_quantum/python/optimizers/spsa_minimizer.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,276 @@
# Copyright 2021 The TensorFlow Quantum Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""The SPSA minimization algorithm"""
import collections
import tensorflow as tf
import numpy as np


def prefer_static_shape(x):
"""Return static shape of tensor `x` if available,

else `tf.shape(x)`.

Args:
x: `tf.Tensor` (already converted).
Returns:
Numpy array (if static shape is obtainable), else `tf.Tensor`.
"""
return prefer_static_value(tf.shape(x))


def prefer_static_value(x):
"""Return static value of tensor `x` if available, else `x`.

Args:
x: `tf.Tensor` (already converted).
Returns:
Numpy array (if static value is obtainable), else `tf.Tensor`.
"""
static_x = tf.get_static_value(x)
if static_x is not None:
return static_x
return x


SPSAOptimizerResults = collections.namedtuple(
'SPSAOptimizerResults',
[
'converged',
# Scalar boolean tensor indicating whether the minimum
# was found within tolerance.
'num_iterations',
# The number of iterations of the SPSA update.
'num_objective_evaluations',
# The total number of objective
# evaluations performed.
'position',
# A tensor containing the last argument value found
# during the search. If the search converged, then
# this value is the argmin of the objective function.
# A tensor containing the value of the objective from
# previous iteration
'objective_value_previous_iteration',
# Save the evaluated value of the objective function
# from the previous iteration
'objective_value',
# A tensor containing the value of the objective
# function at the `position`. If the search
# converged, then this is the (local) minimum of
# the objective function.
'tolerance',
# Define the stop criteria. Iteration will stop when the
# objective value difference between two iterations is
# smaller than tolerance
'lr',
# Specifies the learning rate
'alpha',
# Specifies scaling of the learning rate
'perturb',
# Specifies the size of the perturbations
'gamma',
# Specifies scaling of the size of the perturbations
'blocking',
# If true, then the optimizer will only accept updates that improve
# the objective function.
'allowed_increase'
# Specifies maximum allowable increase in objective function
# (only applies if blocking is true).
])


def _get_initial_state(initial_position, tolerance, expectation_value_function,
lr, alpha, perturb, gamma, blocking, allowed_increase):
"""Create SPSAOptimizerResults with initial state of search."""
init_args = {
"converged": tf.Variable(False),
"num_iterations": tf.Variable(0),
"num_objective_evaluations": tf.Variable(0),
"position": tf.Variable(initial_position),
"objective_value": tf.Variable(0.),
"objective_value_previous_iteration": tf.Variable(np.inf),
"tolerance": tolerance,
"lr": tf.Variable(lr),
"alpha": tf.Variable(alpha),
"perturb": tf.Variable(perturb),
"gamma": tf.Variable(gamma),
"blocking": tf.Variable(blocking),
"allowed_increase": tf.Variable(allowed_increase)
}
return SPSAOptimizerResults(**init_args)


def minimize(expectation_value_function,
initial_position,
tolerance=1e-5,
max_iterations=200,
alpha=0.602,
lr=1.0,
perturb=1.0,
gamma=0.101,
blocking=False,
allowed_increase=0.5,
seed=None,
name=None):
"""Applies the SPSA algorithm.

The SPSA algorithm can be used to minimize a noisy function. See:

[SPSA website](https://www.jhuapl.edu/SPSA/)

Usage:

Here is an example of optimize a function which consists the
summation of a few quadratics.

>>> n = 5 # Number of quadractics
>>> coefficient = tf.random.uniform(minval=0, maxval=1, shape=[n])
>>> min_value = 0
>>> func = func = lambda x : tf.math.reduce_sum(np.power(x, 2) * \
coefficient)
>>> # Optimize the function with SPSA, start with random parameters
>>> result = tfq.optimizers.spsa_minimize(func, np.random.random(n))
>>> result.converged
tf.Tensor(True, shape=(), dtype=bool)
>>> result.objective_value
tf.Tensor(0.0013349084, shape=(), dtype=float32)

Args:
expectation_value_function: Python callable that accepts a real
valued tf.Tensor with shape [n] where n is the number of function
parameters. The return value is a real `tf.Tensor` Scalar
(matching shape `[1]`).
initial_position: Real `tf.Tensor` of shape `[n]`. The starting
point, or points when using batching dimensions, of the search
procedure. At these points the function value and the gradient
norm should be finite.
tolerance: Scalar `tf.Tensor` of real dtype. Specifies the tolerance
for the procedure. If the supremum norm between two iteration
vector is below this number, the algorithm is stopped.
a: Scalar `tf.Tensor` of real dtype. Specifies the learning rate
alpha: Scalar `tf.Tensor` of real dtype. Specifies scaling of the
learning rate.
c: Scalar `tf.Tensor` of real dtype. Specifies the size of the
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Nit: Need to update the names here.

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Updated

perturbations.
gamma: Scalar `tf.Tensor` of real dtype. Specifies scaling of the
size of the perturbations.
blocking: Boolean. If true, then the optimizer will only accept
updates that improve the objective function.
allowed_increase: Scalar `tf.Tensor` of real dtype. Specifies maximum
allowable increase in objective function (only applies if blocking
is true).
name: (Optional) Python `str`. The name prefixed to the ops created
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Nit: Need to add seed.

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Added

by this function. If not supplied, the default name 'minimize'
is used.

Returns:
optimizer_results: A SPSAOptimizerResults object contains the
result of the optimization process.
"""

with tf.name_scope(name or 'minimize'):
if seed is not None:
tf.random.set_seed(seed)
Copy link
Collaborator

@MichaelBroughton MichaelBroughton Jan 16, 2022

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

This is setting the global seed, which we don't want (it will impact code outside of this function). Something like this might be a little better:

g = tf.random.Generator.from_seed(1234)
g.normal(shape=(2, 3)) # produces same output as tf.random.normal, but from the seed in g.

Ideally all random ops in this function should draw from g

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Updated. There is only 1 random op (for the deltas), but it now draws from the generator.


initial_position = tf.convert_to_tensor(initial_position,
name='initial_position',
dtype='float32')
dtype = initial_position.dtype.base_dtype
tolerance = tf.convert_to_tensor(tolerance,
dtype=dtype,
name='grad_tolerance')
max_iterations = tf.convert_to_tensor(max_iterations,
name='max_iterations')

lr_init = tf.convert_to_tensor(lr, name='initial_a', dtype='float32')
perturb_init = tf.convert_to_tensor(perturb,
name='initial_c',
dtype='float32')

def _spsa_once(state):
"""Caclulate single SPSA gradient estimation

Args:
state: A SPSAOptimizerResults object stores the
current state of the minimizer.

Returns:
states: A list which the first element is the new state
"""
delta_shift = tf.cast(
2 * tf.random.uniform(shape=state.position.shape,
minval=0,
maxval=2,
dtype=tf.int32) - 1, tf.float32)
v_m = expectation_value_function(state.position -
state.perturb * delta_shift)
v_p = expectation_value_function(state.position +
state.perturb * delta_shift)

gradient_estimate = (v_p - v_m) / (2 * state.perturb) * delta_shift
update = state.lr * gradient_estimate

state.num_objective_evaluations.assign_add(2)

current_obj = expectation_value_function(state.position - update)
if state.objective_value_previous_iteration + \
state.allowed_increase >= current_obj or not state.blocking:
state.position.assign(state.position - update)
state.objective_value_previous_iteration.assign(
state.objective_value)
state.objective_value.assign(current_obj)

return [state]

# The `state` here is a `SPSAOptimizerResults` tuple with
# values for the current state of the algorithm computation.
def _cond(state):
"""Continue if iterations remain and stopping condition
is not met."""
return (state.num_iterations < max_iterations) \
and (not state.converged)

def _body(state):
"""Main optimization loop."""
new_lr = lr_init / (
(tf.cast(state.num_iterations + 1, tf.float32) +
0.01 * tf.cast(max_iterations, tf.float32))**state.alpha)
new_perturb = perturb_init / (tf.cast(state.num_iterations + 1,
tf.float32)**state.gamma)

state.lr.assign(new_lr)
state.perturb.assign(new_perturb)

_spsa_once(state)
state.num_iterations.assign_add(1)
state.converged.assign(
tf.abs(state.objective_value -
state.objective_value_previous_iteration) <
state.tolerance)
return [state]

initial_state = _get_initial_state(initial_position, tolerance,
expectation_value_function, lr,
alpha, perturb, gamma, blocking,
allowed_increase)

initial_state.objective_value.assign(
tf.cast(expectation_value_function(initial_state.position),
tf.float32))

return tf.while_loop(cond=_cond,
body=_body,
loop_vars=[initial_state],
parallel_iterations=1)[0]
Loading