From b3c3bf60e0ecc572afef71b797c7623073bdf8d3 Mon Sep 17 00:00:00 2001 From: Divyashree Sreepathihalli Date: Fri, 1 Dec 2023 13:42:02 -0800 Subject: [PATCH] Simplify running KerasCV with Keras 3 (#2179) * remove keras_core dependency * update init * update readme * fix model None error (#2176) (#2177) * Update pycoco_callback.py * Update waymo_evaluation_callback.py * fix model None error (#2176) (#2178) * Update pycoco_callback.py * Update waymo_evaluation_callback.py * update readme and conftest * update readme * update citation list * fix mix transformer tests * fix lint error * fix all failing tests --- README.md | 61 +++++++++-------- keras_cv/backend/__init__.py | 20 +++++- keras_cv/backend/config.py | 66 +++---------------- keras_cv/backend/keras.py | 5 -- keras_cv/backend/ops.py | 9 ++- keras_cv/backend/scope.py | 4 +- keras_cv/conftest.py | 14 ++-- .../multi_class_non_max_suppression.py | 4 +- .../object_detection/non_max_suppression.py | 6 +- ...ectorized_base_image_augmentation_layer.py | 4 +- keras_cv/layers/spatial_pyramid.py | 4 +- keras_cv/losses/focal_test.py | 4 +- .../center_pillar_backbone_test.py | 4 +- .../object_detection_3d/center_pillar_test.py | 4 +- 14 files changed, 88 insertions(+), 121 deletions(-) diff --git a/README.md b/README.md index e4ad4bae14..6c7b97c9f2 100644 --- a/README.md +++ b/README.md @@ -7,10 +7,10 @@ [![Contributions Welcome](https://img.shields.io/badge/contributions-welcome-brightgreen.svg?style=flat)](https://github.com/keras-team/keras-cv/issues) KerasCV is a library of modular computer vision components that work natively -with TensorFlow, JAX, or PyTorch. Built on [Keras Core](https://keras.io/keras_core/announcement/), -these models, layers, metrics, callbacks, etc., can be trained and serialized -in any framework and re-used in another without costly migrations. See -"Configuring your backend" below for more details on multi-framework KerasCV. +with TensorFlow, JAX, or PyTorch. Built on Keras 3, these models, layers, +metrics, callbacks, etc., can be trained and serialized in any framework and +re-used in another without costly migrations. See "Configuring your backend" +below for more details on multi-framework KerasCV. @@ -34,29 +34,44 @@ these common tasks. - [API Design Guidelines](.github/API_DESIGN.md) ## Installation +KerasCV supports both Keras 2 and Keras 3. We recommend Keras 3 for all new +users, as it enables using KerasCV models and layers with JAX, TensorFlow and +PyTorch. -To install the latest official release: +### Keras 2 Installation + +To install the latest KerasCV release with Keras 2, simply run: ``` -pip install keras-cv tensorflow --upgrade +pip install --upgrade keras-cv tensorflow ``` -To install the latest unreleased changes to the library, we recommend using -pip to install directly from the master branch on github: +### Keras 3 Installation + +There are currently two ways to install Keras 3 with KerasCV. To install the +latest changes for KerasCV and Keras, you can use our nightly package. + ``` -pip install git+https://github.com/keras-team/keras-cv.git tensorflow --upgrade +pip install --upgrade keras-cv-nightly tf-nightly ``` -## Configuring your backend +To install the stable versions of KerasCV and Keras 3, you should install Keras +3 **after** installing KerasCV. This is a temporary step while TensorFlow is +pinned to Keras 2, and will no longer be necessary after TensorFlow 2.16. -**Keras 3** is an upcoming release of the Keras library which supports -TensorFlow, Jax or Torch as backends. This is supported today in KerasNLP, -but will not be enabled by default until the official release of Keras 3. If you -`pip install keras-cv` and run a script or notebook without changes, you will -be using TensorFlow and **Keras 2**. +``` +pip install --upgrade keras-cv tensorflow +pip install keras>=3 +``` +> [!IMPORTANT] +> Keras 3 will not function with TensorFlow 2.14 or earlier. + +## Configuring your backend -If you would like to enable a preview of the Keras 3 behavior, you can do +If you have Keras 3 installed in your environment (see installation above), +you can use KerasCV with any of JAX, TensorFlow and PyTorch. To do so, set the +`KERAS_BACKEND` environment variable. For example: so by setting the `KERAS_BACKEND` environment variable. For example: ```shell @@ -75,21 +90,13 @@ import keras_cv > [!IMPORTANT] > Make sure to set the `KERAS_BACKEND` before import any Keras libraries, it > will be used to set up Keras when it is first imported. -Until the Keras 3 release, KerasCV will use a preview of Keras 3 on PyPI named -[keras-core](https://pypi.org/project/keras-core/). - -> [!IMPORTANT] -> If you set `KERAS_BACKEND` variable, you should `import keras_core as keras` -> instead of `import keras`. This is a temporary step until Keras 3 is out! -To restore the default **Keras 2** behavior, `unset KERAS_BACKEND` before -importing Keras and KerasCV. Once that configuration step is done, you can just import KerasCV and start using it on top of your backend of choice: ```python import keras_cv -from keras_cv.backend import keras +import keras filepath = keras.utils.get_file(origin="https://i.imgur.com/gCNcJJI.jpg") image = np.array(keras.utils.load_img(filepath)) @@ -108,7 +115,7 @@ predictions = model.predict(image_resized) import tensorflow as tf import keras_cv import tensorflow_datasets as tfds -from keras_cv.backend import keras +import keras # Create a preprocessing pipeline with augmentations BATCH_SIZE = 16 @@ -260,7 +267,7 @@ Here is the BibTeX entry: ```bibtex @misc{wood2022kerascv, title={KerasCV}, - author={Wood, Luke and Tan, Zhenyu and Stenbit, Ian and Bischof, Jonathan and Zhu, Scott and Chollet, Fran\c{c}ois and others}, + author={Wood, Luke and Tan, Zhenyu and Stenbit, Ian and Bischof, Jonathan and Zhu, Scott and Chollet, Fran\c{c}ois and Sreepathihalli, Divyashree and Sampath, Ramesh and others}, year={2022}, howpublished={\url{https://github.com/keras-team/keras-cv}}, } diff --git a/keras_cv/backend/__init__.py b/keras_cv/backend/__init__.py index 890073a1eb..2190534ff8 100644 --- a/keras_cv/backend/__init__.py +++ b/keras_cv/backend/__init__.py @@ -11,6 +11,20 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. +""" +Keras backend module. + +This module adds a temporary Keras API surface that is fully under KerasCV +control. The goal is to allow us to write Keras 3-like code everywhere, while +still supporting Keras 2. We do this by using the `keras_core` package with +Keras 2 to backport Keras 3 numerics APIs (`keras.ops` and `keras.random`) into +Keras 2. The sub-modules exposed are as follows: + +- `config`: check which version of Keras is being run. +- `keras`: The full `keras` API with compat shims for older Keras versions. +- `ops`: `keras.ops` for Keras 3 or `keras_core.ops` for Keras 2. +- `random`: `keras.random` for Keras 3 or `keras_core.ops` for Keras 2. +""" from keras_cv.backend import config # noqa: E402 from keras_cv.backend import keras # noqa: E402 from keras_cv.backend import ops # noqa: E402 @@ -19,12 +33,12 @@ def assert_tf_keras(src): - if config.multi_backend(): + if config.keras_3(): raise NotImplementedError( - f"KerasCV component {src} does not yet support Keras Core, and can " + f"KerasCV component {src} does not yet support Keras 3, and can " "only be used in `tf.keras`." ) def supports_ragged(): - return not config.multi_backend() + return not config.keras_3() diff --git a/keras_cv/backend/config.py b/keras_cv/backend/config.py index e2858d59ba..11d6c8273b 100644 --- a/keras_cv/backend/config.py +++ b/keras_cv/backend/config.py @@ -11,20 +11,16 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. -import json -import os -_MULTI_BACKEND = False -# Set Keras base dir path given KERAS_HOME env variable, if applicable. -# Otherwise either ~/.keras or /tmp. -if "KERAS_HOME" in os.environ: - _keras_dir = os.environ.get("KERAS_HOME") -else: - _keras_base_dir = os.path.expanduser("~") - if not os.access(_keras_base_dir, os.W_OK): - _keras_base_dir = "/tmp" - _keras_dir = os.path.join(_keras_base_dir, ".keras") +from tensorflow import keras + +# We follow the version of keras that tensorflow is configured to use. +_USE_KERAS_3 = False + +# Note that only recent versions of keras have a `version()` function. +if hasattr(keras, "version") and keras.version().startswith("3."): + _USE_KERAS_3 = True def detect_if_tensorflow_uses_keras_3(): @@ -57,53 +53,9 @@ def keras_3(): return _USE_KERAS_3 -# Attempt to read KerasCV config file. -_config_path = os.path.expanduser(os.path.join(_keras_dir, "keras_cv.json")) -if os.path.exists(_config_path): - try: - with open(_config_path) as f: - _config = json.load(f) - except ValueError: - _config = {} - _MULTI_BACKEND = _config.get("multi_backend", _MULTI_BACKEND) - -# Save config file, if possible. -if not os.path.exists(_keras_dir): - try: - os.makedirs(_keras_dir) - except OSError: - # Except permission denied and potential race conditions - # in multi-threaded environments. - pass - -if not os.path.exists(_config_path): - _config = { - "multi_backend": _MULTI_BACKEND, - } - try: - with open(_config_path, "w") as f: - f.write(json.dumps(_config, indent=4)) - except IOError: - # Except permission denied. - pass - -if "KERAS_BACKEND" in os.environ and os.environ["KERAS_BACKEND"]: - _MULTI_BACKEND = True - - -def multi_backend(): - return _MULTI_BACKEND - - def backend(): """Check the backend framework.""" - if not multi_backend(): - return "tensorflow" if not keras_3(): - import keras_core - - return keras_core.config.backend() - - from tensorflow import keras + return "tensorflow" return keras.config.backend() diff --git a/keras_cv/backend/keras.py b/keras_cv/backend/keras.py index 65082573ae..340efad3b1 100644 --- a/keras_cv/backend/keras.py +++ b/keras_cv/backend/keras.py @@ -30,11 +30,6 @@ import keras # noqa: F403, F401 from keras import * # noqa: F403, F401 - keras.backend.name_scope = keras.name_scope -elif config.multi_backend(): - import keras_core as keras # noqa: F403, F401 - from keras_core import * # noqa: F403, F401 - keras.backend.name_scope = keras.name_scope else: from tensorflow import keras # noqa: F403, F401 diff --git a/keras_cv/backend/ops.py b/keras_cv/backend/ops.py index cbb533c103..c02dadfd6b 100644 --- a/keras_cv/backend/ops.py +++ b/keras_cv/backend/ops.py @@ -11,10 +11,9 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. -from keras_cv.backend.config import keras_3 -from keras_cv.backend.config import multi_backend +from keras_cv.backend import config -if keras_3(): +if config.keras_3(): from keras.ops import * # noqa: F403, F401 from keras.preprocessing.image import smart_resize # noqa: F403, F401 @@ -32,5 +31,5 @@ from keras_core.src.utils.image_utils import ( # noqa: F403, F401 smart_resize, ) -if not multi_backend(): - from keras_cv.backend.tf_ops import * # noqa: F403, F401 + if config.backend() == "tensorflow": + from keras_cv.backend.tf_ops import * # noqa: F403, F401 diff --git a/keras_cv/backend/scope.py b/keras_cv/backend/scope.py index d6bd1b40d2..b2eb094147 100644 --- a/keras_cv/backend/scope.py +++ b/keras_cv/backend/scope.py @@ -18,7 +18,7 @@ from keras_cv.backend import keras from keras_cv.backend import ops from keras_cv.backend import tf_ops -from keras_cv.backend.config import multi_backend +from keras_cv.backend.config import keras_3 _ORIGINAL_OPS = copy.copy(backend.ops.__dict__) _ORIGINAL_SUPPORTS_RAGGED = backend.supports_ragged @@ -30,7 +30,7 @@ def tf_data(function): @functools.wraps(function) def wrapper(*args, **kwargs): - if multi_backend() and keras.src.utils.backend_utils.in_tf_graph(): + if keras_3() and keras.src.utils.backend_utils.in_tf_graph(): with TFDataScope(): return function(*args, **kwargs) else: diff --git a/keras_cv/conftest.py b/keras_cv/conftest.py index 8e886dfd99..b8be780c39 100644 --- a/keras_cv/conftest.py +++ b/keras_cv/conftest.py @@ -17,7 +17,7 @@ import tensorflow as tf from packaging import version -from keras_cv.backend.config import multi_backend +from keras_cv.backend.config import keras_3 def pytest_addoption(parser): @@ -45,7 +45,7 @@ def pytest_configure(config): ) config.addinivalue_line( "markers", - "tf_keras_only: mark test as a tf.keras-only test", + "tf_keras_only: mark test as a Keras 2-only test", ) config.addinivalue_line( "markers", @@ -69,12 +69,12 @@ def pytest_collection_modifyitems(config, items): skip_extra_large = pytest.mark.skipif( not run_extra_large_tests, reason="need --run_extra_large option to run" ) - skip_tf_keras_only = pytest.mark.skipif( - multi_backend(), - reason="This test is only supported on tf.keras", + skip_keras_2_only = pytest.mark.skipif( + keras_3(), + reason="This test is only supported on Keras 2", ) skip_tf_only = pytest.mark.skipif( - multi_backend() and keras_core.backend.backend() != "tensorflow", + keras_3() and keras_core.backend.backend() != "tensorflow", reason="This test is only supported on TensorFlow", ) for item in items: @@ -87,6 +87,6 @@ def pytest_collection_modifyitems(config, items): if "extra_large" in item.keywords: item.add_marker(skip_extra_large) if "tf_keras_only" in item.keywords: - item.add_marker(skip_tf_keras_only) + item.add_marker(skip_keras_2_only) if "tf_only" in item.keywords: item.add_marker(skip_tf_only) diff --git a/keras_cv/layers/object_detection/multi_class_non_max_suppression.py b/keras_cv/layers/object_detection/multi_class_non_max_suppression.py index 7825268578..08bcd97528 100644 --- a/keras_cv/layers/object_detection/multi_class_non_max_suppression.py +++ b/keras_cv/layers/object_detection/multi_class_non_max_suppression.py @@ -18,7 +18,7 @@ from keras_cv.api_export import keras_cv_export from keras_cv.backend import keras from keras_cv.backend import ops -from keras_cv.backend.config import multi_backend +from keras_cv.backend.config import keras_3 @keras_cv_export("keras_cv.layers.MultiClassNonMaxSuppression") @@ -73,7 +73,7 @@ def call( `bounding_box_format` specified in the constructor. class_prediction: Dense Tensor of shape [batch, boxes, num_classes]. """ - if multi_backend() and keras.backend.backend() != "tensorflow": + if keras_3() and keras.backend.backend() != "tensorflow": raise NotImplementedError( "MultiClassNonMaxSuppression does not support non-TensorFlow " "backends. Consider using NonMaxSuppression instead." diff --git a/keras_cv/layers/object_detection/non_max_suppression.py b/keras_cv/layers/object_detection/non_max_suppression.py index ed988cf113..2c39fd0d12 100644 --- a/keras_cv/layers/object_detection/non_max_suppression.py +++ b/keras_cv/layers/object_detection/non_max_suppression.py @@ -20,7 +20,7 @@ from keras_cv.api_export import keras_cv_export from keras_cv.backend import keras from keras_cv.backend import ops -from keras_cv.backend.config import multi_backend +from keras_cv.backend.config import keras_3 EPSILON = 1e-8 @@ -89,7 +89,7 @@ def call( confidence_prediction = ops.max(class_prediction, axis=-1) - if not multi_backend() or keras.backend.backend() == "tensorflow": + if not keras_3() or keras.backend.backend() == "tensorflow": idx, valid_det = tf.image.non_max_suppression_padded( box_prediction, confidence_prediction, @@ -318,7 +318,7 @@ def suppression_loop_body(boxes, iou_threshold, output_size, idx): # TODO(ianstenbit): Fix bug in tfnp.take_along_axis that causes this hack. # (This will be removed anyway when we use built-in NMS for TF.) - if multi_backend() and keras.backend.backend() != "tensorflow": + if keras_3() and keras.backend.backend() != "tensorflow": idx = ops.take_along_axis( ops.reshape(sorted_indices, [-1]), take_along_axis_idx ) diff --git a/keras_cv/layers/preprocessing/vectorized_base_image_augmentation_layer.py b/keras_cv/layers/preprocessing/vectorized_base_image_augmentation_layer.py index 1f420437f4..8d3dacfa98 100644 --- a/keras_cv/layers/preprocessing/vectorized_base_image_augmentation_layer.py +++ b/keras_cv/layers/preprocessing/vectorized_base_image_augmentation_layer.py @@ -24,7 +24,7 @@ from keras_cv.api_export import keras_cv_export from keras_cv.backend import keras from keras_cv.backend import scope -from keras_cv.backend.config import multi_backend +from keras_cv.backend.config import keras_3 from keras_cv.utils import preprocessing H_AXIS = -3 @@ -44,7 +44,7 @@ base_class = ( keras.src.layers.preprocessing.tf_data_layer.TFDataLayer - if multi_backend() + if keras_3() else keras.layers.Layer ) diff --git a/keras_cv/layers/spatial_pyramid.py b/keras_cv/layers/spatial_pyramid.py index b45ee7bda3..8f0e50a7d8 100644 --- a/keras_cv/layers/spatial_pyramid.py +++ b/keras_cv/layers/spatial_pyramid.py @@ -19,7 +19,7 @@ from keras_cv.api_export import keras_cv_export from keras_cv.backend import keras from keras_cv.backend import ops -from keras_cv.backend.config import multi_backend +from keras_cv.backend.config import keras_3 @keras_cv_export("keras_cv.layers.SpatialPyramidPooling") @@ -68,7 +68,7 @@ def __init__( self.dropout = dropout # TODO(ianstenbit): Remove this once TF 2.14 is released which adds # XLA support for resizing with bilinear interpolation. - if multi_backend() and keras.backend.backend() == "tensorflow": + if keras_3() and keras.backend.backend() == "tensorflow": self.supports_jit = False def build(self, input_shape): diff --git a/keras_cv/losses/focal_test.py b/keras_cv/losses/focal_test.py index 9594d13d21..a8f4463fba 100644 --- a/keras_cv/losses/focal_test.py +++ b/keras_cv/losses/focal_test.py @@ -16,7 +16,7 @@ from keras_cv.backend import keras from keras_cv.backend import ops -from keras_cv.backend.config import multi_backend +from keras_cv.backend.config import keras_3 from keras_cv.losses import FocalLoss from keras_cv.tests.test_case import TestCase @@ -73,7 +73,7 @@ def test_from_logits_argument(self): # TF backend somehow has different numerics. expected_loss = ( 31.11176 - if multi_backend() and keras.backend.backend() != "tensorflow" + if keras_3() and keras.backend.backend() != "tensorflow" else 925.28081 ) self.assertAllClose( diff --git a/keras_cv/models/object_detection_3d/center_pillar_backbone_test.py b/keras_cv/models/object_detection_3d/center_pillar_backbone_test.py index cc89cb1895..c02046b5e1 100644 --- a/keras_cv/models/object_detection_3d/center_pillar_backbone_test.py +++ b/keras_cv/models/object_detection_3d/center_pillar_backbone_test.py @@ -16,13 +16,13 @@ import tensorflow as tf from keras_cv.backend import keras -from keras_cv.backend.config import multi_backend +from keras_cv.backend.config import keras_3 from keras_cv.models.object_detection_3d import CenterPillarBackbone from keras_cv.tests.test_case import TestCase @pytest.mark.skipif( - multi_backend() and keras.backend.backend() == "torch", + keras_3() and keras.backend.backend() == "torch", reason="CenterPillar does not yet support PyTorch.", ) class CenterPillarBackboneTest(TestCase): diff --git a/keras_cv/models/object_detection_3d/center_pillar_test.py b/keras_cv/models/object_detection_3d/center_pillar_test.py index 352d33fbbd..b4be9e6a5e 100644 --- a/keras_cv/models/object_detection_3d/center_pillar_test.py +++ b/keras_cv/models/object_detection_3d/center_pillar_test.py @@ -16,7 +16,7 @@ import tensorflow as tf from keras_cv.backend import keras -from keras_cv.backend.config import multi_backend +from keras_cv.backend.config import keras_3 from keras_cv.layers.object_detection_3d.voxelization import DynamicVoxelization from keras_cv.models.object_detection_3d.center_pillar import ( MultiClassDetectionHead, @@ -34,7 +34,7 @@ @pytest.mark.skipif( - multi_backend() and keras.backend.backend() == "torch", + keras_3() and keras.backend.backend() == "torch", reason="CenterPillar does not yet support PyTorch.", ) class CenterPillarTest(TestCase):