From 4322834fe7d1f475a19c628a8a7699ded54d0e4a Mon Sep 17 00:00:00 2001 From: Matt Watson Date: Thu, 16 Feb 2023 22:14:13 -0800 Subject: [PATCH] Add a note for TPU issues for deberta_v3 --- keras_nlp/models/deberta_v3/deberta_v3_backbone.py | 3 +++ keras_nlp/models/deberta_v3/deberta_v3_classifier.py | 3 +++ 2 files changed, 6 insertions(+) diff --git a/keras_nlp/models/deberta_v3/deberta_v3_backbone.py b/keras_nlp/models/deberta_v3/deberta_v3_backbone.py index ab8ebd21db..637b3b0c0b 100644 --- a/keras_nlp/models/deberta_v3/deberta_v3_backbone.py +++ b/keras_nlp/models/deberta_v3/deberta_v3_backbone.py @@ -47,6 +47,9 @@ class DebertaV3Backbone(Backbone): dimensions. To load preset architectures and weights, use the `from_preset` constructor. + Note: `DebertaV3Backbone` has a performance issue on TPUs, and we recommend + other models for TPU training and inference. + Disclaimer: Pre-trained models are provided on an "as is" basis, without warranties or conditions of any kind. The underlying model is provided by a third party and subject to a separate license, available diff --git a/keras_nlp/models/deberta_v3/deberta_v3_classifier.py b/keras_nlp/models/deberta_v3/deberta_v3_classifier.py index 660d0a99e1..c5f1baebe0 100644 --- a/keras_nlp/models/deberta_v3/deberta_v3_classifier.py +++ b/keras_nlp/models/deberta_v3/deberta_v3_classifier.py @@ -44,6 +44,9 @@ class DebertaV3Classifier(Task): `fit()`, `predict()`, and `evaluate()`. This is done by default when creating the model with `from_preset()`. + Note: `DebertaV3Backbone` has a performance issue on TPUs, and we recommend + other models for TPU training and inference. + Disclaimer: Pre-trained models are provided on an "as is" basis, without warranties or conditions of any kind. The underlying model is provided by a third party and subject to a separate license, available