From 3736b0b78a84e22bf6989a6c8f2638d32324a278 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Aylin=20Ayd=C4=B1n?= Date: Wed, 21 Sep 2022 23:31:06 +0300 Subject: [PATCH 01/25] ArcFace Loss Implementation --- .../losses/ArcFace Loss Sample Notebook.ipynb | 775 ++++++++++++++++++ tensorflow_similarity/losses/__init__.py | 13 +- tensorflow_similarity/losses/arcface_loss.py | 119 +++ tensorflow_similarity/losses/test_losses.py | 275 +++++++ 4 files changed, 1176 insertions(+), 6 deletions(-) create mode 100644 tensorflow_similarity/losses/ArcFace Loss Sample Notebook.ipynb create mode 100644 tensorflow_similarity/losses/arcface_loss.py create mode 100644 tensorflow_similarity/losses/test_losses.py diff --git a/tensorflow_similarity/losses/ArcFace Loss Sample Notebook.ipynb b/tensorflow_similarity/losses/ArcFace Loss Sample Notebook.ipynb new file mode 100644 index 00000000..b481492e --- /dev/null +++ b/tensorflow_similarity/losses/ArcFace Loss Sample Notebook.ipynb @@ -0,0 +1,775 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "28956aa1", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "Copyright 2022 The TensorFlow Similarity Authors." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "24eda1a6", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "# @title Licensed under the Apache License, Version 2.0 (the \"License\");\n", + "# you may not use this file except in compliance with the License.\n", + "# You may obtain a copy of the License at\n", + "#\n", + "# https://www.apache.org/licenses/LICENSE-2.0\n", + "#\n", + "# Unless required by applicable law or agreed to in writing, software\n", + "# distributed under the License is distributed on an \"AS IS\" BASIS,\n", + "# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.\n", + "# See the License for the specific language governing permissions and\n", + "# limitations under the License." 
+ ] + }, + { + "cell_type": "markdown", + "id": "7ca9d025", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "# TensorFlow Similarity ArcFace Loss Example" + ] + }, + { + "cell_type": "markdown", + "id": "d072628f", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "An Additive Angular Margin Loss (ArcFace) uses the geodesic distance on the hypersphere instead of the Euclidean distance to improve the discriminative power of the face recognition model and stabilize the training process. On the hypersphere, all distances are measured along arcs. A geodesic is the shortest path between two points on the sphere. Its length is the geodesic distance, which corresponds to the angle between the two normalized vectors.\n", + "\n", + "ArcFace loss determines the angle between the current feature and the target weight using the arc-cosine function, since the dot product between the DCNN feature and the last fully connected layer after feature and weight normalization equals the cosine of the angle between them (the cosine similarity). The target logit is then obtained by adding an additive angular margin to the target angle and applying the cosine function. After that, we continue as before and rescale all logits by a fixed feature norm, just like with softmax loss." + ] + }, + { + "cell_type": "markdown", + "id": "808ac087", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Notebook goal\n", + "\n", + "This notebook demonstrates how to use ArcFaceLoss implementation of TensorFlow Similarity with standalone usage and to train a `SimilarityModel()` on a fraction of the MNIST classes.\n", + "\n", + "You are going to learn about the main features offered by the `ArcFaceLoss()` and will:\n", + "\n", + " 1. Standalone usage of ArcFaceLoss\n", + "\n", + " 2. Usage with `model.compile()`\n", + "\n", + " 3.
3D-Visualization of ArcFaceLoss \n", + "\n", + "### Things to try \n", + "\n", + "Along the way you can try the following things to improve the model performance:\n", + "- Adding more \"seen\" classes at training time.\n", + "- Use a larger embedding by increasing the size of the output.\n", + "- Add data augmentation pre-processing layers to the model.\n", + "- Include more examples in the index to give the models more points to choose from.\n", + "- Try a more challenging dataset, such as Fashion MNIST." + ] + }, + { + "cell_type": "markdown", + "id": "078c53c0", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Notebook goal\n", + "\n", + "This notebook demonstrates how to use ArcFaceLoss implementation of TensorFlow Similarity with standalone usage and to train a `SimilarityModel()` on a fraction of the MNIST classes.\n", + "\n", + "You are going to learn about the main features offered by the `ArcFaceLoss()` and will:\n", + "\n", + " 1. Standalone usage of ArcFaceLoss\n", + "\n", + " 2. Usage with `model.compile()`\n", + "\n", + " 3. 3D-Visualization of ArcFaceLoss \n", + "\n", + "### Things to try \n", + "\n", + "Along the way you can try the following things to improve the model performance:\n", + "- Adding more \"seen\" classes at training time.\n", + "- Use a larger embedding by increasing the size of the output.\n", + "- Add data augmentation pre-processing layers to the model.\n", + "- Include more examples in the index to give the models more points to choose from.\n", + "- Try a more challenging dataset, such as Fashion MNIST." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "8fd63f16", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "import gc\n", + "import os\n", + "\n", + "import numpy as np\n", + "from matplotlib import pyplot as plt\n", + "from tabulate import tabulate\n", + "from mpl_toolkits.mplot3d import Axes3D\n", + "\n", + "# INFO messages are not printed.\n", + "# This must be run before loading other modules.\n", + "os.environ[\"TF_CPP_MIN_LOG_LEVEL\"] = \"1\"" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "80af5fc0", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "import tensorflow as tf" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "8ba8caf7", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "# install TF similarity if needed\n", + "try:\n", + " import tensorflow_similarity as tfsim # main package\n", + "except ModuleNotFoundError:\n", + " !pip install tensorflow_similarity\n", + " import tensorflow_similarity as tfsim" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "2484bd72", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "tfsim.utils.tf_cap_memory()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "3fe0344e", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "# Clear out any old model state.\n", + "gc.collect()\n", + "tf.keras.backend.clear_session()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "99d9bef9", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "print(\"TensorFlow:\", tf.__version__)\n", + "print(\"TensorFlow Similarity\", tfsim.__version__)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "7137afbc", + "metadata": { + "pycharm": { + "name": 
"#%%\n" + } + }, + "outputs": [], + "source": [] + }, + { + "cell_type": "markdown", + "id": "1d534ad3", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "# Standalone Usage of ArcFaceLoss\n", + "\n", + "ArcFace loss alone can be used as follows when it is desired to calculate the additive angular margin loss of the existing data set." + ] + }, + { + "cell_type": "markdown", + "id": "68d526da", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Initialize Loss function as ArcFaceLoss" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "bebf6ef0", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "loss_fn = tfsim.losses.ArcFaceLoss(num_classes=8, embedding_size=10)" + ] + }, + { + "cell_type": "markdown", + "id": "d2ccfd7d", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Create own simple random dataset" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "1d1ec43a", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "labels = tf.Variable([0, 1, 2, 3, 4, 5, 6, 7])\n", + "embeddings = tf.Variable(tf.random.uniform(shape=[8, 10]))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "73d0c1c6", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "print(\"\", embeddings)" + ] + }, + { + "cell_type": "markdown", + "id": "d65b3085", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Calculate loss" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "cdf7c30c", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "loss = loss_fn(labels, embeddings)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "16745b7d", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ 
+ "print(\"loss : \" , loss)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "outputs": [], + "source": [ + "loss = loss_fn(labels, embeddings)" + ], + "metadata": { + "collapsed": false, + "pycharm": { + "name": "#%%\n" + } + } + }, + { + "cell_type": "code", + "execution_count": null, + "outputs": [], + "source": [ + "print(\"loss : \" , loss)" + ], + "metadata": { + "collapsed": false, + "pycharm": { + "name": "#%%\n" + } + } + }, + { + "cell_type": "markdown", + "source": [ + "## Data preparation\n", + "\n", + "We are going to load the MNIST dataset to showcase how the model is able to find similar examples from classes unseen during training. The model's ability to generalize the matching to unseen classes, without retraining, is one of the main reason you would want to use metric learning.\n", + "\n", + "\n", + "**WARNING**: Tensorflow similarity expects `y_train` to be an IntTensor containing the class ids for each example instead of the standard categorical encoding traditionally used for multi-class classification." + ], + "metadata": { + "collapsed": false, + "pycharm": { + "name": "#%% md\n" + } + } + }, + { + "cell_type": "code", + "execution_count": null, + "id": "8a9f8122", + "metadata": {}, + "outputs": [], + "source": [ + "print(\"loss : \" , loss)" + ] + }, + { + "cell_type": "markdown", + "id": "11ef5236", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "## Data preparation\n", + "\n", + "We are going to load the MNIST dataset to showcase how the model is able to find similar examples from classes unseen during training. The model's ability to generalize the matching to unseen classes, without retraining, is one of the main reason you would want to use metric learning.\n", + "\n", + "\n", + "**WARNING**: Tensorflow similarity expects `y_train` to be an IntTensor containing the class ids for each example instead of the standard categorical encoding traditionally used for multi-class classification." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "97152229", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "(x_train, y_train), (x_test, y_test) = tf.keras.datasets.mnist.load_data()" + ] + }, + { + "cell_type": "markdown", + "id": "08b766d8", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "## Model setup" + ] + }, + { + "cell_type": "markdown", + "id": "3eac2da7", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Model definition\n", + "\n", + "`SimilarityModel()` models extend `tensorflow.keras.Model` with additional features and functionality that allow you to index and search for similar-looking examples.\n", + "\n", + "As visible in the model definition below, similarity models output a 64-dimensional float embedding using the `MetricEmbedding()` layers. This layer is a Dense layer with L2 normalization. Thanks to the loss, the model learns to minimize the distance between similar examples and maximize the distance between dissimilar examples. As a result, the distance between examples in the embedding space is meaningful; the smaller the distance the more similar the examples are. \n", + "\n", + "Being able to use a distance as a meaningful proxy for how similar two examples are is what enables the fast ANN (approximate nearest neighbor) search. Using a sub-linear ANN search instead of a standard quadratic NN search is what allows deep similarity search to scale to millions of items. The built-in memory index used in this notebook scales to a million indexed examples very easily...
if you have enough RAM :)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a003c971", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "def get_model():\n", + " inputs = tf.keras.layers.Input(shape=(28, 28, 1))\n", + " x = tf.keras.layers.experimental.preprocessing.Rescaling(1 / 255)(inputs)\n", + " x = tf.keras.layers.Conv2D(32, 3, activation=\"relu\")(x)\n", + " x = tf.keras.layers.Conv2D(32, 3, activation=\"relu\")(x)\n", + " x = tf.keras.layers.MaxPool2D()(x)\n", + " x = tf.keras.layers.Conv2D(64, 3, activation=\"relu\")(x)\n", + " x = tf.keras.layers.Conv2D(64, 3, activation=\"relu\")(x)\n", + " x = tf.keras.layers.Flatten()(x)\n", + " # smaller embeddings will have faster lookup times while a larger embedding will improve the accuracy up to a point.\n", + " outputs = tfsim.layers.MetricEmbedding(64)(x)\n", + " return tfsim.models.SimilarityModel(inputs, outputs)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a2177b12", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "model = get_model()\n", + "model.summary()" + ] + }, + { + "cell_type": "markdown", + "id": "defb3961", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### ArcFace Loss definition\n", + "\n", + "Overall, what makes metric losses different from traditional losses is that:\n", + "- **They expect different inputs.** Instead of having the prediction equal the true values, they expect embeddings as `y_preds` and the id (as an int32) of the class as `y_true`. \n", + "- **They require a distance.** You need to specify which `distance` function to use to compute the distance between embeddings. `cosine` is usually a great starting point and the default.\n", + "\n", + "ArcFace Loss takes as inputs the number of classes present in the labels and the embedding size, which we define in the model's `MetricEmbedding()` layer."
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "13b0d745", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "distance = \"cosine\" " + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "c22d10cc", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "num_classes = np.unique(y_train).size\n", + "embedding_size = model.get_layer('metric_embedding').output.shape[1]" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "d5b8e426", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "loss = tfsim.losses.ArcFaceLoss(num_classes= num_classes, embedding_size=embedding_size, name=\"ArcFaceLoss\")" + ] + }, + { + "cell_type": "markdown", + "id": "b6eaf9c8", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Compilation\n", + "\n", + "Tensorflow similarity use an extended `compile()` method that allows you to optionally specify `distance_metrics` (metrics that are computed over the distance between the embeddings), and the distance to use for the indexer.\n", + "\n", + "By default the `compile()` method tries to infer what type of distance you are using by looking at the first loss specified. If you use multiple losses, and the distance loss is not the first one, then you need to specify the distance function used as `distance=` parameter in the compile function." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "673f986f", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "LR = 0.0005 # @param {type:\"number\"}\n", + "model.compile(optimizer=tf.keras.optimizers.SGD(LR), loss=loss, distance=distance)" + ] + }, + { + "cell_type": "markdown", + "id": "15961601", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "## Training\n", + "\n", + "Similarity models are trained like normal models. " + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "147a6863", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "EPOCHS = 10 # @param {type:\"integer\"}\n", + "history = model.fit(x_train, y_train, epochs=EPOCHS, validation_data=(x_test, y_test))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "88e1ee4d", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "plt.plot(history.history[\"loss\"])\n", + "plt.plot(history.history[\"val_loss\"])\n", + "plt.legend([\"loss\", \"val_loss\"])\n", + "plt.title(f\"Loss: {loss.name}\")\n", + "plt.show()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a5404906", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [] + }, + { + "cell_type": "markdown", + "id": "5ad4ba20", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "## Prediction\n", + "\n", + "Let's predict some features and visualize them."
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a1936264", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "embedded_features = model.predict(x_test, verbose=1)\n", + "embedded_features /= np.linalg.norm(embedded_features, axis=1, keepdims=True)" + ] + }, + { + "cell_type": "markdown", + "id": "7c0df63b", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### 3D-Visualization of ArcFace Loss" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "5aac5d98", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "fig = plt.figure()\n", + "ax = Axes3D(fig)\n", + "for c in range(len(np.unique(y_test))):\n", + " ax.plot(embedded_features[y_test==c, 0], embedded_features[y_test==c, 1], embedded_features[y_test==c, 2], '.', alpha=0.1)\n", + "plt.title('ArcFace')\n", + "plt.show()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "8889f840", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "fef529d9", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.12" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} \ No newline at end of file diff --git a/tensorflow_similarity/losses/__init__.py b/tensorflow_similarity/losses/__init__.py index 46c7c700..a51937b3 100644 --- a/tensorflow_similarity/losses/__init__.py +++ b/tensorflow_similarity/losses/__init__.py @@ -15,13 +15,14 @@ """ Contrastive 
learning specialized losses. """ -from .barlow import Barlow # noqa -from .circle_loss import CircleLoss # noqa +from .pn_loss import PNLoss # noqa +from .triplet_loss import TripletLoss # noqa from .metric_loss import MetricLoss # noqa +from .circle_loss import CircleLoss # noqa from .multisim_loss import MultiSimilarityLoss # noqa -from .pn_loss import PNLoss # noqa -from .simclr import SimCLRLoss # noqa from .simsiam import SimSiamLoss # noqa -from .softnn_loss import SoftNearestNeighborLoss # noqa -from .triplet_loss import TripletLoss # noqa +from .simclr import SimCLRLoss # noqa from .vicreg import VicReg # noqa +from .barlow import Barlow # noqa +from .softnn_loss import SoftNearestNeighborLoss # noqa +from .arcface_loss import ArcFaceLoss # noqa diff --git a/tensorflow_similarity/losses/arcface_loss.py b/tensorflow_similarity/losses/arcface_loss.py new file mode 100644 index 00000000..e0252d5c --- /dev/null +++ b/tensorflow_similarity/losses/arcface_loss.py @@ -0,0 +1,119 @@ +# Copyright 2022 The TensorFlow Authors. All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== +"""ArcFace losses base class. + +ArcFace: Additive Angular Margin Loss for Deep Face +Recognition. [online] arXiv.org. Available at: +. 
+ +""" + +from typing import Any, Callable, Dict, Optional, Tuple, Union + +import tensorflow as tf +from tensorflow_similarity.algebra import build_masks +from tensorflow_similarity.distances import Distance, distance_canonicalizer +from tensorflow_similarity.types import FloatTensor, IntTensor +from tensorflow_similarity.utils import is_tensor_or_variable + +from .metric_loss import MetricLoss +from .utils import logsumexp + + +@tf.keras.utils.register_keras_serializable(package="Similarity") +class ArcFaceLoss(tf.keras.losses.Loss): + """Implement of ArcFace: Additive Angular Margin Loss: + Step 1: Create a trainable kernel matrix with the shape of [embedding_size, num_classes]. + Step 2: Normalize the kernel and prediction vectors. + Step 3: Calculate the cosine similarity between the normalized prediction vector and the kernel. + Step 4: Create a one-hot vector include the margin value for the ground truth class. + Step 5: Add margin_hot to the cosine similarity and multiply it by scale. + Step 6: Calculate the cross-entropy loss. + + ArcFace: Additive Angular Margin Loss for Deep Face + Recognition. [online] arXiv.org. Available at: + . + + Standalone usage: + >>> loss_fn = tfsim.losses.ArcFaceLoss(num_classes=2, embedding_size=3) + >>> labels = tf.Variable([1, 0]) + >>> embeddings = tf.Variable([[0.2, 0.3, 0.1], [0.4, 0.5, 0.5]]) + >>> loss = loss_fn(labels, embeddings) + Args: + num_classes: Number of classes. + embedding_size: The size of the embedding vectors. + margin: The margin value. + scale: s in the paper, feature scale + name: Optional name for the operation. + reduction: Type of loss reduction to apply to the loss. 
+ """ + + def __init__( + self, + num_classes: int, + embedding_size: int, + margin: float = 0.50, # margin in radians + scale: float = 64.0, # feature scale + name: Optional[str] = None, + reduction: Callable = tf.keras.losses.Reduction.AUTO, + **kwargs + ): + + super().__init__(reduction=reduction, name=name, **kwargs) + + self.num_classes = num_classes + self.embedding_size = embedding_size + self.margin = margin + self.scale = scale + self.name = name + self.kernel = tf.Variable(tf.random.normal([embedding_size, num_classes])) + + def call(self, y_true: FloatTensor, y_pred: FloatTensor) -> FloatTensor: + + y_pred_norm = tf.math.l2_normalize(y_pred, axis=1) + kernel_norm = tf.math.l2_normalize(self.kernel, axis=0) + + cos_theta = tf.matmul(y_pred_norm, kernel_norm) + cos_theta = tf.clip_by_value(cos_theta, -1.0, 1.0) + + m_hot = tf.one_hot(y_true, self.num_classes, on_value=self.margin, axis=1) + m_hot = tf.reshape(m_hot, [-1, self.num_classes]) + + cos_theta = tf.acos(cos_theta) + cos_theta += m_hot + cos_theta = tf.math.cos(cos_theta) + cos_theta = tf.math.multiply(cos_theta, self.scale) + + cce = tf.keras.losses.SparseCategoricalCrossentropy( + from_logits=True, reduction=self.reduction + ) + loss: FloatTensor = cce(y_true, cos_theta) + + return loss + + def get_config(self) -> Dict[str, Any]: + """Contains the loss configuration. + Returns: + A Python dict containing the configuration of the loss. 
+ """ + config = { + "num_classes": self.num_classes, + "embedding_size": self.embedding_size, + "margin": self.margin, + "scale": self.scale, + "name": self.name, + } + base_config = super().get_config() + return {**base_config, **config} diff --git a/tensorflow_similarity/losses/test_losses.py b/tensorflow_similarity/losses/test_losses.py new file mode 100644 index 00000000..1d4fef9c --- /dev/null +++ b/tensorflow_similarity/losses/test_losses.py @@ -0,0 +1,275 @@ +import tensorflow as tf +import numpy as np +from tensorflow_similarity.losses import TripletLoss, MultiSimilarityLoss +from tensorflow_similarity.losses import PNLoss +from tensorflow_similarity.losses import SoftNearestNeighborLoss +from tensorflow_similarity.losses import ArcFaceLoss + +# [triplet loss] +from tensorflow_similarity.losses.xbm_loss import XBM + + +def test_triplet_loss_serialization(): + loss = TripletLoss() + config = loss.get_config() + print(config) + loss2 = TripletLoss.from_config(config) + assert loss.name == loss2.name + assert loss.distance == loss2.distance + + +def triplet_hard_loss_np(labels, embedding, margin, dist_func, soft=False): + num_data = embedding.shape[0] + # Reshape labels to compute adjacency matrix. + labels_reshaped = np.reshape(labels.astype(np.float32), + (labels.shape[0], 1)) + + adjacency = np.equal(labels_reshaped, labels_reshaped.T) + pdist_matrix = dist_func(embedding) + loss_np = 0.0 + for i in range(num_data): + pos_distances = [] + neg_distances = [] + for j in range(num_data): + if adjacency[i][j] == 0: + neg_distances.append(pdist_matrix[i][j]) + if adjacency[i][j] > 0.0 and i != j: + pos_distances.append(pdist_matrix[i][j]) + + # if there are no positive pairs, distance is 0 + if len(pos_distances) == 0: + pos_distances.append(0) + + # Sort by distance. 
+ neg_distances.sort() + min_neg_distance = neg_distances[0] + pos_distances.sort(reverse=True) + max_pos_distance = pos_distances[0] + + if soft: + loss_np += np.log1p(np.exp(max_pos_distance - min_neg_distance)) + else: + loss_np += np.maximum(0.0, + max_pos_distance - min_neg_distance + margin) + + loss_np /= num_data + return loss_np + + +def test_triplet_loss(): + num_inputs = 10 + # y_true: labels + y_true = tf.random.uniform((num_inputs,), 0, 10, dtype=tf.int32) + # y_preds: embedding + y_preds = tf.random.uniform((num_inputs, 20), 0, 1) + tpl = TripletLoss() + # y_true, y_preds + loss = tpl(y_true, y_preds) + assert loss > 0.9 + + +def test_triplet_loss_easy(): + num_inputs = 10 + # y_true: labels + y_true = tf.random.uniform((num_inputs,), 0, 3, dtype=tf.int32) + # y_preds: embedding + y_preds = tf.random.uniform((num_inputs, 16), 0, 1) + tpl = TripletLoss(positive_mining_strategy='easy', + negative_mining_strategy='easy') + # y_true, y_preds + loss = tpl(y_true, y_preds) + assert loss > 0 + + +def test_triplet_loss_semi_hard(): + num_inputs = 10 + # y_true: labels + y_true = tf.random.uniform((num_inputs,), 0, 3, dtype=tf.int32) + # y_preds: embedding + y_preds = tf.random.uniform((num_inputs, 16), 0, 1) + tpl = TripletLoss(positive_mining_strategy='easy', + negative_mining_strategy='semi-hard') + # y_true, y_preds + loss = tpl(y_true, y_preds) + assert loss + + +def test_triplet_loss_hard(): + num_inputs = 10 + # y_true: labels + y_true = tf.random.uniform((num_inputs,), 0, 3, dtype=tf.int32) + # y_preds: embedding + y_preds = tf.random.uniform((num_inputs, 16), 0, 1) + tpl = TripletLoss(positive_mining_strategy='hard', + negative_mining_strategy='hard') + # y_true, y_preds + loss = tpl(y_true, y_preds) + assert loss + + +# [pn loss] +def test_pn_loss_serialization(): + loss = PNLoss() + config = loss.get_config() + print(config) + loss2 = PNLoss.from_config(config) + assert loss.name == loss2.name + assert loss.distance == loss2.distance + + +def 
test_np_loss(): + num_inputs = 10 + # y_true: labels + y_true = tf.random.uniform((num_inputs,), 0, 10, dtype=tf.int32) + # y_preds: embedding + y_preds = tf.random.uniform((num_inputs, 20), 0, 1) + pnl = PNLoss() + # y_true, y_preds + loss = pnl(y_true, y_preds) + assert loss > 0.9 + + +# [soft neasrest neighbor loss] +def test_softnn_loss_serialization(): + loss = SoftNearestNeighborLoss(distance="cosine", temperature=50) + config = loss.get_config() + loss2 = SoftNearestNeighborLoss.from_config(config) + assert loss.name == loss2.name + assert loss.distance == loss2.distance + assert loss.temperature == loss2.temperature + + +def softnn_util(y_true, x, temperature=1): + """ + A simple loop based implementation of soft + nearest neighbor loss to test the code. + https://arxiv.org/pdf/1902.01889.pdf + """ + + y_true = y_true.numpy() + x = x.numpy() + batch_size = y_true.shape[0] + loss = 0 + eps = 1e-9 + for i in range(batch_size): + numerator = 0 + denominator = 0 + for j in range(batch_size): + if i == j: continue + if y_true[i] == y_true[j]: + numerator += np.exp(-1 * + np.sum(np.square(x[i] - x[j])) / temperature) + denominator += np.exp(-1 * + np.sum(np.square(x[i] - x[j])) / temperature) + if numerator == 0: continue + loss += np.log(numerator / denominator) + return -loss / batch_size + + +def test_softnn_loss(): + num_inputs = 10 + n_classes = 10 + # y_true: labels + y_true = tf.random.uniform((num_inputs,), 0, n_classes, dtype=tf.int32) + # x: embeddings + x = tf.random.uniform((num_inputs, 20), 0, 1) + + temperature = np.random.uniform(0.1, 50) + softnn = SoftNearestNeighborLoss(temperature=temperature) + loss = softnn(y_true, x) + loss_check = softnn_util(y_true, x, temperature) + loss_diff = loss.numpy() - loss_check + assert np.abs(loss_diff) < 1e-3 + + +def test_xbm_loss(): + batch_size = 6 + embed_dim = 16 + + embeddings1 = tf.random.uniform(shape=[batch_size, embed_dim]) + labels1 = tf.constant( + [ + [1], + [1], + [2], + [2], + [3], + [3], + ], + 
dtype=tf.int32 + ) + + embeddings2 = tf.random.uniform(shape=[batch_size, embed_dim]) + labels2 = tf.constant( + [ + [4], + [4], + [5], + [5], + [6], + [6], + ], + dtype=tf.int32 + ) + + distance = "cosine" + loss = MultiSimilarityLoss(distance=distance) + loss_nowarm = XBM(loss, memory_size=12, warmup_steps=0) + + # test enqueue + loss_nowarm(labels1, embeddings1) + assert loss_nowarm._y_pred_memory.numpy().shape == (batch_size, embed_dim) + tf.assert_equal(loss_nowarm._y_true_memory, labels1) + + loss_nowarm(labels2, embeddings2) + assert loss_nowarm._y_pred_memory.numpy().shape == (2 * batch_size, embed_dim) + tf.assert_equal(loss_nowarm._y_true_memory, tf.concat([labels2, labels1], axis=0)) + + # test dequeue + loss_nowarm(labels2, embeddings2) + assert loss_nowarm._y_pred_memory.numpy().shape == (2 * batch_size, embed_dim) + tf.assert_equal(loss_nowarm._y_true_memory, tf.concat([labels2, labels2], axis=0)) + + # test warmup + loss_warm = XBM(loss, memory_size=12, warmup_steps=1) + + loss_warm(labels1, embeddings1) + assert loss_warm._y_pred_memory.numpy().shape == (0, embed_dim) + tf.assert_equal(loss_warm._y_true_memory, tf.constant([[]], dtype=tf.int32)) + + loss_warm(labels2, embeddings2) + assert loss_warm._y_pred_memory.numpy().shape == (batch_size, embed_dim) + tf.assert_equal(loss_warm._y_true_memory, labels2) + + +# arcface loss +""" +ArcFaceLoss + ArcFace: Additive Angular Margin Loss for Deep Face + Recognition. [online] arXiv.org. Available at: + . 
+""" + + +def test_arcface_loss_serialization(): + n_classes = 10 + embed_size = 16 + loss = ArcFaceLoss(num_classes=n_classes, embedding_size=embed_size) + config = loss.get_config() + loss2 = ArcFaceLoss.from_config(config) + assert loss.name == loss2.name + assert loss.margin == loss2.margin + assert loss.scale == loss2.scale + assert loss.num_classes == loss2.num_classes + assert loss.embedding_size == loss2.embedding_size + + + +def test_arcface_loss(): + tf.random.set_seed(128) + loss_fn = ArcFaceLoss(num_classes=4, embedding_size=5) + labels = tf.Variable([0, 1, 2, 3]) + embeddings = tf.Variable(tf.random.uniform(shape=[4, 5])) + loss = loss_fn(labels, embeddings) + + assert 60.4 < loss.numpy() < 60.5 From f49676fb649c1caccb0c15fa27415bce9c071293 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Aylin=20Ayd=C4=B1n?= Date: Wed, 21 Sep 2022 23:37:32 +0300 Subject: [PATCH 02/25] Add files via upload --- ArcFace Loss Sample Notebook.ipynb | 775 +++++++++++++++++++++++++++++ arcface_loss.py | 120 +++++ test_losses.py | 275 ++++++++++ 3 files changed, 1170 insertions(+) create mode 100644 ArcFace Loss Sample Notebook.ipynb create mode 100644 arcface_loss.py create mode 100644 test_losses.py diff --git a/ArcFace Loss Sample Notebook.ipynb b/ArcFace Loss Sample Notebook.ipynb new file mode 100644 index 00000000..b481492e --- /dev/null +++ b/ArcFace Loss Sample Notebook.ipynb @@ -0,0 +1,775 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "28956aa1", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "Copyright 2022 The TensorFlow Similarity Authors." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "24eda1a6", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "# @title Licensed under the Apache License, Version 2.0 (the \"License\");\n", + "# you may not use this file except in compliance with the License.\n", + "# You may obtain a copy of the License at\n", + "#\n", + "# https://www.apache.org/licenses/LICENSE-2.0\n", + "#\n", + "# Unless required by applicable law or agreed to in writing, software\n", + "# distributed under the License is distributed on an \"AS IS\" BASIS,\n", + "# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.\n", + "# See the License for the specific language governing permissions and\n", + "# limitations under the License." + ] + }, + { + "cell_type": "markdown", + "id": "7ca9d025", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "# TensorFlow Similarity ArcFace Loss Example" + ] + }, + { + "cell_type": "markdown", + "id": "d072628f", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "A Total Angular Margin Loss (ArcFace) calculates the geodetic distance in the hypersphere instead of the euclidean distance to improve the discriminatory strength of the facial recognition model and stabilize the training process. Rails are used to measure all distances in geodetic space. The geodetic trace is the path taken between two places. It specifies the geodetic distance, which is the shortest distance between two places.\n", + "\n", + "ArcFace loss determines the angle between the current feature and the target weight using the arc-cosine function since the dot product between the DCNN feature and the last fully connected layer after feature and weight normalization matches the cosine distance. The target logit is then returned by multiplying the goal angle by an additional angular margin and using the cosine function. 
After that, we continue as before and rescale all logits to a certain feature norm, just like with softmax loss." + ] + }, + { + "cell_type": "markdown", + "id": "808ac087", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Notebook goal\n", + "\n", + "This notebook demonstrates how to use ArcFaceLoss implementation of TensorFlow Similarity with standalone usage and to train a `SimilarityModel()` on a fraction of the MNIST classes.\n", + "\n", + "You are going to learn about the main features offered by the `ArcFaceLoss()` and will:\n", + "\n", + " 1. Standalone usage of ArcFaceLoss\n", + "\n", + " 2. Usage with `model.compile()`\n", + "\n", + " 3. 3D-Visualization of ArcFaceLoss \n", + "\n", + "### Things to try \n", + "\n", + "Along the way you can try the following things to improve the model performance:\n", + "- Adding more \"seen\" classes at training time.\n", + "- Use a larger embedding by increasing the size of the output.\n", + "- Add data augmentation pre-processing layers to the model.\n", + "- Include more examples in the index to give the models more points to choose from.\n", + "- Try a more challenging dataset, such as Fashion MNIST." + ] + }, + { + "cell_type": "markdown", + "id": "078c53c0", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Notebook goal\n", + "\n", + "This notebook demonstrates how to use ArcFaceLoss implementation of TensorFlow Similarity with standalone usage and to train a `SimilarityModel()` on a fraction of the MNIST classes.\n", + "\n", + "You are going to learn about the main features offered by the `ArcFaceLoss()` and will:\n", + "\n", + " 1. Standalone usage of ArcFaceLoss\n", + "\n", + " 2. Usage with `model.compile()`\n", + "\n", + " 3. 
3D-Visualization of ArcFaceLoss \n", + "\n", + "### Things to try \n", + "\n", + "Along the way you can try the following things to improve the model performance:\n", + "- Adding more \"seen\" classes at training time.\n", + "- Use a larger embedding by increasing the size of the output.\n", + "- Add data augmentation pre-processing layers to the model.\n", + "- Include more examples in the index to give the models more points to choose from.\n", + "- Try a more challenging dataset, such as Fashion MNIST." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "8fd63f16", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "import gc\n", + "import os\n", + "\n", + "import numpy as np\n", + "from matplotlib import pyplot as plt\n", + "from tabulate import tabulate\n", + "from mpl_toolkits.mplot3d import Axes3D\n", + "\n", + "# INFO messages are not printed.\n", + "# This must be run before loading other modules.\n", + "os.environ[\"TF_CPP_MIN_LOG_LEVEL\"] = \"1\"" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "80af5fc0", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "import tensorflow as tf" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "8ba8caf7", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "# install TF similarity if needed\n", + "try:\n", + " import tensorflow_similarity as tfsim # main package\n", + "except ModuleNotFoundError:\n", + " !pip install tensorflow_similarity\n", + " import tensorflow_similarity as tfsim" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "2484bd72", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "tfsim.utils.tf_cap_memory()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "3fe0344e", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": 
[], + "source": [ + "# Clear out any old model state.\n", + "gc.collect()\n", + "tf.keras.backend.clear_session()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "99d9bef9", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "print(\"TensorFlow:\", tf.__version__)\n", + "print(\"TensorFlow Similarity\", tfsim.__version__)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "7137afbc", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [] + }, + { + "cell_type": "markdown", + "id": "1d534ad3", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "# Standalone Usage of ArcFaceLoss\n", + "\n", + "ArcFace loss alone can be used as follows when it is desired to calculate the additive angular margin loss of the existing data set." + ] + }, + { + "cell_type": "markdown", + "id": "68d526da", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Initialize Loss function as ArcFaceLoss" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "bebf6ef0", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "loss_fn = tfsim.losses.ArcFaceLoss(num_classes=8, embedding_size=10)" + ] + }, + { + "cell_type": "markdown", + "id": "d2ccfd7d", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Create own simple random dataset" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "1d1ec43a", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "labels = tf.Variable([0, 1, 2, 3, 4, 5, 6, 7])\n", + "embeddings = tf.Variable(tf.random.uniform(shape=[8, 10]))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "73d0c1c6", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "print(\"\", embeddings)" + ] + }, + { + "cell_type": 
"markdown", + "id": "d65b3085", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Calculate loss" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "cdf7c30c", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "loss = loss_fn(labels, embeddings)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "16745b7d", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "print(\"loss : \" , loss)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "outputs": [], + "source": [ + "loss = loss_fn(labels, embeddings)" + ], + "metadata": { + "collapsed": false, + "pycharm": { + "name": "#%%\n" + } + } + }, + { + "cell_type": "code", + "execution_count": null, + "outputs": [], + "source": [ + "print(\"loss : \" , loss)" + ], + "metadata": { + "collapsed": false, + "pycharm": { + "name": "#%%\n" + } + } + }, + { + "cell_type": "markdown", + "source": [ + "## Data preparation\n", + "\n", + "We are going to load the MNIST dataset to showcase how the model is able to find similar examples from classes unseen during training. The model's ability to generalize the matching to unseen classes, without retraining, is one of the main reason you would want to use metric learning.\n", + "\n", + "\n", + "**WARNING**: Tensorflow similarity expects `y_train` to be an IntTensor containing the class ids for each example instead of the standard categorical encoding traditionally used for multi-class classification." 
+ ], + "metadata": { + "collapsed": false, + "pycharm": { + "name": "#%% md\n" + } + } + }, + { + "cell_type": "code", + "execution_count": null, + "id": "8a9f8122", + "metadata": {}, + "outputs": [], + "source": [ + "print(\"loss : \" , loss)" + ] + }, + { + "cell_type": "markdown", + "id": "11ef5236", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "## Data preparation\n", + "\n", + "We are going to load the MNIST dataset to showcase how the model is able to find similar examples from classes unseen during training. The model's ability to generalize the matching to unseen classes, without retraining, is one of the main reason you would want to use metric learning.\n", + "\n", + "\n", + "**WARNING**: Tensorflow similarity expects `y_train` to be an IntTensor containing the class ids for each example instead of the standard categorical encoding traditionally used for multi-class classification." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "97152229", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "(x_train, y_train), (x_test, y_test) = tf.keras.datasets.mnist.load_data()" + ] + }, + { + "cell_type": "markdown", + "id": "08b766d8", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "## Model setup" + ] + }, + { + "cell_type": "markdown", + "id": "3eac2da7", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Model definition\n", + "\n", + "`SimilarityModel()` models extend `tensorflow.keras.model.Model` with additional features and functionality that allow you to index and search for similar looking examples.\n", + "\n", + "As visible in the model definition below, similarity models output a 64 dimensional float embedding using the `MetricEmbedding()` layers. This layer is a Dense layer with L2 normalization. 
Thanks to the loss, the model learns to minimize the distance between similar examples and maximize the distance between dissimilar examples. As a result, the distance between examples in the embedding space is meaningful; the smaller the distance the more similar the examples are. \n", + "\n", + "Being able to use a distance as a meaningful proxy for how similar two examples are, is what enables the fast ANN (aproximate nearest neighbor) search. Using a sub-linear ANN search instead of a standard quadratic NN search is what allows deep similarity search to scale to millions of items. The built in memory index used in this notebook scales to a million indexed examples very easily... if you have enough RAM :)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a003c971", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "def get_model():\n", + " inputs = tf.keras.layers.Input(shape=(28, 28, 1))\n", + " x = tf.keras.layers.experimental.preprocessing.Rescaling(1 / 255)(inputs)\n", + " x = tf.keras.layers.Conv2D(32, 3, activation=\"relu\")(x)\n", + " x = tf.keras.layers.Conv2D(32, 3, activation=\"relu\")(x)\n", + " x = tf.keras.layers.MaxPool2D()(x)\n", + " x = tf.keras.layers.Conv2D(64, 3, activation=\"relu\")(x)\n", + " x = tf.keras.layers.Conv2D(64, 3, activation=\"relu\")(x)\n", + " x = tf.keras.layers.Flatten()(x)\n", + " # smaller embeddings will have faster lookup times while a larger embedding will improve the accuracy up to a point.\n", + " outputs = tfsim.layers.MetricEmbedding(64)(x)\n", + " return tfsim.models.SimilarityModel(inputs, outputs)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a2177b12", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "model = get_model()\n", + "model.summary()" + ] + }, + { + "cell_type": "markdown", + "id": "defb3961", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + 
"### ArcFace Loss definition\n", + "\n", + "Overall what makes Metric losses different from tradional losses is that:\n", + "- **They expect different inputs.** Instead of having the prediction equal the true values, they expect embeddings as `y_preds` and the id (as an int32) of the class as `y_true`. \n", + "- **They require a distance.** You need to specify which `distance` function to use to compute the distance between embeddings. `cosine` is usually a great starting point and the default.\n", + "\n", + "ArcFace Loss takes inputs as number of classes which labels includes, and embedding size which we define in model `MetricEmbedding()` layers." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "13b0d745", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "distance = \"cosine\" " + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "c22d10cc", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "num_classes = np.unique(y_train).size\n", + "embedding_size = model.get_layer('metric_embedding').output.shape[1]" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "d5b8e426", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "loss = tfsim.losses.ArcFaceLoss(num_classes= num_classes, embedding_size=embedding_size, name=\"ArcFaceLoss\")" + ] + }, + { + "cell_type": "markdown", + "id": "b6eaf9c8", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Compilation\n", + "\n", + "Tensorflow similarity use an extended `compile()` method that allows you to optionally specify `distance_metrics` (metrics that are computed over the distance between the embeddings), and the distance to use for the indexer.\n", + "\n", + "By default the `compile()` method tries to infer what type of distance you are using by looking at the first loss specified. 
If you use multiple losses, and the distance loss is not the first one, then you need to specify the distance function used as `distance=` parameter in the compile function." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "673f986f", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "LR = 0.0005 # @param {type:\"number\"}\n", + "model.compile(optimizer=tf.keras.optimizers.SGD(LR), loss=loss, distance=distance)" + ] + }, + { + "cell_type": "markdown", + "id": "15961601", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "## Training\n", + "\n", + "Similarity models are trained like normal models. " + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "147a6863", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "EPOCHS = 10 # @param {type:\"integer\"}\n", + "history = model.fit(x_train, y_train, epochs=EPOCHS, validation_data=(x_test, y_test))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "88e1ee4d", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "plt.plot(history.history[\"loss\"])\n", + "plt.plot(history.history[\"val_loss\"])\n", + "plt.legend([\"loss\", \"val_loss\"])\n", + "plt.title(f\"Loss: {loss.name}\")\n", + "plt.show()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a5404906", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [] + }, + { + "cell_type": "markdown", + "id": "5ad4ba20", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "## Prediction\n", + "\n", + "Let's predict some features and visualiza them." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a1936264", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "embedded_features = model.predict(x_test, verbose=1)\n", + "embedded_features /= np.linalg.norm(embedded_features, axis=1, keepdims=True)" + ] + }, + { + "cell_type": "markdown", + "id": "7c0df63b", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### 3D-Visualization of ArcFace Loss" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "5aac5d98", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "fig = plt.figure()\n", + "ax = Axes3D(fig)\n", + "for c in range(len(np.unique(y_test))):\n", + " ax.plot(embedded_features[y_test==c, 0], embedded_features[y_test==c, 1], embedded_features[y_test==c, 2], '.', alpha=0.1)\n", + "plt.title('ArcFace')\n", + "plt.show()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "8889f840", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "fef529d9", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.12" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} \ No newline at end of file diff --git a/arcface_loss.py b/arcface_loss.py new file mode 100644 index 00000000..e93a98fd --- /dev/null +++ b/arcface_loss.py @@ -0,0 +1,120 @@ +# Copyright 2022 The TensorFlow Authors. All Rights Reserved. 
+# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== +"""ArcFace losses base class. + +ArcFace: Additive Angular Margin Loss for Deep Face +Recognition. [online] arXiv.org. Available at: +. + +""" + +from typing import Any, Callable, Dict, Optional, Tuple, Union + +import tensorflow as tf + +from tensorflow_similarity.algebra import build_masks +from tensorflow_similarity.distances import Distance, distance_canonicalizer +from tensorflow_similarity.types import FloatTensor, IntTensor +from tensorflow_similarity.utils import is_tensor_or_variable + +from .metric_loss import MetricLoss +from .utils import logsumexp + + +@tf.keras.utils.register_keras_serializable(package="Similarity") +class ArcFaceLoss(tf.keras.losses.Loss): + """Implement of ArcFace: Additive Angular Margin Loss: + Step 1: Create a trainable kernel matrix with the shape of [embedding_size, num_classes]. + Step 2: Normalize the kernel and prediction vectors. + Step 3: Calculate the cosine similarity between the normalized prediction vector and the kernel. + Step 4: Create a one-hot vector include the margin value for the ground truth class. + Step 5: Add margin_hot to the cosine similarity and multiply it by scale. + Step 6: Calculate the cross-entropy loss. + + ArcFace: Additive Angular Margin Loss for Deep Face + Recognition. [online] arXiv.org. Available at: + . 
+ + Standalone usage: + >>> loss_fn = tfsim.losses.ArcFaceLoss(num_classes=2, embedding_size=3) + >>> labels = tf.Variable([1, 0]) + >>> embeddings = tf.Variable([[0.2, 0.3, 0.1], [0.4, 0.5, 0.5]]) + >>> loss = loss_fn(labels, embeddings) + Args: + num_classes: Number of classes. + embedding_size: The size of the embedding vectors. + margin: The margin value. + scale: s in the paper, feature scale + name: Optional name for the operation. + reduction: Type of loss reduction to apply to the loss. + """ + + def __init__( + self, + num_classes: int, + embedding_size: int, + margin: float = 0.50, # margin in radians + scale: float = 64.0, # feature scale + name: Optional[str] = None, + reduction: Callable = tf.keras.losses.Reduction.AUTO, + **kwargs + ): + + super().__init__(reduction=reduction, name=name, **kwargs) + + self.num_classes = num_classes + self.embedding_size = embedding_size + self.margin = margin + self.scale = scale + self.name = name + self.kernel = tf.Variable(tf.random.normal([embedding_size, num_classes])) + + def call(self, y_true: FloatTensor, y_pred: FloatTensor) -> FloatTensor: + + y_pred_norm = tf.math.l2_normalize(y_pred, axis=1) + kernel_norm = tf.math.l2_normalize(self.kernel, axis=0) + + cos_theta = tf.matmul(y_pred_norm, kernel_norm) + cos_theta = tf.clip_by_value(cos_theta, -1.0, 1.0) + + m_hot = tf.one_hot(y_true, self.num_classes, on_value=self.margin, axis=1) + m_hot = tf.reshape(m_hot, [-1, self.num_classes]) + + cos_theta = tf.acos(cos_theta) + cos_theta += m_hot + cos_theta = tf.math.cos(cos_theta) + cos_theta = tf.math.multiply(cos_theta, self.scale) + + cce = tf.keras.losses.SparseCategoricalCrossentropy( + from_logits=True, reduction=self.reduction + ) + loss: FloatTensor = cce(y_true, cos_theta) + + return loss + + def get_config(self) -> Dict[str, Any]: + """Contains the loss configuration. + Returns: + A Python dict containing the configuration of the loss. 
+ """ + config = { + "num_classes": self.num_classes, + "embedding_size": self.embedding_size, + "margin": self.margin, + "scale": self.scale, + "name": self.name, + } + base_config = super().get_config() + return {**base_config, **config} diff --git a/test_losses.py b/test_losses.py new file mode 100644 index 00000000..1169423f --- /dev/null +++ b/test_losses.py @@ -0,0 +1,275 @@ +import numpy as np +import tensorflow as tf + +from tensorflow_similarity.losses import ( + ArcFaceLoss, + MultiSimilarityLoss, + PNLoss, + SoftNearestNeighborLoss, + TripletLoss, +) + +# [triplet loss] +from tensorflow_similarity.losses.xbm_loss import XBM + + +def test_triplet_loss_serialization(): + loss = TripletLoss() + config = loss.get_config() + print(config) + loss2 = TripletLoss.from_config(config) + assert loss.name == loss2.name + assert loss.distance == loss2.distance + + +def triplet_hard_loss_np(labels, embedding, margin, dist_func, soft=False): + num_data = embedding.shape[0] + # Reshape labels to compute adjacency matrix. + labels_reshaped = np.reshape(labels.astype(np.float32), (labels.shape[0], 1)) + + adjacency = np.equal(labels_reshaped, labels_reshaped.T) + pdist_matrix = dist_func(embedding) + loss_np = 0.0 + for i in range(num_data): + pos_distances = [] + neg_distances = [] + for j in range(num_data): + if adjacency[i][j] == 0: + neg_distances.append(pdist_matrix[i][j]) + if adjacency[i][j] > 0.0 and i != j: + pos_distances.append(pdist_matrix[i][j]) + + # if there are no positive pairs, distance is 0 + if len(pos_distances) == 0: + pos_distances.append(0) + + # Sort by distance. 
+ neg_distances.sort() + min_neg_distance = neg_distances[0] + pos_distances.sort(reverse=True) + max_pos_distance = pos_distances[0] + + if soft: + loss_np += np.log1p(np.exp(max_pos_distance - min_neg_distance)) + else: + loss_np += np.maximum(0.0, max_pos_distance - min_neg_distance + margin) + + loss_np /= num_data + return loss_np + + +def test_triplet_loss(): + num_inputs = 10 + # y_true: labels + y_true = tf.random.uniform((num_inputs,), 0, 10, dtype=tf.int32) + # y_preds: embedding + y_preds = tf.random.uniform((num_inputs, 20), 0, 1) + tpl = TripletLoss() + # y_true, y_preds + loss = tpl(y_true, y_preds) + assert loss > 0.9 + + +def test_triplet_loss_easy(): + num_inputs = 10 + # y_true: labels + y_true = tf.random.uniform((num_inputs,), 0, 3, dtype=tf.int32) + # y_preds: embedding + y_preds = tf.random.uniform((num_inputs, 16), 0, 1) + tpl = TripletLoss(positive_mining_strategy="easy", negative_mining_strategy="easy") + # y_true, y_preds + loss = tpl(y_true, y_preds) + assert loss > 0 + + +def test_triplet_loss_semi_hard(): + num_inputs = 10 + # y_true: labels + y_true = tf.random.uniform((num_inputs,), 0, 3, dtype=tf.int32) + # y_preds: embedding + y_preds = tf.random.uniform((num_inputs, 16), 0, 1) + tpl = TripletLoss( + positive_mining_strategy="easy", negative_mining_strategy="semi-hard" + ) + # y_true, y_preds + loss = tpl(y_true, y_preds) + assert loss + + +def test_triplet_loss_hard(): + num_inputs = 10 + # y_true: labels + y_true = tf.random.uniform((num_inputs,), 0, 3, dtype=tf.int32) + # y_preds: embedding + y_preds = tf.random.uniform((num_inputs, 16), 0, 1) + tpl = TripletLoss(positive_mining_strategy="hard", negative_mining_strategy="hard") + # y_true, y_preds + loss = tpl(y_true, y_preds) + assert loss + + +# [pn loss] +def test_pn_loss_serialization(): + loss = PNLoss() + config = loss.get_config() + print(config) + loss2 = PNLoss.from_config(config) + assert loss.name == loss2.name + assert loss.distance == loss2.distance + + +def 
test_np_loss(): + num_inputs = 10 + # y_true: labels + y_true = tf.random.uniform((num_inputs,), 0, 10, dtype=tf.int32) + # y_preds: embedding + y_preds = tf.random.uniform((num_inputs, 20), 0, 1) + pnl = PNLoss() + # y_true, y_preds + loss = pnl(y_true, y_preds) + assert loss > 0.9 + + +# [soft neasrest neighbor loss] +def test_softnn_loss_serialization(): + loss = SoftNearestNeighborLoss(distance="cosine", temperature=50) + config = loss.get_config() + loss2 = SoftNearestNeighborLoss.from_config(config) + assert loss.name == loss2.name + assert loss.distance == loss2.distance + assert loss.temperature == loss2.temperature + + +def softnn_util(y_true, x, temperature=1): + """ + A simple loop based implementation of soft + nearest neighbor loss to test the code. + https://arxiv.org/pdf/1902.01889.pdf + """ + + y_true = y_true.numpy() + x = x.numpy() + batch_size = y_true.shape[0] + loss = 0 + eps = 1e-9 + for i in range(batch_size): + numerator = 0 + denominator = 0 + for j in range(batch_size): + if i == j: + continue + if y_true[i] == y_true[j]: + numerator += np.exp(-1 * np.sum(np.square(x[i] - x[j])) / temperature) + denominator += np.exp(-1 * np.sum(np.square(x[i] - x[j])) / temperature) + if numerator == 0: + continue + loss += np.log(numerator / denominator) + return -loss / batch_size + + +def test_softnn_loss(): + num_inputs = 10 + n_classes = 10 + # y_true: labels + y_true = tf.random.uniform((num_inputs,), 0, n_classes, dtype=tf.int32) + # x: embeddings + x = tf.random.uniform((num_inputs, 20), 0, 1) + + temperature = np.random.uniform(0.1, 50) + softnn = SoftNearestNeighborLoss(temperature=temperature) + loss = softnn(y_true, x) + loss_check = softnn_util(y_true, x, temperature) + loss_diff = loss.numpy() - loss_check + assert np.abs(loss_diff) < 1e-3 + + +def test_xbm_loss(): + batch_size = 6 + embed_dim = 16 + + embeddings1 = tf.random.uniform(shape=[batch_size, embed_dim]) + labels1 = tf.constant( + [ + [1], + [1], + [2], + [2], + [3], + [3], + ], + 
dtype=tf.int32, + ) + + embeddings2 = tf.random.uniform(shape=[batch_size, embed_dim]) + labels2 = tf.constant( + [ + [4], + [4], + [5], + [5], + [6], + [6], + ], + dtype=tf.int32, + ) + + distance = "cosine" + loss = MultiSimilarityLoss(distance=distance) + loss_nowarm = XBM(loss, memory_size=12, warmup_steps=0) + + # test enqueue + loss_nowarm(labels1, embeddings1) + assert loss_nowarm._y_pred_memory.numpy().shape == (batch_size, embed_dim) + tf.assert_equal(loss_nowarm._y_true_memory, labels1) + + loss_nowarm(labels2, embeddings2) + assert loss_nowarm._y_pred_memory.numpy().shape == (2 * batch_size, embed_dim) + tf.assert_equal(loss_nowarm._y_true_memory, tf.concat([labels2, labels1], axis=0)) + + # test dequeue + loss_nowarm(labels2, embeddings2) + assert loss_nowarm._y_pred_memory.numpy().shape == (2 * batch_size, embed_dim) + tf.assert_equal(loss_nowarm._y_true_memory, tf.concat([labels2, labels2], axis=0)) + + # test warmup + loss_warm = XBM(loss, memory_size=12, warmup_steps=1) + + loss_warm(labels1, embeddings1) + assert loss_warm._y_pred_memory.numpy().shape == (0, embed_dim) + tf.assert_equal(loss_warm._y_true_memory, tf.constant([[]], dtype=tf.int32)) + + loss_warm(labels2, embeddings2) + assert loss_warm._y_pred_memory.numpy().shape == (batch_size, embed_dim) + tf.assert_equal(loss_warm._y_true_memory, labels2) + + +# arcface loss +""" +ArcFaceLoss + ArcFace: Additive Angular Margin Loss for Deep Face + Recognition. [online] arXiv.org. Available at: + . 
+""" + + +def test_arcface_loss_serialization(): + n_classes = 10 + embed_size = 16 + loss = ArcFaceLoss(num_classes=n_classes, embedding_size=embed_size) + config = loss.get_config() + loss2 = ArcFaceLoss.from_config(config) + assert loss.name == loss2.name + assert loss.margin == loss2.margin + assert loss.scale == loss2.scale + assert loss.num_classes == loss2.num_classes + assert loss.embedding_size == loss2.embedding_size + + +def test_arcface_loss(): + tf.random.set_seed(128) + loss_fn = ArcFaceLoss(num_classes=4, embedding_size=5) + labels = tf.Variable([0, 1, 2, 3]) + embeddings = tf.Variable(tf.random.uniform(shape=[4, 5])) + loss = loss_fn(labels, embeddings) + + assert 60.4 < loss.numpy() < 60.5 From 7b84548cafd5d2695856e5faad35bb2c7951c726 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Aylin=20Ayd=C4=B1n?= Date: Wed, 21 Sep 2022 23:38:44 +0300 Subject: [PATCH 03/25] Delete ArcFace Loss Sample Notebook.ipynb --- .../losses/ArcFace Loss Sample Notebook.ipynb | 775 ------------------ 1 file changed, 775 deletions(-) delete mode 100644 tensorflow_similarity/losses/ArcFace Loss Sample Notebook.ipynb diff --git a/tensorflow_similarity/losses/ArcFace Loss Sample Notebook.ipynb b/tensorflow_similarity/losses/ArcFace Loss Sample Notebook.ipynb deleted file mode 100644 index b481492e..00000000 --- a/tensorflow_similarity/losses/ArcFace Loss Sample Notebook.ipynb +++ /dev/null @@ -1,775 +0,0 @@ -{ - "cells": [ - { - "cell_type": "markdown", - "id": "28956aa1", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "Copyright 2022 The TensorFlow Similarity Authors." 
- ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "24eda1a6", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "# @title Licensed under the Apache License, Version 2.0 (the \"License\");\n", - "# you may not use this file except in compliance with the License.\n", - "# You may obtain a copy of the License at\n", - "#\n", - "# https://www.apache.org/licenses/LICENSE-2.0\n", - "#\n", - "# Unless required by applicable law or agreed to in writing, software\n", - "# distributed under the License is distributed on an \"AS IS\" BASIS,\n", - "# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.\n", - "# See the License for the specific language governing permissions and\n", - "# limitations under the License." - ] - }, - { - "cell_type": "markdown", - "id": "7ca9d025", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "# TensorFlow Similarity ArcFace Loss Example" - ] - }, - { - "cell_type": "markdown", - "id": "d072628f", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "A Total Angular Margin Loss (ArcFace) calculates the geodetic distance in the hypersphere instead of the euclidean distance to improve the discriminatory strength of the facial recognition model and stabilize the training process. Rails are used to measure all distances in geodetic space. The geodetic trace is the path taken between two places. It specifies the geodetic distance, which is the shortest distance between two places.\n", - "\n", - "ArcFace loss determines the angle between the current feature and the target weight using the arc-cosine function since the dot product between the DCNN feature and the last fully connected layer after feature and weight normalization matches the cosine distance. The target logit is then returned by multiplying the goal angle by an additional angular margin and using the cosine function. 
After that, we continue as before and rescale all logits to a certain feature norm, just like with softmax loss." - ] - }, - { - "cell_type": "markdown", - "id": "808ac087", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Notebook goal\n", - "\n", - "This notebook demonstrates how to use ArcFaceLoss implementation of TensorFlow Similarity with standalone usage and to train a `SimilarityModel()` on a fraction of the MNIST classes.\n", - "\n", - "You are going to learn about the main features offered by the `ArcFaceLoss()` and will:\n", - "\n", - " 1. Standalone usage of ArcFaceLoss\n", - "\n", - " 2. Usage with `model.compile()`\n", - "\n", - " 3. 3D-Visualization of ArcFaceLoss \n", - "\n", - "### Things to try \n", - "\n", - "Along the way you can try the following things to improve the model performance:\n", - "- Adding more \"seen\" classes at training time.\n", - "- Use a larger embedding by increasing the size of the output.\n", - "- Add data augmentation pre-processing layers to the model.\n", - "- Include more examples in the index to give the models more points to choose from.\n", - "- Try a more challenging dataset, such as Fashion MNIST." - ] - }, - { - "cell_type": "markdown", - "id": "078c53c0", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Notebook goal\n", - "\n", - "This notebook demonstrates how to use ArcFaceLoss implementation of TensorFlow Similarity with standalone usage and to train a `SimilarityModel()` on a fraction of the MNIST classes.\n", - "\n", - "You are going to learn about the main features offered by the `ArcFaceLoss()` and will:\n", - "\n", - " 1. Standalone usage of ArcFaceLoss\n", - "\n", - " 2. Usage with `model.compile()`\n", - "\n", - " 3. 
3D-Visualization of ArcFaceLoss \n", - "\n", - "### Things to try \n", - "\n", - "Along the way you can try the following things to improve the model performance:\n", - "- Adding more \"seen\" classes at training time.\n", - "- Use a larger embedding by increasing the size of the output.\n", - "- Add data augmentation pre-processing layers to the model.\n", - "- Include more examples in the index to give the models more points to choose from.\n", - "- Try a more challenging dataset, such as Fashion MNIST." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "8fd63f16", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "import gc\n", - "import os\n", - "\n", - "import numpy as np\n", - "from matplotlib import pyplot as plt\n", - "from tabulate import tabulate\n", - "from mpl_toolkits.mplot3d import Axes3D\n", - "\n", - "# INFO messages are not printed.\n", - "# This must be run before loading other modules.\n", - "os.environ[\"TF_CPP_MIN_LOG_LEVEL\"] = \"1\"" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "80af5fc0", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "import tensorflow as tf" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "8ba8caf7", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "# install TF similarity if needed\n", - "try:\n", - " import tensorflow_similarity as tfsim # main package\n", - "except ModuleNotFoundError:\n", - " !pip install tensorflow_similarity\n", - " import tensorflow_similarity as tfsim" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "2484bd72", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "tfsim.utils.tf_cap_memory()" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "3fe0344e", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": 
[], - "source": [ - "# Clear out any old model state.\n", - "gc.collect()\n", - "tf.keras.backend.clear_session()" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "99d9bef9", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "print(\"TensorFlow:\", tf.__version__)\n", - "print(\"TensorFlow Similarity\", tfsim.__version__)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "7137afbc", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [] - }, - { - "cell_type": "markdown", - "id": "1d534ad3", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "# Standalone Usage of ArcFaceLoss\n", - "\n", - "ArcFace loss alone can be used as follows when it is desired to calculate the additive angular margin loss of the existing data set." - ] - }, - { - "cell_type": "markdown", - "id": "68d526da", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Initialize Loss function as ArcFaceLoss" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "bebf6ef0", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "loss_fn = tfsim.losses.ArcFaceLoss(num_classes=8, embedding_size=10)" - ] - }, - { - "cell_type": "markdown", - "id": "d2ccfd7d", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Create own simple random dataset" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "1d1ec43a", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "labels = tf.Variable([0, 1, 2, 3, 4, 5, 6, 7])\n", - "embeddings = tf.Variable(tf.random.uniform(shape=[8, 10]))" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "73d0c1c6", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "print(\"\", embeddings)" - ] - }, - { - "cell_type": 
"markdown", - "id": "d65b3085", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Calculate loss" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "cdf7c30c", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "loss = loss_fn(labels, embeddings)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "16745b7d", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "print(\"loss : \" , loss)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "outputs": [], - "source": [ - "loss = loss_fn(labels, embeddings)" - ], - "metadata": { - "collapsed": false, - "pycharm": { - "name": "#%%\n" - } - } - }, - { - "cell_type": "code", - "execution_count": null, - "outputs": [], - "source": [ - "print(\"loss : \" , loss)" - ], - "metadata": { - "collapsed": false, - "pycharm": { - "name": "#%%\n" - } - } - }, - { - "cell_type": "markdown", - "source": [ - "## Data preparation\n", - "\n", - "We are going to load the MNIST dataset to showcase how the model is able to find similar examples from classes unseen during training. The model's ability to generalize the matching to unseen classes, without retraining, is one of the main reason you would want to use metric learning.\n", - "\n", - "\n", - "**WARNING**: Tensorflow similarity expects `y_train` to be an IntTensor containing the class ids for each example instead of the standard categorical encoding traditionally used for multi-class classification." 
- ], - "metadata": { - "collapsed": false, - "pycharm": { - "name": "#%% md\n" - } - } - }, - { - "cell_type": "code", - "execution_count": null, - "id": "8a9f8122", - "metadata": {}, - "outputs": [], - "source": [ - "print(\"loss : \" , loss)" - ] - }, - { - "cell_type": "markdown", - "id": "11ef5236", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "## Data preparation\n", - "\n", - "We are going to load the MNIST dataset to showcase how the model is able to find similar examples from classes unseen during training. The model's ability to generalize the matching to unseen classes, without retraining, is one of the main reason you would want to use metric learning.\n", - "\n", - "\n", - "**WARNING**: Tensorflow similarity expects `y_train` to be an IntTensor containing the class ids for each example instead of the standard categorical encoding traditionally used for multi-class classification." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "97152229", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "(x_train, y_train), (x_test, y_test) = tf.keras.datasets.mnist.load_data()" - ] - }, - { - "cell_type": "markdown", - "id": "08b766d8", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "## Model setup" - ] - }, - { - "cell_type": "markdown", - "id": "3eac2da7", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Model definition\n", - "\n", - "`SimilarityModel()` models extend `tensorflow.keras.model.Model` with additional features and functionality that allow you to index and search for similar looking examples.\n", - "\n", - "As visible in the model definition below, similarity models output a 64 dimensional float embedding using the `MetricEmbedding()` layers. This layer is a Dense layer with L2 normalization. 
Thanks to the loss, the model learns to minimize the distance between similar examples and maximize the distance between dissimilar examples. As a result, the distance between examples in the embedding space is meaningful; the smaller the distance the more similar the examples are. \n", - "\n", - "Being able to use a distance as a meaningful proxy for how similar two examples are, is what enables the fast ANN (aproximate nearest neighbor) search. Using a sub-linear ANN search instead of a standard quadratic NN search is what allows deep similarity search to scale to millions of items. The built in memory index used in this notebook scales to a million indexed examples very easily... if you have enough RAM :)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "a003c971", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "def get_model():\n", - " inputs = tf.keras.layers.Input(shape=(28, 28, 1))\n", - " x = tf.keras.layers.experimental.preprocessing.Rescaling(1 / 255)(inputs)\n", - " x = tf.keras.layers.Conv2D(32, 3, activation=\"relu\")(x)\n", - " x = tf.keras.layers.Conv2D(32, 3, activation=\"relu\")(x)\n", - " x = tf.keras.layers.MaxPool2D()(x)\n", - " x = tf.keras.layers.Conv2D(64, 3, activation=\"relu\")(x)\n", - " x = tf.keras.layers.Conv2D(64, 3, activation=\"relu\")(x)\n", - " x = tf.keras.layers.Flatten()(x)\n", - " # smaller embeddings will have faster lookup times while a larger embedding will improve the accuracy up to a point.\n", - " outputs = tfsim.layers.MetricEmbedding(64)(x)\n", - " return tfsim.models.SimilarityModel(inputs, outputs)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "a2177b12", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "model = get_model()\n", - "model.summary()" - ] - }, - { - "cell_type": "markdown", - "id": "defb3961", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - 
"### ArcFace Loss definition\n", - "\n", - "Overall what makes Metric losses different from tradional losses is that:\n", - "- **They expect different inputs.** Instead of having the prediction equal the true values, they expect embeddings as `y_preds` and the id (as an int32) of the class as `y_true`. \n", - "- **They require a distance.** You need to specify which `distance` function to use to compute the distance between embeddings. `cosine` is usually a great starting point and the default.\n", - "\n", - "ArcFace Loss takes inputs as number of classes which labels includes, and embedding size which we define in model `MetricEmbedding()` layers." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "13b0d745", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "distance = \"cosine\" " - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "c22d10cc", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "num_classes = np.unique(y_train).size\n", - "embedding_size = model.get_layer('metric_embedding').output.shape[1]" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "d5b8e426", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "loss = tfsim.losses.ArcFaceLoss(num_classes= num_classes, embedding_size=embedding_size, name=\"ArcFaceLoss\")" - ] - }, - { - "cell_type": "markdown", - "id": "b6eaf9c8", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Compilation\n", - "\n", - "Tensorflow similarity use an extended `compile()` method that allows you to optionally specify `distance_metrics` (metrics that are computed over the distance between the embeddings), and the distance to use for the indexer.\n", - "\n", - "By default the `compile()` method tries to infer what type of distance you are using by looking at the first loss specified. 
If you use multiple losses, and the distance loss is not the first one, then you need to specify the distance function used as `distance=` parameter in the compile function." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "673f986f", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "LR = 0.0005 # @param {type:\"number\"}\n", - "model.compile(optimizer=tf.keras.optimizers.SGD(LR), loss=loss, distance=distance)" - ] - }, - { - "cell_type": "markdown", - "id": "15961601", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "## Training\n", - "\n", - "Similarity models are trained like normal models. " - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "147a6863", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "EPOCHS = 10 # @param {type:\"integer\"}\n", - "history = model.fit(x_train, y_train, epochs=EPOCHS, validation_data=(x_test, y_test))" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "88e1ee4d", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "plt.plot(history.history[\"loss\"])\n", - "plt.plot(history.history[\"val_loss\"])\n", - "plt.legend([\"loss\", \"val_loss\"])\n", - "plt.title(f\"Loss: {loss.name}\")\n", - "plt.show()" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "a5404906", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [] - }, - { - "cell_type": "markdown", - "id": "5ad4ba20", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "## Prediction\n", - "\n", - "Let's predict some features and visualiza them." 
- ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "a1936264", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "embedded_features = model.predict(x_test, verbose=1)\n", - "embedded_features /= np.linalg.norm(embedded_features, axis=1, keepdims=True)" - ] - }, - { - "cell_type": "markdown", - "id": "7c0df63b", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### 3D-Visualization of ArcFace Loss" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "5aac5d98", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "fig = plt.figure()\n", - "ax = Axes3D(fig)\n", - "for c in range(len(np.unique(y_test))):\n", - " ax.plot(embedded_features[y_test==c, 0], embedded_features[y_test==c, 1], embedded_features[y_test==c, 2], '.', alpha=0.1)\n", - "plt.title('ArcFace')\n", - "plt.show()" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "8889f840", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "fef529d9", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3 (ipykernel)", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.9.12" - } - }, - "nbformat": 4, - "nbformat_minor": 5 -} \ No newline at end of file From 49a18f69455a5d7da984d2f74963a164ec50b52f Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Aylin=20Ayd=C4=B1n?= Date: Wed, 21 Sep 2022 23:38:55 +0300 Subject: [PATCH 04/25] Delete test_losses.py --- tensorflow_similarity/losses/test_losses.py | 275 
-------------------- 1 file changed, 275 deletions(-) delete mode 100644 tensorflow_similarity/losses/test_losses.py diff --git a/tensorflow_similarity/losses/test_losses.py b/tensorflow_similarity/losses/test_losses.py deleted file mode 100644 index 1d4fef9c..00000000 --- a/tensorflow_similarity/losses/test_losses.py +++ /dev/null @@ -1,275 +0,0 @@ -import tensorflow as tf -import numpy as np -from tensorflow_similarity.losses import TripletLoss, MultiSimilarityLoss -from tensorflow_similarity.losses import PNLoss -from tensorflow_similarity.losses import SoftNearestNeighborLoss -from tensorflow_similarity.losses import ArcFaceLoss - -# [triplet loss] -from tensorflow_similarity.losses.xbm_loss import XBM - - -def test_triplet_loss_serialization(): - loss = TripletLoss() - config = loss.get_config() - print(config) - loss2 = TripletLoss.from_config(config) - assert loss.name == loss2.name - assert loss.distance == loss2.distance - - -def triplet_hard_loss_np(labels, embedding, margin, dist_func, soft=False): - num_data = embedding.shape[0] - # Reshape labels to compute adjacency matrix. - labels_reshaped = np.reshape(labels.astype(np.float32), - (labels.shape[0], 1)) - - adjacency = np.equal(labels_reshaped, labels_reshaped.T) - pdist_matrix = dist_func(embedding) - loss_np = 0.0 - for i in range(num_data): - pos_distances = [] - neg_distances = [] - for j in range(num_data): - if adjacency[i][j] == 0: - neg_distances.append(pdist_matrix[i][j]) - if adjacency[i][j] > 0.0 and i != j: - pos_distances.append(pdist_matrix[i][j]) - - # if there are no positive pairs, distance is 0 - if len(pos_distances) == 0: - pos_distances.append(0) - - # Sort by distance. 
- neg_distances.sort() - min_neg_distance = neg_distances[0] - pos_distances.sort(reverse=True) - max_pos_distance = pos_distances[0] - - if soft: - loss_np += np.log1p(np.exp(max_pos_distance - min_neg_distance)) - else: - loss_np += np.maximum(0.0, - max_pos_distance - min_neg_distance + margin) - - loss_np /= num_data - return loss_np - - -def test_triplet_loss(): - num_inputs = 10 - # y_true: labels - y_true = tf.random.uniform((num_inputs,), 0, 10, dtype=tf.int32) - # y_preds: embedding - y_preds = tf.random.uniform((num_inputs, 20), 0, 1) - tpl = TripletLoss() - # y_true, y_preds - loss = tpl(y_true, y_preds) - assert loss > 0.9 - - -def test_triplet_loss_easy(): - num_inputs = 10 - # y_true: labels - y_true = tf.random.uniform((num_inputs,), 0, 3, dtype=tf.int32) - # y_preds: embedding - y_preds = tf.random.uniform((num_inputs, 16), 0, 1) - tpl = TripletLoss(positive_mining_strategy='easy', - negative_mining_strategy='easy') - # y_true, y_preds - loss = tpl(y_true, y_preds) - assert loss > 0 - - -def test_triplet_loss_semi_hard(): - num_inputs = 10 - # y_true: labels - y_true = tf.random.uniform((num_inputs,), 0, 3, dtype=tf.int32) - # y_preds: embedding - y_preds = tf.random.uniform((num_inputs, 16), 0, 1) - tpl = TripletLoss(positive_mining_strategy='easy', - negative_mining_strategy='semi-hard') - # y_true, y_preds - loss = tpl(y_true, y_preds) - assert loss - - -def test_triplet_loss_hard(): - num_inputs = 10 - # y_true: labels - y_true = tf.random.uniform((num_inputs,), 0, 3, dtype=tf.int32) - # y_preds: embedding - y_preds = tf.random.uniform((num_inputs, 16), 0, 1) - tpl = TripletLoss(positive_mining_strategy='hard', - negative_mining_strategy='hard') - # y_true, y_preds - loss = tpl(y_true, y_preds) - assert loss - - -# [pn loss] -def test_pn_loss_serialization(): - loss = PNLoss() - config = loss.get_config() - print(config) - loss2 = PNLoss.from_config(config) - assert loss.name == loss2.name - assert loss.distance == loss2.distance - - -def 
test_np_loss(): - num_inputs = 10 - # y_true: labels - y_true = tf.random.uniform((num_inputs,), 0, 10, dtype=tf.int32) - # y_preds: embedding - y_preds = tf.random.uniform((num_inputs, 20), 0, 1) - pnl = PNLoss() - # y_true, y_preds - loss = pnl(y_true, y_preds) - assert loss > 0.9 - - -# [soft neasrest neighbor loss] -def test_softnn_loss_serialization(): - loss = SoftNearestNeighborLoss(distance="cosine", temperature=50) - config = loss.get_config() - loss2 = SoftNearestNeighborLoss.from_config(config) - assert loss.name == loss2.name - assert loss.distance == loss2.distance - assert loss.temperature == loss2.temperature - - -def softnn_util(y_true, x, temperature=1): - """ - A simple loop based implementation of soft - nearest neighbor loss to test the code. - https://arxiv.org/pdf/1902.01889.pdf - """ - - y_true = y_true.numpy() - x = x.numpy() - batch_size = y_true.shape[0] - loss = 0 - eps = 1e-9 - for i in range(batch_size): - numerator = 0 - denominator = 0 - for j in range(batch_size): - if i == j: continue - if y_true[i] == y_true[j]: - numerator += np.exp(-1 * - np.sum(np.square(x[i] - x[j])) / temperature) - denominator += np.exp(-1 * - np.sum(np.square(x[i] - x[j])) / temperature) - if numerator == 0: continue - loss += np.log(numerator / denominator) - return -loss / batch_size - - -def test_softnn_loss(): - num_inputs = 10 - n_classes = 10 - # y_true: labels - y_true = tf.random.uniform((num_inputs,), 0, n_classes, dtype=tf.int32) - # x: embeddings - x = tf.random.uniform((num_inputs, 20), 0, 1) - - temperature = np.random.uniform(0.1, 50) - softnn = SoftNearestNeighborLoss(temperature=temperature) - loss = softnn(y_true, x) - loss_check = softnn_util(y_true, x, temperature) - loss_diff = loss.numpy() - loss_check - assert np.abs(loss_diff) < 1e-3 - - -def test_xbm_loss(): - batch_size = 6 - embed_dim = 16 - - embeddings1 = tf.random.uniform(shape=[batch_size, embed_dim]) - labels1 = tf.constant( - [ - [1], - [1], - [2], - [2], - [3], - [3], - ], - 
dtype=tf.int32 - ) - - embeddings2 = tf.random.uniform(shape=[batch_size, embed_dim]) - labels2 = tf.constant( - [ - [4], - [4], - [5], - [5], - [6], - [6], - ], - dtype=tf.int32 - ) - - distance = "cosine" - loss = MultiSimilarityLoss(distance=distance) - loss_nowarm = XBM(loss, memory_size=12, warmup_steps=0) - - # test enqueue - loss_nowarm(labels1, embeddings1) - assert loss_nowarm._y_pred_memory.numpy().shape == (batch_size, embed_dim) - tf.assert_equal(loss_nowarm._y_true_memory, labels1) - - loss_nowarm(labels2, embeddings2) - assert loss_nowarm._y_pred_memory.numpy().shape == (2 * batch_size, embed_dim) - tf.assert_equal(loss_nowarm._y_true_memory, tf.concat([labels2, labels1], axis=0)) - - # test dequeue - loss_nowarm(labels2, embeddings2) - assert loss_nowarm._y_pred_memory.numpy().shape == (2 * batch_size, embed_dim) - tf.assert_equal(loss_nowarm._y_true_memory, tf.concat([labels2, labels2], axis=0)) - - # test warmup - loss_warm = XBM(loss, memory_size=12, warmup_steps=1) - - loss_warm(labels1, embeddings1) - assert loss_warm._y_pred_memory.numpy().shape == (0, embed_dim) - tf.assert_equal(loss_warm._y_true_memory, tf.constant([[]], dtype=tf.int32)) - - loss_warm(labels2, embeddings2) - assert loss_warm._y_pred_memory.numpy().shape == (batch_size, embed_dim) - tf.assert_equal(loss_warm._y_true_memory, labels2) - - -# arcface loss -""" -ArcFaceLoss - ArcFace: Additive Angular Margin Loss for Deep Face - Recognition. [online] arXiv.org. Available at: - . 
-""" - - -def test_arcface_loss_serialization(): - n_classes = 10 - embed_size = 16 - loss = ArcFaceLoss(num_classes=n_classes, embedding_size=embed_size) - config = loss.get_config() - loss2 = ArcFaceLoss.from_config(config) - assert loss.name == loss2.name - assert loss.margin == loss2.margin - assert loss.scale == loss2.scale - assert loss.num_classes == loss2.num_classes - assert loss.embedding_size == loss2.embedding_size - - - -def test_arcface_loss(): - tf.random.set_seed(128) - loss_fn = ArcFaceLoss(num_classes=4, embedding_size=5) - labels = tf.Variable([0, 1, 2, 3]) - embeddings = tf.Variable(tf.random.uniform(shape=[4, 5])) - loss = loss_fn(labels, embeddings) - - assert 60.4 < loss.numpy() < 60.5 From e0ea837a0a17e26f44044b31a97ec3f53279d7d4 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Aylin=20Ayd=C4=B1n?= Date: Wed, 21 Sep 2022 23:39:40 +0300 Subject: [PATCH 05/25] Add files via upload --- examples/ArcFace Loss Sample Notebook.ipynb | 775 ++++++++++++++++++++ 1 file changed, 775 insertions(+) create mode 100644 examples/ArcFace Loss Sample Notebook.ipynb diff --git a/examples/ArcFace Loss Sample Notebook.ipynb b/examples/ArcFace Loss Sample Notebook.ipynb new file mode 100644 index 00000000..b481492e --- /dev/null +++ b/examples/ArcFace Loss Sample Notebook.ipynb @@ -0,0 +1,775 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "28956aa1", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "Copyright 2022 The TensorFlow Similarity Authors." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "24eda1a6", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "# @title Licensed under the Apache License, Version 2.0 (the \"License\");\n", + "# you may not use this file except in compliance with the License.\n", + "# You may obtain a copy of the License at\n", + "#\n", + "# https://www.apache.org/licenses/LICENSE-2.0\n", + "#\n", + "# Unless required by applicable law or agreed to in writing, software\n", + "# distributed under the License is distributed on an \"AS IS\" BASIS,\n", + "# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.\n", + "# See the License for the specific language governing permissions and\n", + "# limitations under the License." + ] + }, + { + "cell_type": "markdown", + "id": "7ca9d025", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "# TensorFlow Similarity ArcFace Loss Example" + ] + }, + { + "cell_type": "markdown", + "id": "d072628f", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "A Total Angular Margin Loss (ArcFace) calculates the geodetic distance in the hypersphere instead of the euclidean distance to improve the discriminatory strength of the facial recognition model and stabilize the training process. Rails are used to measure all distances in geodetic space. The geodetic trace is the path taken between two places. It specifies the geodetic distance, which is the shortest distance between two places.\n", + "\n", + "ArcFace loss determines the angle between the current feature and the target weight using the arc-cosine function since the dot product between the DCNN feature and the last fully connected layer after feature and weight normalization matches the cosine distance. The target logit is then returned by multiplying the goal angle by an additional angular margin and using the cosine function. 
After that, we continue as before and rescale all logits to a certain feature norm, just like with softmax loss." + ] + }, + { + "cell_type": "markdown", + "id": "808ac087", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Notebook goal\n", + "\n", + "This notebook demonstrates how to use ArcFaceLoss implementation of TensorFlow Similarity with standalone usage and to train a `SimilarityModel()` on a fraction of the MNIST classes.\n", + "\n", + "You are going to learn about the main features offered by the `ArcFaceLoss()` and will:\n", + "\n", + " 1. Standalone usage of ArcFaceLoss\n", + "\n", + " 2. Usage with `model.compile()`\n", + "\n", + " 3. 3D-Visualization of ArcFaceLoss \n", + "\n", + "### Things to try \n", + "\n", + "Along the way you can try the following things to improve the model performance:\n", + "- Adding more \"seen\" classes at training time.\n", + "- Use a larger embedding by increasing the size of the output.\n", + "- Add data augmentation pre-processing layers to the model.\n", + "- Include more examples in the index to give the models more points to choose from.\n", + "- Try a more challenging dataset, such as Fashion MNIST." + ] + }, + { + "cell_type": "markdown", + "id": "078c53c0", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Notebook goal\n", + "\n", + "This notebook demonstrates how to use ArcFaceLoss implementation of TensorFlow Similarity with standalone usage and to train a `SimilarityModel()` on a fraction of the MNIST classes.\n", + "\n", + "You are going to learn about the main features offered by the `ArcFaceLoss()` and will:\n", + "\n", + " 1. Standalone usage of ArcFaceLoss\n", + "\n", + " 2. Usage with `model.compile()`\n", + "\n", + " 3. 
3D-Visualization of ArcFaceLoss \n", + "\n", + "### Things to try \n", + "\n", + "Along the way you can try the following things to improve the model performance:\n", + "- Adding more \"seen\" classes at training time.\n", + "- Use a larger embedding by increasing the size of the output.\n", + "- Add data augmentation pre-processing layers to the model.\n", + "- Include more examples in the index to give the models more points to choose from.\n", + "- Try a more challenging dataset, such as Fashion MNIST." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "8fd63f16", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "import gc\n", + "import os\n", + "\n", + "import numpy as np\n", + "from matplotlib import pyplot as plt\n", + "from tabulate import tabulate\n", + "from mpl_toolkits.mplot3d import Axes3D\n", + "\n", + "# INFO messages are not printed.\n", + "# This must be run before loading other modules.\n", + "os.environ[\"TF_CPP_MIN_LOG_LEVEL\"] = \"1\"" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "80af5fc0", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "import tensorflow as tf" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "8ba8caf7", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "# install TF similarity if needed\n", + "try:\n", + " import tensorflow_similarity as tfsim # main package\n", + "except ModuleNotFoundError:\n", + " !pip install tensorflow_similarity\n", + " import tensorflow_similarity as tfsim" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "2484bd72", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "tfsim.utils.tf_cap_memory()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "3fe0344e", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": 
[], + "source": [ + "# Clear out any old model state.\n", + "gc.collect()\n", + "tf.keras.backend.clear_session()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "99d9bef9", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "print(\"TensorFlow:\", tf.__version__)\n", + "print(\"TensorFlow Similarity\", tfsim.__version__)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "7137afbc", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [] + }, + { + "cell_type": "markdown", + "id": "1d534ad3", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "# Standalone Usage of ArcFaceLoss\n", + "\n", + "ArcFace loss alone can be used as follows when it is desired to calculate the additive angular margin loss of the existing data set." + ] + }, + { + "cell_type": "markdown", + "id": "68d526da", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Initialize Loss function as ArcFaceLoss" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "bebf6ef0", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "loss_fn = tfsim.losses.ArcFaceLoss(num_classes=8, embedding_size=10)" + ] + }, + { + "cell_type": "markdown", + "id": "d2ccfd7d", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Create own simple random dataset" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "1d1ec43a", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "labels = tf.Variable([0, 1, 2, 3, 4, 5, 6, 7])\n", + "embeddings = tf.Variable(tf.random.uniform(shape=[8, 10]))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "73d0c1c6", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "print(\"\", embeddings)" + ] + }, + { + "cell_type": 
"markdown", + "id": "d65b3085", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Calculate loss" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "cdf7c30c", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "loss = loss_fn(labels, embeddings)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "16745b7d", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "print(\"loss : \" , loss)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "outputs": [], + "source": [ + "loss = loss_fn(labels, embeddings)" + ], + "metadata": { + "collapsed": false, + "pycharm": { + "name": "#%%\n" + } + } + }, + { + "cell_type": "code", + "execution_count": null, + "outputs": [], + "source": [ + "print(\"loss : \" , loss)" + ], + "metadata": { + "collapsed": false, + "pycharm": { + "name": "#%%\n" + } + } + }, + { + "cell_type": "markdown", + "source": [ + "## Data preparation\n", + "\n", + "We are going to load the MNIST dataset to showcase how the model is able to find similar examples from classes unseen during training. The model's ability to generalize the matching to unseen classes, without retraining, is one of the main reason you would want to use metric learning.\n", + "\n", + "\n", + "**WARNING**: Tensorflow similarity expects `y_train` to be an IntTensor containing the class ids for each example instead of the standard categorical encoding traditionally used for multi-class classification." 
+ ], + "metadata": { + "collapsed": false, + "pycharm": { + "name": "#%% md\n" + } + } + }, + { + "cell_type": "code", + "execution_count": null, + "id": "8a9f8122", + "metadata": {}, + "outputs": [], + "source": [ + "print(\"loss : \" , loss)" + ] + }, + { + "cell_type": "markdown", + "id": "11ef5236", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "## Data preparation\n", + "\n", + "We are going to load the MNIST dataset to showcase how the model is able to find similar examples from classes unseen during training. The model's ability to generalize the matching to unseen classes, without retraining, is one of the main reason you would want to use metric learning.\n", + "\n", + "\n", + "**WARNING**: Tensorflow similarity expects `y_train` to be an IntTensor containing the class ids for each example instead of the standard categorical encoding traditionally used for multi-class classification." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "97152229", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "(x_train, y_train), (x_test, y_test) = tf.keras.datasets.mnist.load_data()" + ] + }, + { + "cell_type": "markdown", + "id": "08b766d8", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "## Model setup" + ] + }, + { + "cell_type": "markdown", + "id": "3eac2da7", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Model definition\n", + "\n", + "`SimilarityModel()` models extend `tensorflow.keras.model.Model` with additional features and functionality that allow you to index and search for similar looking examples.\n", + "\n", + "As visible in the model definition below, similarity models output a 64 dimensional float embedding using the `MetricEmbedding()` layers. This layer is a Dense layer with L2 normalization. 
Thanks to the loss, the model learns to minimize the distance between similar examples and maximize the distance between dissimilar examples. As a result, the distance between examples in the embedding space is meaningful; the smaller the distance the more similar the examples are. \n", + "\n", + "Being able to use a distance as a meaningful proxy for how similar two examples are, is what enables the fast ANN (approximate nearest neighbor) search. Using a sub-linear ANN search instead of a standard quadratic NN search is what allows deep similarity search to scale to millions of items. The built in memory index used in this notebook scales to a million indexed examples very easily... if you have enough RAM :)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a003c971", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "def get_model():\n", + " inputs = tf.keras.layers.Input(shape=(28, 28, 1))\n", + " x = tf.keras.layers.experimental.preprocessing.Rescaling(1 / 255)(inputs)\n", + " x = tf.keras.layers.Conv2D(32, 3, activation=\"relu\")(x)\n", + " x = tf.keras.layers.Conv2D(32, 3, activation=\"relu\")(x)\n", + " x = tf.keras.layers.MaxPool2D()(x)\n", + " x = tf.keras.layers.Conv2D(64, 3, activation=\"relu\")(x)\n", + " x = tf.keras.layers.Conv2D(64, 3, activation=\"relu\")(x)\n", + " x = tf.keras.layers.Flatten()(x)\n", + " # smaller embeddings will have faster lookup times while a larger embedding will improve the accuracy up to a point.\n", + " outputs = tfsim.layers.MetricEmbedding(64)(x)\n", + " return tfsim.models.SimilarityModel(inputs, outputs)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a2177b12", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "model = get_model()\n", + "model.summary()" + ] + }, + { + "cell_type": "markdown", + "id": "defb3961", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + 
"### ArcFace Loss definition\n", + "\n", + "Overall what makes Metric losses different from traditional losses is that:\n", + "- **They expect different inputs.** Instead of having the prediction equal the true values, they expect embeddings as `y_preds` and the id (as an int32) of the class as `y_true`. \n", + "- **They require a distance.** You need to specify which `distance` function to use to compute the distance between embeddings. `cosine` is usually a great starting point and the default.\n", + "\n", + "ArcFace Loss takes as inputs the number of classes present in the labels and the embedding size defined by the model's `MetricEmbedding()` layer." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "13b0d745", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "distance = \"cosine\" " + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "c22d10cc", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "num_classes = np.unique(y_train).size\n", + "embedding_size = model.get_layer('metric_embedding').output.shape[1]" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "d5b8e426", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "loss = tfsim.losses.ArcFaceLoss(num_classes= num_classes, embedding_size=embedding_size, name=\"ArcFaceLoss\")" + ] + }, + { + "cell_type": "markdown", + "id": "b6eaf9c8", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Compilation\n", + "\n", + "Tensorflow similarity uses an extended `compile()` method that allows you to optionally specify `distance_metrics` (metrics that are computed over the distance between the embeddings), and the distance to use for the indexer.\n", + "\n", + "By default the `compile()` method tries to infer what type of distance you are using by looking at the first loss specified. 
If you use multiple losses, and the distance loss is not the first one, then you need to specify the distance function used as `distance=` parameter in the compile function." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "673f986f", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "LR = 0.0005 # @param {type:\"number\"}\n", + "model.compile(optimizer=tf.keras.optimizers.SGD(LR), loss=loss, distance=distance)" + ] + }, + { + "cell_type": "markdown", + "id": "15961601", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "## Training\n", + "\n", + "Similarity models are trained like normal models. " + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "147a6863", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "EPOCHS = 10 # @param {type:\"integer\"}\n", + "history = model.fit(x_train, y_train, epochs=EPOCHS, validation_data=(x_test, y_test))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "88e1ee4d", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "plt.plot(history.history[\"loss\"])\n", + "plt.plot(history.history[\"val_loss\"])\n", + "plt.legend([\"loss\", \"val_loss\"])\n", + "plt.title(f\"Loss: {loss.name}\")\n", + "plt.show()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a5404906", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [] + }, + { + "cell_type": "markdown", + "id": "5ad4ba20", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "## Prediction\n", + "\n", + "Let's predict some features and visualize them." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a1936264", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "embedded_features = model.predict(x_test, verbose=1)\n", + "embedded_features /= np.linalg.norm(embedded_features, axis=1, keepdims=True)" + ] + }, + { + "cell_type": "markdown", + "id": "7c0df63b", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### 3D-Visualization of ArcFace Loss" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "5aac5d98", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "fig = plt.figure()\n", + "ax = Axes3D(fig)\n", + "for c in range(len(np.unique(y_test))):\n", + " ax.plot(embedded_features[y_test==c, 0], embedded_features[y_test==c, 1], embedded_features[y_test==c, 2], '.', alpha=0.1)\n", + "plt.title('ArcFace')\n", + "plt.show()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "8889f840", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "fef529d9", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.12" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} \ No newline at end of file From 882e8d37208f8cdd55a0db9fe601a25a9bb65761 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Aylin=20Ayd=C4=B1n?= Date: Wed, 21 Sep 2022 23:40:12 +0300 Subject: [PATCH 06/25] Add files via upload --- tests/test_losses.py | 38 ++++++++++++++++++++++++++++++++++++-- 1 
file changed, 36 insertions(+), 2 deletions(-) diff --git a/tests/test_losses.py b/tests/test_losses.py index 78181eab..1169423f 100644 --- a/tests/test_losses.py +++ b/tests/test_losses.py @@ -2,6 +2,7 @@ import tensorflow as tf from tensorflow_similarity.losses import ( + ArcFaceLoss, MultiSimilarityLoss, PNLoss, SoftNearestNeighborLoss, @@ -22,7 +23,6 @@ def test_triplet_loss_serialization(): def triplet_hard_loss_np(labels, embedding, margin, dist_func, soft=False): - num_data = embedding.shape[0] # Reshape labels to compute adjacency matrix. labels_reshaped = np.reshape(labels.astype(np.float32), (labels.shape[0], 1)) @@ -88,7 +88,9 @@ def test_triplet_loss_semi_hard(): y_true = tf.random.uniform((num_inputs,), 0, 3, dtype=tf.int32) # y_preds: embedding y_preds = tf.random.uniform((num_inputs, 16), 0, 1) - tpl = TripletLoss(positive_mining_strategy="easy", negative_mining_strategy="semi-hard") + tpl = TripletLoss( + positive_mining_strategy="easy", negative_mining_strategy="semi-hard" + ) # y_true, y_preds loss = tpl(y_true, y_preds) assert loss @@ -239,3 +241,35 @@ def test_xbm_loss(): loss_warm(labels2, embeddings2) assert loss_warm._y_pred_memory.numpy().shape == (batch_size, embed_dim) tf.assert_equal(loss_warm._y_true_memory, labels2) + + +# arcface loss +""" +ArcFaceLoss + ArcFace: Additive Angular Margin Loss for Deep Face + Recognition. [online] arXiv.org. Available at: + . 
+""" + + +def test_arcface_loss_serialization(): + n_classes = 10 + embed_size = 16 + loss = ArcFaceLoss(num_classes=n_classes, embedding_size=embed_size) + config = loss.get_config() + loss2 = ArcFaceLoss.from_config(config) + assert loss.name == loss2.name + assert loss.margin == loss2.margin + assert loss.scale == loss2.scale + assert loss.num_classes == loss2.num_classes + assert loss.embedding_size == loss2.embedding_size + + +def test_arcface_loss(): + tf.random.set_seed(128) + loss_fn = ArcFaceLoss(num_classes=4, embedding_size=5) + labels = tf.Variable([0, 1, 2, 3]) + embeddings = tf.Variable(tf.random.uniform(shape=[4, 5])) + loss = loss_fn(labels, embeddings) + + assert 60.4 < loss.numpy() < 60.5 From 9eb3a34db80c0720d2bcf92f5623ff640f002df5 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Aylin=20Ayd=C4=B1n?= Date: Thu, 22 Sep 2022 12:16:40 +0300 Subject: [PATCH 07/25] Delete test_losses.py --- test_losses.py | 275 ------------------------------------------------- 1 file changed, 275 deletions(-) delete mode 100644 test_losses.py diff --git a/test_losses.py b/test_losses.py deleted file mode 100644 index 1169423f..00000000 --- a/test_losses.py +++ /dev/null @@ -1,275 +0,0 @@ -import numpy as np -import tensorflow as tf - -from tensorflow_similarity.losses import ( - ArcFaceLoss, - MultiSimilarityLoss, - PNLoss, - SoftNearestNeighborLoss, - TripletLoss, -) - -# [triplet loss] -from tensorflow_similarity.losses.xbm_loss import XBM - - -def test_triplet_loss_serialization(): - loss = TripletLoss() - config = loss.get_config() - print(config) - loss2 = TripletLoss.from_config(config) - assert loss.name == loss2.name - assert loss.distance == loss2.distance - - -def triplet_hard_loss_np(labels, embedding, margin, dist_func, soft=False): - num_data = embedding.shape[0] - # Reshape labels to compute adjacency matrix. 
- labels_reshaped = np.reshape(labels.astype(np.float32), (labels.shape[0], 1)) - - adjacency = np.equal(labels_reshaped, labels_reshaped.T) - pdist_matrix = dist_func(embedding) - loss_np = 0.0 - for i in range(num_data): - pos_distances = [] - neg_distances = [] - for j in range(num_data): - if adjacency[i][j] == 0: - neg_distances.append(pdist_matrix[i][j]) - if adjacency[i][j] > 0.0 and i != j: - pos_distances.append(pdist_matrix[i][j]) - - # if there are no positive pairs, distance is 0 - if len(pos_distances) == 0: - pos_distances.append(0) - - # Sort by distance. - neg_distances.sort() - min_neg_distance = neg_distances[0] - pos_distances.sort(reverse=True) - max_pos_distance = pos_distances[0] - - if soft: - loss_np += np.log1p(np.exp(max_pos_distance - min_neg_distance)) - else: - loss_np += np.maximum(0.0, max_pos_distance - min_neg_distance + margin) - - loss_np /= num_data - return loss_np - - -def test_triplet_loss(): - num_inputs = 10 - # y_true: labels - y_true = tf.random.uniform((num_inputs,), 0, 10, dtype=tf.int32) - # y_preds: embedding - y_preds = tf.random.uniform((num_inputs, 20), 0, 1) - tpl = TripletLoss() - # y_true, y_preds - loss = tpl(y_true, y_preds) - assert loss > 0.9 - - -def test_triplet_loss_easy(): - num_inputs = 10 - # y_true: labels - y_true = tf.random.uniform((num_inputs,), 0, 3, dtype=tf.int32) - # y_preds: embedding - y_preds = tf.random.uniform((num_inputs, 16), 0, 1) - tpl = TripletLoss(positive_mining_strategy="easy", negative_mining_strategy="easy") - # y_true, y_preds - loss = tpl(y_true, y_preds) - assert loss > 0 - - -def test_triplet_loss_semi_hard(): - num_inputs = 10 - # y_true: labels - y_true = tf.random.uniform((num_inputs,), 0, 3, dtype=tf.int32) - # y_preds: embedding - y_preds = tf.random.uniform((num_inputs, 16), 0, 1) - tpl = TripletLoss( - positive_mining_strategy="easy", negative_mining_strategy="semi-hard" - ) - # y_true, y_preds - loss = tpl(y_true, y_preds) - assert loss - - -def 
test_triplet_loss_hard(): - num_inputs = 10 - # y_true: labels - y_true = tf.random.uniform((num_inputs,), 0, 3, dtype=tf.int32) - # y_preds: embedding - y_preds = tf.random.uniform((num_inputs, 16), 0, 1) - tpl = TripletLoss(positive_mining_strategy="hard", negative_mining_strategy="hard") - # y_true, y_preds - loss = tpl(y_true, y_preds) - assert loss - - -# [pn loss] -def test_pn_loss_serialization(): - loss = PNLoss() - config = loss.get_config() - print(config) - loss2 = PNLoss.from_config(config) - assert loss.name == loss2.name - assert loss.distance == loss2.distance - - -def test_np_loss(): - num_inputs = 10 - # y_true: labels - y_true = tf.random.uniform((num_inputs,), 0, 10, dtype=tf.int32) - # y_preds: embedding - y_preds = tf.random.uniform((num_inputs, 20), 0, 1) - pnl = PNLoss() - # y_true, y_preds - loss = pnl(y_true, y_preds) - assert loss > 0.9 - - -# [soft neasrest neighbor loss] -def test_softnn_loss_serialization(): - loss = SoftNearestNeighborLoss(distance="cosine", temperature=50) - config = loss.get_config() - loss2 = SoftNearestNeighborLoss.from_config(config) - assert loss.name == loss2.name - assert loss.distance == loss2.distance - assert loss.temperature == loss2.temperature - - -def softnn_util(y_true, x, temperature=1): - """ - A simple loop based implementation of soft - nearest neighbor loss to test the code. 
- https://arxiv.org/pdf/1902.01889.pdf - """ - - y_true = y_true.numpy() - x = x.numpy() - batch_size = y_true.shape[0] - loss = 0 - eps = 1e-9 - for i in range(batch_size): - numerator = 0 - denominator = 0 - for j in range(batch_size): - if i == j: - continue - if y_true[i] == y_true[j]: - numerator += np.exp(-1 * np.sum(np.square(x[i] - x[j])) / temperature) - denominator += np.exp(-1 * np.sum(np.square(x[i] - x[j])) / temperature) - if numerator == 0: - continue - loss += np.log(numerator / denominator) - return -loss / batch_size - - -def test_softnn_loss(): - num_inputs = 10 - n_classes = 10 - # y_true: labels - y_true = tf.random.uniform((num_inputs,), 0, n_classes, dtype=tf.int32) - # x: embeddings - x = tf.random.uniform((num_inputs, 20), 0, 1) - - temperature = np.random.uniform(0.1, 50) - softnn = SoftNearestNeighborLoss(temperature=temperature) - loss = softnn(y_true, x) - loss_check = softnn_util(y_true, x, temperature) - loss_diff = loss.numpy() - loss_check - assert np.abs(loss_diff) < 1e-3 - - -def test_xbm_loss(): - batch_size = 6 - embed_dim = 16 - - embeddings1 = tf.random.uniform(shape=[batch_size, embed_dim]) - labels1 = tf.constant( - [ - [1], - [1], - [2], - [2], - [3], - [3], - ], - dtype=tf.int32, - ) - - embeddings2 = tf.random.uniform(shape=[batch_size, embed_dim]) - labels2 = tf.constant( - [ - [4], - [4], - [5], - [5], - [6], - [6], - ], - dtype=tf.int32, - ) - - distance = "cosine" - loss = MultiSimilarityLoss(distance=distance) - loss_nowarm = XBM(loss, memory_size=12, warmup_steps=0) - - # test enqueue - loss_nowarm(labels1, embeddings1) - assert loss_nowarm._y_pred_memory.numpy().shape == (batch_size, embed_dim) - tf.assert_equal(loss_nowarm._y_true_memory, labels1) - - loss_nowarm(labels2, embeddings2) - assert loss_nowarm._y_pred_memory.numpy().shape == (2 * batch_size, embed_dim) - tf.assert_equal(loss_nowarm._y_true_memory, tf.concat([labels2, labels1], axis=0)) - - # test dequeue - loss_nowarm(labels2, embeddings2) - assert 
loss_nowarm._y_pred_memory.numpy().shape == (2 * batch_size, embed_dim) - tf.assert_equal(loss_nowarm._y_true_memory, tf.concat([labels2, labels2], axis=0)) - - # test warmup - loss_warm = XBM(loss, memory_size=12, warmup_steps=1) - - loss_warm(labels1, embeddings1) - assert loss_warm._y_pred_memory.numpy().shape == (0, embed_dim) - tf.assert_equal(loss_warm._y_true_memory, tf.constant([[]], dtype=tf.int32)) - - loss_warm(labels2, embeddings2) - assert loss_warm._y_pred_memory.numpy().shape == (batch_size, embed_dim) - tf.assert_equal(loss_warm._y_true_memory, labels2) - - -# arcface loss -""" -ArcFaceLoss - ArcFace: Additive Angular Margin Loss for Deep Face - Recognition. [online] arXiv.org. Available at: - . -""" - - -def test_arcface_loss_serialization(): - n_classes = 10 - embed_size = 16 - loss = ArcFaceLoss(num_classes=n_classes, embedding_size=embed_size) - config = loss.get_config() - loss2 = ArcFaceLoss.from_config(config) - assert loss.name == loss2.name - assert loss.margin == loss2.margin - assert loss.scale == loss2.scale - assert loss.num_classes == loss2.num_classes - assert loss.embedding_size == loss2.embedding_size - - -def test_arcface_loss(): - tf.random.set_seed(128) - loss_fn = ArcFaceLoss(num_classes=4, embedding_size=5) - labels = tf.Variable([0, 1, 2, 3]) - embeddings = tf.Variable(tf.random.uniform(shape=[4, 5])) - loss = loss_fn(labels, embeddings) - - assert 60.4 < loss.numpy() < 60.5 From 8db6bc9a171dd20de260ac0f511653f0ff74ddd8 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Aylin=20Ayd=C4=B1n?= Date: Thu, 22 Sep 2022 12:16:52 +0300 Subject: [PATCH 08/25] Delete arcface_loss.py --- arcface_loss.py | 120 ------------------------------------------------ 1 file changed, 120 deletions(-) delete mode 100644 arcface_loss.py diff --git a/arcface_loss.py b/arcface_loss.py deleted file mode 100644 index e93a98fd..00000000 --- a/arcface_loss.py +++ /dev/null @@ -1,120 +0,0 @@ -# Copyright 2022 The TensorFlow Authors. All Rights Reserved. 
-# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -# See the License for the specific language governing permissions and -# limitations under the License. -# ============================================================================== -"""ArcFace losses base class. - -ArcFace: Additive Angular Margin Loss for Deep Face -Recognition. [online] arXiv.org. Available at: -. - -""" - -from typing import Any, Callable, Dict, Optional, Tuple, Union - -import tensorflow as tf - -from tensorflow_similarity.algebra import build_masks -from tensorflow_similarity.distances import Distance, distance_canonicalizer -from tensorflow_similarity.types import FloatTensor, IntTensor -from tensorflow_similarity.utils import is_tensor_or_variable - -from .metric_loss import MetricLoss -from .utils import logsumexp - - -@tf.keras.utils.register_keras_serializable(package="Similarity") -class ArcFaceLoss(tf.keras.losses.Loss): - """Implement of ArcFace: Additive Angular Margin Loss: - Step 1: Create a trainable kernel matrix with the shape of [embedding_size, num_classes]. - Step 2: Normalize the kernel and prediction vectors. - Step 3: Calculate the cosine similarity between the normalized prediction vector and the kernel. - Step 4: Create a one-hot vector include the margin value for the ground truth class. - Step 5: Add margin_hot to the cosine similarity and multiply it by scale. - Step 6: Calculate the cross-entropy loss. - - ArcFace: Additive Angular Margin Loss for Deep Face - Recognition. [online] arXiv.org. Available at: - . 
- - Standalone usage: - >>> loss_fn = tfsim.losses.ArcFaceLoss(num_classes=2, embedding_size=3) - >>> labels = tf.Variable([1, 0]) - >>> embeddings = tf.Variable([[0.2, 0.3, 0.1], [0.4, 0.5, 0.5]]) - >>> loss = loss_fn(labels, embeddings) - Args: - num_classes: Number of classes. - embedding_size: The size of the embedding vectors. - margin: The margin value. - scale: s in the paper, feature scale - name: Optional name for the operation. - reduction: Type of loss reduction to apply to the loss. - """ - - def __init__( - self, - num_classes: int, - embedding_size: int, - margin: float = 0.50, # margin in radians - scale: float = 64.0, # feature scale - name: Optional[str] = None, - reduction: Callable = tf.keras.losses.Reduction.AUTO, - **kwargs - ): - - super().__init__(reduction=reduction, name=name, **kwargs) - - self.num_classes = num_classes - self.embedding_size = embedding_size - self.margin = margin - self.scale = scale - self.name = name - self.kernel = tf.Variable(tf.random.normal([embedding_size, num_classes])) - - def call(self, y_true: FloatTensor, y_pred: FloatTensor) -> FloatTensor: - - y_pred_norm = tf.math.l2_normalize(y_pred, axis=1) - kernel_norm = tf.math.l2_normalize(self.kernel, axis=0) - - cos_theta = tf.matmul(y_pred_norm, kernel_norm) - cos_theta = tf.clip_by_value(cos_theta, -1.0, 1.0) - - m_hot = tf.one_hot(y_true, self.num_classes, on_value=self.margin, axis=1) - m_hot = tf.reshape(m_hot, [-1, self.num_classes]) - - cos_theta = tf.acos(cos_theta) - cos_theta += m_hot - cos_theta = tf.math.cos(cos_theta) - cos_theta = tf.math.multiply(cos_theta, self.scale) - - cce = tf.keras.losses.SparseCategoricalCrossentropy( - from_logits=True, reduction=self.reduction - ) - loss: FloatTensor = cce(y_true, cos_theta) - - return loss - - def get_config(self) -> Dict[str, Any]: - """Contains the loss configuration. - Returns: - A Python dict containing the configuration of the loss. 
- """ - config = { - "num_classes": self.num_classes, - "embedding_size": self.embedding_size, - "margin": self.margin, - "scale": self.scale, - "name": self.name, - } - base_config = super().get_config() - return {**base_config, **config} From d6c1d344fceea0e0494fb45a1afa64b6340c416a Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Aylin=20Ayd=C4=B1n?= Date: Thu, 22 Sep 2022 12:25:38 +0300 Subject: [PATCH 09/25] Add files via upload --- tensorflow_similarity/losses/arcface_loss.py | 6 +----- 1 file changed, 1 insertion(+), 5 deletions(-) diff --git a/tensorflow_similarity/losses/arcface_loss.py b/tensorflow_similarity/losses/arcface_loss.py index e0252d5c..e20bf06e 100644 --- a/tensorflow_similarity/losses/arcface_loss.py +++ b/tensorflow_similarity/losses/arcface_loss.py @@ -13,11 +13,9 @@ # limitations under the License. # ============================================================================== """ArcFace losses base class. - ArcFace: Additive Angular Margin Loss for Deep Face Recognition. [online] arXiv.org. Available at: . - """ from typing import Any, Callable, Dict, Optional, Tuple, Union @@ -41,11 +39,9 @@ class ArcFaceLoss(tf.keras.losses.Loss): Step 4: Create a one-hot vector include the margin value for the ground truth class. Step 5: Add margin_hot to the cosine similarity and multiply it by scale. Step 6: Calculate the cross-entropy loss. - ArcFace: Additive Angular Margin Loss for Deep Face Recognition. [online] arXiv.org. Available at: . - Standalone usage: >>> loss_fn = tfsim.losses.ArcFaceLoss(num_classes=2, embedding_size=3) >>> labels = tf.Variable([1, 0]) @@ -106,7 +102,7 @@ def call(self, y_true: FloatTensor, y_pred: FloatTensor) -> FloatTensor: def get_config(self) -> Dict[str, Any]: """Contains the loss configuration. Returns: - A Python dict containing the configuration of the loss. + The configuration of the ArcFace loss. 
""" config = { "num_classes": self.num_classes, From 0274c3d654ffc4f5354621e5e0f886d05d849991 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Aylin=20Ayd=C4=B1n?= Date: Thu, 22 Sep 2022 12:26:51 +0300 Subject: [PATCH 10/25] Add files via upload --- tests/test_losses.py | 15 ++++++--------- 1 file changed, 6 insertions(+), 9 deletions(-) diff --git a/tests/test_losses.py b/tests/test_losses.py index 1169423f..ce958cb5 100644 --- a/tests/test_losses.py +++ b/tests/test_losses.py @@ -1,14 +1,8 @@ import numpy as np import tensorflow as tf - -from tensorflow_similarity.losses import ( - ArcFaceLoss, - MultiSimilarityLoss, - PNLoss, - SoftNearestNeighborLoss, - TripletLoss, -) - +from tensorflow_similarity.losses import (ArcFaceLoss, MultiSimilarityLoss, + PNLoss, SoftNearestNeighborLoss, + TripletLoss) # [triplet loss] from tensorflow_similarity.losses.xbm_loss import XBM @@ -270,6 +264,9 @@ def test_arcface_loss(): loss_fn = ArcFaceLoss(num_classes=4, embedding_size=5) labels = tf.Variable([0, 1, 2, 3]) embeddings = tf.Variable(tf.random.uniform(shape=[4, 5])) + print(embeddings) + loss = loss_fn(labels, embeddings) + print(loss) assert 60.4 < loss.numpy() < 60.5 From bc108c45156b142ef71320c039aacee055ffd8c8 Mon Sep 17 00:00:00 2001 From: Abhishar Sinha <24841841+abhisharsinha@users.noreply.github.com> Date: Tue, 20 Sep 2022 23:49:16 +0530 Subject: [PATCH 11/25] Fixed typo to resolve #284 The function should be tf.concat instead of tf.constant, according to the description given above. 
This also resolves issue #284 --- tensorflow_similarity/classification_metrics/precision.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tensorflow_similarity/classification_metrics/precision.py b/tensorflow_similarity/classification_metrics/precision.py index 4569cb61..4938d74f 100644 --- a/tensorflow_similarity/classification_metrics/precision.py +++ b/tensorflow_similarity/classification_metrics/precision.py @@ -84,7 +84,7 @@ def compute( # The following accounts for the and sets the first precision value to # 1.0 if the first recall and precision are both zero. if (tp + fp)[0] == 0.0 and len(p) > 1: - initial_precision = tf.constant([tf.constant([1.0]), tf.zeros(len(p) - 1)], axis=0) + initial_precision = tf.concat([tf.constant([1.0]), tf.zeros(len(p) - 1)], axis=0) p = p + initial_precision return p From 7cbbdcf8841c0e48c5602ec4c34064e86f87223f Mon Sep 17 00:00:00 2001 From: Owen Vallis Date: Fri, 23 Sep 2022 20:13:00 +0000 Subject: [PATCH 12/25] Patch bump to 0.16.8 --- tensorflow_similarity/__init__.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tensorflow_similarity/__init__.py b/tensorflow_similarity/__init__.py index 863c4b00..d8fbc9c2 100644 --- a/tensorflow_similarity/__init__.py +++ b/tensorflow_similarity/__init__.py @@ -11,7 +11,7 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. -__version__ = "0.16.7" +__version__ = "0.16.8" from . 
import algebra # noqa From 2ff3b7291d71f031621276a536794f6d5e05e9ee Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Aylin=20Ayd=C4=B1n?= Date: Wed, 28 Sep 2022 10:31:19 +0300 Subject: [PATCH 13/25] Add files via upload --- tests/test_losses.py | 1 + 1 file changed, 1 insertion(+) diff --git a/tests/test_losses.py b/tests/test_losses.py index ce958cb5..3a96a32f 100644 --- a/tests/test_losses.py +++ b/tests/test_losses.py @@ -1,5 +1,6 @@ import numpy as np import tensorflow as tf + from tensorflow_similarity.losses import (ArcFaceLoss, MultiSimilarityLoss, PNLoss, SoftNearestNeighborLoss, TripletLoss) From 17f7051eeafdd209f112202727c210f5fcfb9c28 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Aylin=20Ayd=C4=B1n?= Date: Wed, 28 Sep 2022 10:31:38 +0300 Subject: [PATCH 14/25] Add files via upload --- tensorflow_similarity/losses/arcface_loss.py | 14 ++++++-------- 1 file changed, 6 insertions(+), 8 deletions(-) diff --git a/tensorflow_similarity/losses/arcface_loss.py b/tensorflow_similarity/losses/arcface_loss.py index e20bf06e..9ac55c60 100644 --- a/tensorflow_similarity/losses/arcface_loss.py +++ b/tensorflow_similarity/losses/arcface_loss.py @@ -18,16 +18,12 @@ . 
""" -from typing import Any, Callable, Dict, Optional, Tuple, Union +from typing import Any, Callable, Dict, Optional import tensorflow as tf -from tensorflow_similarity.algebra import build_masks -from tensorflow_similarity.distances import Distance, distance_canonicalizer -from tensorflow_similarity.types import FloatTensor, IntTensor -from tensorflow_similarity.utils import is_tensor_or_variable -from .metric_loss import MetricLoss -from .utils import logsumexp +from tensorflow_similarity.distances import Distance +from tensorflow_similarity.types import FloatTensor @tf.keras.utils.register_keras_serializable(package="Similarity") @@ -74,7 +70,9 @@ def __init__( self.margin = margin self.scale = scale self.name = name - self.kernel = tf.Variable(tf.random.normal([embedding_size, num_classes])) + self.kernel = tf.Variable( + tf.random.normal([embedding_size, num_classes]), trainable=True + ) def call(self, y_true: FloatTensor, y_pred: FloatTensor) -> FloatTensor: From f7de1d827de96d9af6dac860e52283b696b6725a Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Aylin=20Ayd=C4=B1n?= Date: Thu, 6 Oct 2022 21:25:32 +0300 Subject: [PATCH 15/25] Add files via upload --- tensorflow_similarity/losses/__init__.py | 11 +++++------ tensorflow_similarity/losses/arcface_loss.py | 1 - 2 files changed, 5 insertions(+), 7 deletions(-) diff --git a/tensorflow_similarity/losses/__init__.py b/tensorflow_similarity/losses/__init__.py index 8829e09f..0fdb573d 100644 --- a/tensorflow_similarity/losses/__init__.py +++ b/tensorflow_similarity/losses/__init__.py @@ -15,14 +15,13 @@ """ Contrastive learning specialized losses. 
""" -from .pn_loss import PNLoss # noqa -from .triplet_loss import TripletLoss # noqa -from .metric_loss import MetricLoss # noqa +from .arcface_loss import ArcFaceLoss # noqa from .circle_loss import CircleLoss # noqa +from .metric_loss import MetricLoss # noqa from .multisim_loss import MultiSimilarityLoss # noqa -from .simsiam import SimSiamLoss # noqa +from .pn_loss import PNLoss # noqa from .simclr import SimCLRLoss # noqa +from .simsiam import SimSiamLoss # noqa +from .triplet_loss import TripletLoss # noqa from .vicreg import VicReg # noqa -from .arcface_loss import ArcFaceLoss # noqa from .xbm_loss import XBM # noqa - diff --git a/tensorflow_similarity/losses/arcface_loss.py b/tensorflow_similarity/losses/arcface_loss.py index 9ac55c60..bf4c4842 100644 --- a/tensorflow_similarity/losses/arcface_loss.py +++ b/tensorflow_similarity/losses/arcface_loss.py @@ -21,7 +21,6 @@ from typing import Any, Callable, Dict, Optional import tensorflow as tf - from tensorflow_similarity.distances import Distance from tensorflow_similarity.types import FloatTensor From 455dc3566b8e3d4cad371d18ea76b5b98e63a8ee Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Aylin=20Ayd=C4=B1n?= Date: Thu, 6 Oct 2022 21:25:55 +0300 Subject: [PATCH 16/25] Add files via upload --- tests/test_losses.py | 10 +++++++--- 1 file changed, 7 insertions(+), 3 deletions(-) diff --git a/tests/test_losses.py b/tests/test_losses.py index 3a96a32f..ff149c94 100644 --- a/tests/test_losses.py +++ b/tests/test_losses.py @@ -1,9 +1,13 @@ import numpy as np import tensorflow as tf +from tensorflow_similarity.losses import ( + ArcFaceLoss, + MultiSimilarityLoss, + PNLoss, + SoftNearestNeighborLoss, + TripletLoss, +) -from tensorflow_similarity.losses import (ArcFaceLoss, MultiSimilarityLoss, - PNLoss, SoftNearestNeighborLoss, - TripletLoss) # [triplet loss] from tensorflow_similarity.losses.xbm_loss import XBM From d67630c61afdc7925ce080e72467336a0d566cd7 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Aylin=20Ayd=C4=B1n?= 
Date: Fri, 7 Oct 2022 10:12:52 +0300 Subject: [PATCH 17/25] Add files via upload From d8c99f5f19bb83719a5fa1fcc074993947e78269 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Aylin=20Ayd=C4=B1n?= Date: Fri, 7 Oct 2022 10:13:10 +0300 Subject: [PATCH 18/25] Add files via upload --- tensorflow_similarity/__init__.py | 37 ++++++++++++------------------- 1 file changed, 14 insertions(+), 23 deletions(-) diff --git a/tensorflow_similarity/__init__.py b/tensorflow_similarity/__init__.py index 00573fe4..7ccee62d 100644 --- a/tensorflow_similarity/__init__.py +++ b/tensorflow_similarity/__init__.py @@ -11,27 +11,18 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. -__version__ = "0.17.0.dev10" - -from . import algebra # noqa -from . import architectures # noqa -from . import augmenters # noqa -from . import callbacks # noqa -from . import classification_metrics # noqa -from . import distances # noqa -from . import evaluators # noqa -from . import indexer # noqa -from . import layers # noqa -from . import losses # noqa -from . import matchers # noqa -from . import models # noqa -from . import retrieval_metrics # noqa -from . import samplers # noqa -from . import schedules # noqa -from . import search # noqa -from . import stores # noqa -from . import training_metrics # noqa -from . import types # noqa -from . import utils # noqa -from . import visualization # noqa +""" +Contrastive learning specialized losses. 
+""" +from .arcface_loss import ArcFaceLoss # noqa +from .barlow import Barlow # noqa +from .circle_loss import CircleLoss # noqa +from .metric_loss import MetricLoss # noqa +from .multisim_loss import MultiSimilarityLoss # noqa +from .pn_loss import PNLoss # noqa +from .simclr import SimCLRLoss # noqa +from .simsiam import SimSiamLoss # noqa +from .softnn_loss import SoftNearestNeighborLoss # noqa +from .triplet_loss import TripletLoss # noqa +from .vicreg import VicReg # noqa From 1980579912566bd0efbd2ba980b26f58cbd1fcf7 Mon Sep 17 00:00:00 2001 From: Owen Vallis Date: Fri, 7 Oct 2022 09:35:50 -0700 Subject: [PATCH 19/25] Delete ArcFace Loss Sample Notebook.ipynb --- ArcFace Loss Sample Notebook.ipynb | 775 ----------------------------- 1 file changed, 775 deletions(-) delete mode 100644 ArcFace Loss Sample Notebook.ipynb diff --git a/ArcFace Loss Sample Notebook.ipynb b/ArcFace Loss Sample Notebook.ipynb deleted file mode 100644 index b481492e..00000000 --- a/ArcFace Loss Sample Notebook.ipynb +++ /dev/null @@ -1,775 +0,0 @@ -{ - "cells": [ - { - "cell_type": "markdown", - "id": "28956aa1", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "Copyright 2022 The TensorFlow Similarity Authors." 
- ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "24eda1a6", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "# @title Licensed under the Apache License, Version 2.0 (the \"License\");\n", - "# you may not use this file except in compliance with the License.\n", - "# You may obtain a copy of the License at\n", - "#\n", - "# https://www.apache.org/licenses/LICENSE-2.0\n", - "#\n", - "# Unless required by applicable law or agreed to in writing, software\n", - "# distributed under the License is distributed on an \"AS IS\" BASIS,\n", - "# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.\n", - "# See the License for the specific language governing permissions and\n", - "# limitations under the License." - ] - }, - { - "cell_type": "markdown", - "id": "7ca9d025", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "# TensorFlow Similarity ArcFace Loss Example" - ] - }, - { - "cell_type": "markdown", - "id": "d072628f", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "A Total Angular Margin Loss (ArcFace) calculates the geodetic distance in the hypersphere instead of the euclidean distance to improve the discriminatory strength of the facial recognition model and stabilize the training process. Rails are used to measure all distances in geodetic space. The geodetic trace is the path taken between two places. It specifies the geodetic distance, which is the shortest distance between two places.\n", - "\n", - "ArcFace loss determines the angle between the current feature and the target weight using the arc-cosine function since the dot product between the DCNN feature and the last fully connected layer after feature and weight normalization matches the cosine distance. The target logit is then returned by multiplying the goal angle by an additional angular margin and using the cosine function. 
After that, we continue as before and rescale all logits to a certain feature norm, just like with softmax loss." - ] - }, - { - "cell_type": "markdown", - "id": "808ac087", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Notebook goal\n", - "\n", - "This notebook demonstrates how to use ArcFaceLoss implementation of TensorFlow Similarity with standalone usage and to train a `SimilarityModel()` on a fraction of the MNIST classes.\n", - "\n", - "You are going to learn about the main features offered by the `ArcFaceLoss()` and will:\n", - "\n", - " 1. Standalone usage of ArcFaceLoss\n", - "\n", - " 2. Usage with `model.compile()`\n", - "\n", - " 3. 3D-Visualization of ArcFaceLoss \n", - "\n", - "### Things to try \n", - "\n", - "Along the way you can try the following things to improve the model performance:\n", - "- Adding more \"seen\" classes at training time.\n", - "- Use a larger embedding by increasing the size of the output.\n", - "- Add data augmentation pre-processing layers to the model.\n", - "- Include more examples in the index to give the models more points to choose from.\n", - "- Try a more challenging dataset, such as Fashion MNIST." - ] - }, - { - "cell_type": "markdown", - "id": "078c53c0", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Notebook goal\n", - "\n", - "This notebook demonstrates how to use ArcFaceLoss implementation of TensorFlow Similarity with standalone usage and to train a `SimilarityModel()` on a fraction of the MNIST classes.\n", - "\n", - "You are going to learn about the main features offered by the `ArcFaceLoss()` and will:\n", - "\n", - " 1. Standalone usage of ArcFaceLoss\n", - "\n", - " 2. Usage with `model.compile()`\n", - "\n", - " 3. 
3D-Visualization of ArcFaceLoss \n", - "\n", - "### Things to try \n", - "\n", - "Along the way you can try the following things to improve the model performance:\n", - "- Adding more \"seen\" classes at training time.\n", - "- Use a larger embedding by increasing the size of the output.\n", - "- Add data augmentation pre-processing layers to the model.\n", - "- Include more examples in the index to give the models more points to choose from.\n", - "- Try a more challenging dataset, such as Fashion MNIST." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "8fd63f16", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "import gc\n", - "import os\n", - "\n", - "import numpy as np\n", - "from matplotlib import pyplot as plt\n", - "from tabulate import tabulate\n", - "from mpl_toolkits.mplot3d import Axes3D\n", - "\n", - "# INFO messages are not printed.\n", - "# This must be run before loading other modules.\n", - "os.environ[\"TF_CPP_MIN_LOG_LEVEL\"] = \"1\"" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "80af5fc0", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "import tensorflow as tf" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "8ba8caf7", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "# install TF similarity if needed\n", - "try:\n", - " import tensorflow_similarity as tfsim # main package\n", - "except ModuleNotFoundError:\n", - " !pip install tensorflow_similarity\n", - " import tensorflow_similarity as tfsim" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "2484bd72", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "tfsim.utils.tf_cap_memory()" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "3fe0344e", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": 
[], - "source": [ - "# Clear out any old model state.\n", - "gc.collect()\n", - "tf.keras.backend.clear_session()" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "99d9bef9", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "print(\"TensorFlow:\", tf.__version__)\n", - "print(\"TensorFlow Similarity\", tfsim.__version__)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "7137afbc", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [] - }, - { - "cell_type": "markdown", - "id": "1d534ad3", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "# Standalone Usage of ArcFaceLoss\n", - "\n", - "ArcFace loss alone can be used as follows when it is desired to calculate the additive angular margin loss of the existing data set." - ] - }, - { - "cell_type": "markdown", - "id": "68d526da", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Initialize Loss function as ArcFaceLoss" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "bebf6ef0", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "loss_fn = tfsim.losses.ArcFaceLoss(num_classes=8, embedding_size=10)" - ] - }, - { - "cell_type": "markdown", - "id": "d2ccfd7d", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Create own simple random dataset" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "1d1ec43a", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "labels = tf.Variable([0, 1, 2, 3, 4, 5, 6, 7])\n", - "embeddings = tf.Variable(tf.random.uniform(shape=[8, 10]))" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "73d0c1c6", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "print(\"\", embeddings)" - ] - }, - { - "cell_type": 
"markdown", - "id": "d65b3085", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Calculate loss" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "cdf7c30c", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "loss = loss_fn(labels, embeddings)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "16745b7d", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "print(\"loss : \" , loss)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "outputs": [], - "source": [ - "loss = loss_fn(labels, embeddings)" - ], - "metadata": { - "collapsed": false, - "pycharm": { - "name": "#%%\n" - } - } - }, - { - "cell_type": "code", - "execution_count": null, - "outputs": [], - "source": [ - "print(\"loss : \" , loss)" - ], - "metadata": { - "collapsed": false, - "pycharm": { - "name": "#%%\n" - } - } - }, - { - "cell_type": "markdown", - "source": [ - "## Data preparation\n", - "\n", - "We are going to load the MNIST dataset to showcase how the model is able to find similar examples from classes unseen during training. The model's ability to generalize the matching to unseen classes, without retraining, is one of the main reason you would want to use metric learning.\n", - "\n", - "\n", - "**WARNING**: Tensorflow similarity expects `y_train` to be an IntTensor containing the class ids for each example instead of the standard categorical encoding traditionally used for multi-class classification." 
- ], - "metadata": { - "collapsed": false, - "pycharm": { - "name": "#%% md\n" - } - } - }, - { - "cell_type": "code", - "execution_count": null, - "id": "8a9f8122", - "metadata": {}, - "outputs": [], - "source": [ - "print(\"loss : \" , loss)" - ] - }, - { - "cell_type": "markdown", - "id": "11ef5236", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "## Data preparation\n", - "\n", - "We are going to load the MNIST dataset to showcase how the model is able to find similar examples from classes unseen during training. The model's ability to generalize the matching to unseen classes, without retraining, is one of the main reason you would want to use metric learning.\n", - "\n", - "\n", - "**WARNING**: Tensorflow similarity expects `y_train` to be an IntTensor containing the class ids for each example instead of the standard categorical encoding traditionally used for multi-class classification." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "97152229", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "(x_train, y_train), (x_test, y_test) = tf.keras.datasets.mnist.load_data()" - ] - }, - { - "cell_type": "markdown", - "id": "08b766d8", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "## Model setup" - ] - }, - { - "cell_type": "markdown", - "id": "3eac2da7", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Model definition\n", - "\n", - "`SimilarityModel()` models extend `tensorflow.keras.model.Model` with additional features and functionality that allow you to index and search for similar looking examples.\n", - "\n", - "As visible in the model definition below, similarity models output a 64 dimensional float embedding using the `MetricEmbedding()` layers. This layer is a Dense layer with L2 normalization. 
Thanks to the loss, the model learns to minimize the distance between similar examples and maximize the distance between dissimilar examples. As a result, the distance between examples in the embedding space is meaningful; the smaller the distance the more similar the examples are. \n", - "\n", - "Being able to use a distance as a meaningful proxy for how similar two examples are, is what enables the fast ANN (aproximate nearest neighbor) search. Using a sub-linear ANN search instead of a standard quadratic NN search is what allows deep similarity search to scale to millions of items. The built in memory index used in this notebook scales to a million indexed examples very easily... if you have enough RAM :)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "a003c971", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "def get_model():\n", - " inputs = tf.keras.layers.Input(shape=(28, 28, 1))\n", - " x = tf.keras.layers.experimental.preprocessing.Rescaling(1 / 255)(inputs)\n", - " x = tf.keras.layers.Conv2D(32, 3, activation=\"relu\")(x)\n", - " x = tf.keras.layers.Conv2D(32, 3, activation=\"relu\")(x)\n", - " x = tf.keras.layers.MaxPool2D()(x)\n", - " x = tf.keras.layers.Conv2D(64, 3, activation=\"relu\")(x)\n", - " x = tf.keras.layers.Conv2D(64, 3, activation=\"relu\")(x)\n", - " x = tf.keras.layers.Flatten()(x)\n", - " # smaller embeddings will have faster lookup times while a larger embedding will improve the accuracy up to a point.\n", - " outputs = tfsim.layers.MetricEmbedding(64)(x)\n", - " return tfsim.models.SimilarityModel(inputs, outputs)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "a2177b12", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "model = get_model()\n", - "model.summary()" - ] - }, - { - "cell_type": "markdown", - "id": "defb3961", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - 
"### ArcFace Loss definition\n", - "\n", - "Overall what makes Metric losses different from tradional losses is that:\n", - "- **They expect different inputs.** Instead of having the prediction equal the true values, they expect embeddings as `y_preds` and the id (as an int32) of the class as `y_true`. \n", - "- **They require a distance.** You need to specify which `distance` function to use to compute the distance between embeddings. `cosine` is usually a great starting point and the default.\n", - "\n", - "ArcFace Loss takes inputs as number of classes which labels includes, and embedding size which we define in model `MetricEmbedding()` layers." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "13b0d745", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "distance = \"cosine\" " - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "c22d10cc", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "num_classes = np.unique(y_train).size\n", - "embedding_size = model.get_layer('metric_embedding').output.shape[1]" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "d5b8e426", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "loss = tfsim.losses.ArcFaceLoss(num_classes= num_classes, embedding_size=embedding_size, name=\"ArcFaceLoss\")" - ] - }, - { - "cell_type": "markdown", - "id": "b6eaf9c8", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Compilation\n", - "\n", - "Tensorflow similarity use an extended `compile()` method that allows you to optionally specify `distance_metrics` (metrics that are computed over the distance between the embeddings), and the distance to use for the indexer.\n", - "\n", - "By default the `compile()` method tries to infer what type of distance you are using by looking at the first loss specified. 
If you use multiple losses, and the distance loss is not the first one, then you need to specify the distance function used as `distance=` parameter in the compile function." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "673f986f", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "LR = 0.0005 # @param {type:\"number\"}\n", - "model.compile(optimizer=tf.keras.optimizers.SGD(LR), loss=loss, distance=distance)" - ] - }, - { - "cell_type": "markdown", - "id": "15961601", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "## Training\n", - "\n", - "Similarity models are trained like normal models. " - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "147a6863", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "EPOCHS = 10 # @param {type:\"integer\"}\n", - "history = model.fit(x_train, y_train, epochs=EPOCHS, validation_data=(x_test, y_test))" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "88e1ee4d", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "plt.plot(history.history[\"loss\"])\n", - "plt.plot(history.history[\"val_loss\"])\n", - "plt.legend([\"loss\", \"val_loss\"])\n", - "plt.title(f\"Loss: {loss.name}\")\n", - "plt.show()" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "a5404906", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [] - }, - { - "cell_type": "markdown", - "id": "5ad4ba20", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "## Prediction\n", - "\n", - "Let's predict some features and visualiza them." 
- ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "a1936264", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "embedded_features = model.predict(x_test, verbose=1)\n", - "embedded_features /= np.linalg.norm(embedded_features, axis=1, keepdims=True)" - ] - }, - { - "cell_type": "markdown", - "id": "7c0df63b", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### 3D-Visualization of ArcFace Loss" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "5aac5d98", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "fig = plt.figure()\n", - "ax = Axes3D(fig)\n", - "for c in range(len(np.unique(y_test))):\n", - " ax.plot(embedded_features[y_test==c, 0], embedded_features[y_test==c, 1], embedded_features[y_test==c, 2], '.', alpha=0.1)\n", - "plt.title('ArcFace')\n", - "plt.show()" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "8889f840", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "fef529d9", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3 (ipykernel)", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.9.12" - } - }, - "nbformat": 4, - "nbformat_minor": 5 -} \ No newline at end of file From 347a7e9f9acfe39a7770d10c644fa679c164a1ee Mon Sep 17 00:00:00 2001 From: Owen Vallis Date: Fri, 7 Oct 2022 09:37:34 -0700 Subject: [PATCH 20/25] Update __init__.py --- tensorflow_similarity/__init__.py | 38 +++++++++++++++++++------------ 1 file changed, 
24 insertions(+), 14 deletions(-) diff --git a/tensorflow_similarity/__init__.py b/tensorflow_similarity/__init__.py index 7ccee62d..15eaae2d 100644 --- a/tensorflow_similarity/__init__.py +++ b/tensorflow_similarity/__init__.py @@ -12,17 +12,27 @@ # See the License for the specific language governing permissions and # limitations under the License. -""" -Contrastive learning specialized losses. -""" -from .arcface_loss import ArcFaceLoss # noqa -from .barlow import Barlow # noqa -from .circle_loss import CircleLoss # noqa -from .metric_loss import MetricLoss # noqa -from .multisim_loss import MultiSimilarityLoss # noqa -from .pn_loss import PNLoss # noqa -from .simclr import SimCLRLoss # noqa -from .simsiam import SimSiamLoss # noqa -from .softnn_loss import SoftNearestNeighborLoss # noqa -from .triplet_loss import TripletLoss # noqa -from .vicreg import VicReg # noqa +__version__ = "0.17.0.dev10" + + +from . import algebra # noqa +from . import architectures # noqa +from . import augmenters # noqa +from . import callbacks # noqa +from . import classification_metrics # noqa +from . import distances # noqa +from . import evaluators # noqa +from . import indexer # noqa +from . import layers # noqa +from . import losses # noqa +from . import matchers # noqa +from . import models # noqa +from . import retrieval_metrics # noqa +from . import samplers # noqa +from . import schedules # noqa +from . import search # noqa +from . import stores # noqa +from . import training_metrics # noqa +from . import types # noqa +from . import utils # noqa +from . 
import visualization # noqa From 140c837c1970ce4c7ea4212c7bf9c52e106e4ddb Mon Sep 17 00:00:00 2001 From: Owen Vallis Date: Fri, 7 Oct 2022 09:37:54 -0700 Subject: [PATCH 21/25] Update __init__.py --- tensorflow_similarity/__init__.py | 1 - 1 file changed, 1 deletion(-) diff --git a/tensorflow_similarity/__init__.py b/tensorflow_similarity/__init__.py index 15eaae2d..00573fe4 100644 --- a/tensorflow_similarity/__init__.py +++ b/tensorflow_similarity/__init__.py @@ -11,7 +11,6 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. - __version__ = "0.17.0.dev10" From 5a80c3260422a76c745bd074e2cdf9a43442cc52 Mon Sep 17 00:00:00 2001 From: Owen Vallis Date: Fri, 7 Oct 2022 09:38:34 -0700 Subject: [PATCH 22/25] Update __init__.py --- tensorflow_similarity/losses/__init__.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/tensorflow_similarity/losses/__init__.py b/tensorflow_similarity/losses/__init__.py index 0fdb573d..1a3d82ff 100644 --- a/tensorflow_similarity/losses/__init__.py +++ b/tensorflow_similarity/losses/__init__.py @@ -16,12 +16,14 @@ Contrastive learning specialized losses. """ from .arcface_loss import ArcFaceLoss # noqa +from .barlow import Barlow # noqa from .circle_loss import CircleLoss # noqa from .metric_loss import MetricLoss # noqa from .multisim_loss import MultiSimilarityLoss # noqa from .pn_loss import PNLoss # noqa from .simclr import SimCLRLoss # noqa from .simsiam import SimSiamLoss # noqa +from .softnn_loss import SoftNearestNeighborLoss # noqa from .triplet_loss import TripletLoss # noqa from .vicreg import VicReg # noqa from .xbm_loss import XBM # noqa From ffc325ce8ef70a193eb6599d46f6eba933e5da5d Mon Sep 17 00:00:00 2001 From: Owen Vallis Date: Wed, 12 Oct 2022 05:13:38 +0000 Subject: [PATCH 23/25] Fix formatting errors. 
--- tensorflow_similarity/losses/arcface_loss.py | 212 +++++++++---------- tests/test_losses.py | 5 +- 2 files changed, 106 insertions(+), 111 deletions(-) diff --git a/tensorflow_similarity/losses/arcface_loss.py b/tensorflow_similarity/losses/arcface_loss.py index bf4c4842..2362bba3 100644 --- a/tensorflow_similarity/losses/arcface_loss.py +++ b/tensorflow_similarity/losses/arcface_loss.py @@ -1,112 +1,108 @@ -# Copyright 2022 The TensorFlow Authors. All Rights Reserved. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -# See the License for the specific language governing permissions and -# limitations under the License. -# ============================================================================== +# Copyright 2022 The TensorFlow Authors. All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== """ArcFace losses base class. ArcFace: Additive Angular Margin Loss for Deep Face Recognition. [online] arXiv.org. Available at: . 
-""" - -from typing import Any, Callable, Dict, Optional - -import tensorflow as tf -from tensorflow_similarity.distances import Distance -from tensorflow_similarity.types import FloatTensor - - -@tf.keras.utils.register_keras_serializable(package="Similarity") -class ArcFaceLoss(tf.keras.losses.Loss): - """Implement of ArcFace: Additive Angular Margin Loss: - Step 1: Create a trainable kernel matrix with the shape of [embedding_size, num_classes]. - Step 2: Normalize the kernel and prediction vectors. - Step 3: Calculate the cosine similarity between the normalized prediction vector and the kernel. - Step 4: Create a one-hot vector include the margin value for the ground truth class. - Step 5: Add margin_hot to the cosine similarity and multiply it by scale. - Step 6: Calculate the cross-entropy loss. - ArcFace: Additive Angular Margin Loss for Deep Face - Recognition. [online] arXiv.org. Available at: - . - Standalone usage: - >>> loss_fn = tfsim.losses.ArcFaceLoss(num_classes=2, embedding_size=3) - >>> labels = tf.Variable([1, 0]) - >>> embeddings = tf.Variable([[0.2, 0.3, 0.1], [0.4, 0.5, 0.5]]) - >>> loss = loss_fn(labels, embeddings) - Args: - num_classes: Number of classes. - embedding_size: The size of the embedding vectors. - margin: The margin value. - scale: s in the paper, feature scale - name: Optional name for the operation. - reduction: Type of loss reduction to apply to the loss. 
- """ - - def __init__( - self, - num_classes: int, - embedding_size: int, - margin: float = 0.50, # margin in radians - scale: float = 64.0, # feature scale - name: Optional[str] = None, - reduction: Callable = tf.keras.losses.Reduction.AUTO, - **kwargs - ): - - super().__init__(reduction=reduction, name=name, **kwargs) - - self.num_classes = num_classes - self.embedding_size = embedding_size - self.margin = margin - self.scale = scale - self.name = name - self.kernel = tf.Variable( - tf.random.normal([embedding_size, num_classes]), trainable=True - ) - - def call(self, y_true: FloatTensor, y_pred: FloatTensor) -> FloatTensor: - - y_pred_norm = tf.math.l2_normalize(y_pred, axis=1) - kernel_norm = tf.math.l2_normalize(self.kernel, axis=0) - - cos_theta = tf.matmul(y_pred_norm, kernel_norm) - cos_theta = tf.clip_by_value(cos_theta, -1.0, 1.0) - - m_hot = tf.one_hot(y_true, self.num_classes, on_value=self.margin, axis=1) - m_hot = tf.reshape(m_hot, [-1, self.num_classes]) - - cos_theta = tf.acos(cos_theta) - cos_theta += m_hot - cos_theta = tf.math.cos(cos_theta) - cos_theta = tf.math.multiply(cos_theta, self.scale) - - cce = tf.keras.losses.SparseCategoricalCrossentropy( - from_logits=True, reduction=self.reduction - ) - loss: FloatTensor = cce(y_true, cos_theta) - - return loss - - def get_config(self) -> Dict[str, Any]: - """Contains the loss configuration. - Returns: - The configuration of the ArcFace loss. 
- """ - config = { - "num_classes": self.num_classes, - "embedding_size": self.embedding_size, - "margin": self.margin, - "scale": self.scale, - "name": self.name, - } - base_config = super().get_config() - return {**base_config, **config} +""" + +from typing import Any, Callable, Dict, Optional + +import tensorflow as tf + +from tensorflow_similarity.types import FloatTensor + + +@tf.keras.utils.register_keras_serializable(package="Similarity") +class ArcFaceLoss(tf.keras.losses.Loss): + """Implement of ArcFace: Additive Angular Margin Loss: + Step 1: Create a trainable kernel matrix with the shape of [embedding_size, num_classes]. + Step 2: Normalize the kernel and prediction vectors. + Step 3: Calculate the cosine similarity between the normalized prediction vector and the kernel. + Step 4: Create a one-hot vector include the margin value for the ground truth class. + Step 5: Add margin_hot to the cosine similarity and multiply it by scale. + Step 6: Calculate the cross-entropy loss. + ArcFace: Additive Angular Margin Loss for Deep Face + Recognition. [online] arXiv.org. Available at: + . + Standalone usage: + >>> loss_fn = tfsim.losses.ArcFaceLoss(num_classes=2, embedding_size=3) + >>> labels = tf.Variable([1, 0]) + >>> embeddings = tf.Variable([[0.2, 0.3, 0.1], [0.4, 0.5, 0.5]]) + >>> loss = loss_fn(labels, embeddings) + Args: + num_classes: Number of classes. + embedding_size: The size of the embedding vectors. + margin: The margin value. + scale: s in the paper, feature scale + name: Optional name for the operation. + reduction: Type of loss reduction to apply to the loss. 
+ """ + + def __init__( + self, + num_classes: int, + embedding_size: int, + margin: float = 0.50, # margin in radians + scale: float = 64.0, # feature scale + name: Optional[str] = None, + reduction: Callable = tf.keras.losses.Reduction.AUTO, + **kwargs + ): + + super().__init__(reduction=reduction, name=name, **kwargs) + + self.num_classes = num_classes + self.embedding_size = embedding_size + self.margin = margin + self.scale = scale + self.name = name + self.kernel = tf.Variable(tf.random.normal([embedding_size, num_classes]), trainable=True) + + def call(self, y_true: FloatTensor, y_pred: FloatTensor) -> FloatTensor: + + y_pred_norm = tf.math.l2_normalize(y_pred, axis=1) + kernel_norm = tf.math.l2_normalize(self.kernel, axis=0) + + cos_theta = tf.matmul(y_pred_norm, kernel_norm) + cos_theta = tf.clip_by_value(cos_theta, -1.0, 1.0) + + m_hot = tf.one_hot(y_true, self.num_classes, on_value=self.margin, axis=1) + m_hot = tf.reshape(m_hot, [-1, self.num_classes]) + + cos_theta = tf.acos(cos_theta) + cos_theta += m_hot + cos_theta = tf.math.cos(cos_theta) + cos_theta = tf.math.multiply(cos_theta, self.scale) + + cce = tf.keras.losses.SparseCategoricalCrossentropy(from_logits=True, reduction=self.reduction) + loss: FloatTensor = cce(y_true, cos_theta) + + return loss + + def get_config(self) -> Dict[str, Any]: + """Contains the loss configuration. + Returns: + The configuration of the ArcFace loss. 
+ """ + config = { + "num_classes": self.num_classes, + "embedding_size": self.embedding_size, + "margin": self.margin, + "scale": self.scale, + "name": self.name, + } + base_config = super().get_config() + return {**base_config, **config} diff --git a/tests/test_losses.py b/tests/test_losses.py index ff149c94..86b340b0 100644 --- a/tests/test_losses.py +++ b/tests/test_losses.py @@ -1,5 +1,6 @@ import numpy as np import tensorflow as tf + from tensorflow_similarity.losses import ( ArcFaceLoss, MultiSimilarityLoss, @@ -87,9 +88,7 @@ def test_triplet_loss_semi_hard(): y_true = tf.random.uniform((num_inputs,), 0, 3, dtype=tf.int32) # y_preds: embedding y_preds = tf.random.uniform((num_inputs, 16), 0, 1) - tpl = TripletLoss( - positive_mining_strategy="easy", negative_mining_strategy="semi-hard" - ) + tpl = TripletLoss(positive_mining_strategy="easy", negative_mining_strategy="semi-hard") # y_true, y_preds loss = tpl(y_true, y_preds) assert loss From b832f95fcb773b76a18332fef10324f06a7a48a0 Mon Sep 17 00:00:00 2001 From: Owen Vallis Date: Wed, 12 Oct 2022 05:28:33 +0000 Subject: [PATCH 24/25] Update Arcface notebook. Initial review of notebook. Removed empty cells and verified that everything WAI. --- examples/ArcFace Loss Sample Notebook.ipynb | 1608 ++++++++++--------- 1 file changed, 833 insertions(+), 775 deletions(-) diff --git a/examples/ArcFace Loss Sample Notebook.ipynb b/examples/ArcFace Loss Sample Notebook.ipynb index b481492e..9eb1c21d 100644 --- a/examples/ArcFace Loss Sample Notebook.ipynb +++ b/examples/ArcFace Loss Sample Notebook.ipynb @@ -1,775 +1,833 @@ -{ - "cells": [ - { - "cell_type": "markdown", - "id": "28956aa1", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "Copyright 2022 The TensorFlow Similarity Authors." 
- ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "24eda1a6", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "# @title Licensed under the Apache License, Version 2.0 (the \"License\");\n", - "# you may not use this file except in compliance with the License.\n", - "# You may obtain a copy of the License at\n", - "#\n", - "# https://www.apache.org/licenses/LICENSE-2.0\n", - "#\n", - "# Unless required by applicable law or agreed to in writing, software\n", - "# distributed under the License is distributed on an \"AS IS\" BASIS,\n", - "# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.\n", - "# See the License for the specific language governing permissions and\n", - "# limitations under the License." - ] - }, - { - "cell_type": "markdown", - "id": "7ca9d025", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "# TensorFlow Similarity ArcFace Loss Example" - ] - }, - { - "cell_type": "markdown", - "id": "d072628f", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "A Total Angular Margin Loss (ArcFace) calculates the geodetic distance in the hypersphere instead of the euclidean distance to improve the discriminatory strength of the facial recognition model and stabilize the training process. Rails are used to measure all distances in geodetic space. The geodetic trace is the path taken between two places. It specifies the geodetic distance, which is the shortest distance between two places.\n", - "\n", - "ArcFace loss determines the angle between the current feature and the target weight using the arc-cosine function since the dot product between the DCNN feature and the last fully connected layer after feature and weight normalization matches the cosine distance. The target logit is then returned by multiplying the goal angle by an additional angular margin and using the cosine function. 
After that, we continue as before and rescale all logits to a certain feature norm, just like with softmax loss." - ] - }, - { - "cell_type": "markdown", - "id": "808ac087", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Notebook goal\n", - "\n", - "This notebook demonstrates how to use ArcFaceLoss implementation of TensorFlow Similarity with standalone usage and to train a `SimilarityModel()` on a fraction of the MNIST classes.\n", - "\n", - "You are going to learn about the main features offered by the `ArcFaceLoss()` and will:\n", - "\n", - " 1. Standalone usage of ArcFaceLoss\n", - "\n", - " 2. Usage with `model.compile()`\n", - "\n", - " 3. 3D-Visualization of ArcFaceLoss \n", - "\n", - "### Things to try \n", - "\n", - "Along the way you can try the following things to improve the model performance:\n", - "- Adding more \"seen\" classes at training time.\n", - "- Use a larger embedding by increasing the size of the output.\n", - "- Add data augmentation pre-processing layers to the model.\n", - "- Include more examples in the index to give the models more points to choose from.\n", - "- Try a more challenging dataset, such as Fashion MNIST." - ] - }, - { - "cell_type": "markdown", - "id": "078c53c0", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Notebook goal\n", - "\n", - "This notebook demonstrates how to use ArcFaceLoss implementation of TensorFlow Similarity with standalone usage and to train a `SimilarityModel()` on a fraction of the MNIST classes.\n", - "\n", - "You are going to learn about the main features offered by the `ArcFaceLoss()` and will:\n", - "\n", - " 1. Standalone usage of ArcFaceLoss\n", - "\n", - " 2. Usage with `model.compile()`\n", - "\n", - " 3. 
3D-Visualization of ArcFaceLoss \n", - "\n", - "### Things to try \n", - "\n", - "Along the way you can try the following things to improve the model performance:\n", - "- Adding more \"seen\" classes at training time.\n", - "- Use a larger embedding by increasing the size of the output.\n", - "- Add data augmentation pre-processing layers to the model.\n", - "- Include more examples in the index to give the models more points to choose from.\n", - "- Try a more challenging dataset, such as Fashion MNIST." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "8fd63f16", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "import gc\n", - "import os\n", - "\n", - "import numpy as np\n", - "from matplotlib import pyplot as plt\n", - "from tabulate import tabulate\n", - "from mpl_toolkits.mplot3d import Axes3D\n", - "\n", - "# INFO messages are not printed.\n", - "# This must be run before loading other modules.\n", - "os.environ[\"TF_CPP_MIN_LOG_LEVEL\"] = \"1\"" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "80af5fc0", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "import tensorflow as tf" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "8ba8caf7", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "# install TF similarity if needed\n", - "try:\n", - " import tensorflow_similarity as tfsim # main package\n", - "except ModuleNotFoundError:\n", - " !pip install tensorflow_similarity\n", - " import tensorflow_similarity as tfsim" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "2484bd72", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "tfsim.utils.tf_cap_memory()" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "3fe0344e", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": 
[], - "source": [ - "# Clear out any old model state.\n", - "gc.collect()\n", - "tf.keras.backend.clear_session()" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "99d9bef9", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "print(\"TensorFlow:\", tf.__version__)\n", - "print(\"TensorFlow Similarity\", tfsim.__version__)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "7137afbc", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [] - }, - { - "cell_type": "markdown", - "id": "1d534ad3", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "# Standalone Usage of ArcFaceLoss\n", - "\n", - "ArcFace loss alone can be used as follows when it is desired to calculate the additive angular margin loss of the existing data set." - ] - }, - { - "cell_type": "markdown", - "id": "68d526da", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Initialize Loss function as ArcFaceLoss" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "bebf6ef0", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "loss_fn = tfsim.losses.ArcFaceLoss(num_classes=8, embedding_size=10)" - ] - }, - { - "cell_type": "markdown", - "id": "d2ccfd7d", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Create own simple random dataset" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "1d1ec43a", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "labels = tf.Variable([0, 1, 2, 3, 4, 5, 6, 7])\n", - "embeddings = tf.Variable(tf.random.uniform(shape=[8, 10]))" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "73d0c1c6", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "print(\"\", embeddings)" - ] - }, - { - "cell_type": 
"markdown", - "id": "d65b3085", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Calculate loss" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "cdf7c30c", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "loss = loss_fn(labels, embeddings)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "16745b7d", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "print(\"loss : \" , loss)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "outputs": [], - "source": [ - "loss = loss_fn(labels, embeddings)" - ], - "metadata": { - "collapsed": false, - "pycharm": { - "name": "#%%\n" - } - } - }, - { - "cell_type": "code", - "execution_count": null, - "outputs": [], - "source": [ - "print(\"loss : \" , loss)" - ], - "metadata": { - "collapsed": false, - "pycharm": { - "name": "#%%\n" - } - } - }, - { - "cell_type": "markdown", - "source": [ - "## Data preparation\n", - "\n", - "We are going to load the MNIST dataset to showcase how the model is able to find similar examples from classes unseen during training. The model's ability to generalize the matching to unseen classes, without retraining, is one of the main reason you would want to use metric learning.\n", - "\n", - "\n", - "**WARNING**: Tensorflow similarity expects `y_train` to be an IntTensor containing the class ids for each example instead of the standard categorical encoding traditionally used for multi-class classification." 
- ], - "metadata": { - "collapsed": false, - "pycharm": { - "name": "#%% md\n" - } - } - }, - { - "cell_type": "code", - "execution_count": null, - "id": "8a9f8122", - "metadata": {}, - "outputs": [], - "source": [ - "print(\"loss : \" , loss)" - ] - }, - { - "cell_type": "markdown", - "id": "11ef5236", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "## Data preparation\n", - "\n", - "We are going to load the MNIST dataset to showcase how the model is able to find similar examples from classes unseen during training. The model's ability to generalize the matching to unseen classes, without retraining, is one of the main reason you would want to use metric learning.\n", - "\n", - "\n", - "**WARNING**: Tensorflow similarity expects `y_train` to be an IntTensor containing the class ids for each example instead of the standard categorical encoding traditionally used for multi-class classification." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "97152229", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "(x_train, y_train), (x_test, y_test) = tf.keras.datasets.mnist.load_data()" - ] - }, - { - "cell_type": "markdown", - "id": "08b766d8", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "## Model setup" - ] - }, - { - "cell_type": "markdown", - "id": "3eac2da7", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Model definition\n", - "\n", - "`SimilarityModel()` models extend `tensorflow.keras.model.Model` with additional features and functionality that allow you to index and search for similar looking examples.\n", - "\n", - "As visible in the model definition below, similarity models output a 64 dimensional float embedding using the `MetricEmbedding()` layers. This layer is a Dense layer with L2 normalization. 
Thanks to the loss, the model learns to minimize the distance between similar examples and maximize the distance between dissimilar examples. As a result, the distance between examples in the embedding space is meaningful; the smaller the distance the more similar the examples are. \n", - "\n", - "Being able to use a distance as a meaningful proxy for how similar two examples are, is what enables the fast ANN (aproximate nearest neighbor) search. Using a sub-linear ANN search instead of a standard quadratic NN search is what allows deep similarity search to scale to millions of items. The built in memory index used in this notebook scales to a million indexed examples very easily... if you have enough RAM :)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "a003c971", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "def get_model():\n", - " inputs = tf.keras.layers.Input(shape=(28, 28, 1))\n", - " x = tf.keras.layers.experimental.preprocessing.Rescaling(1 / 255)(inputs)\n", - " x = tf.keras.layers.Conv2D(32, 3, activation=\"relu\")(x)\n", - " x = tf.keras.layers.Conv2D(32, 3, activation=\"relu\")(x)\n", - " x = tf.keras.layers.MaxPool2D()(x)\n", - " x = tf.keras.layers.Conv2D(64, 3, activation=\"relu\")(x)\n", - " x = tf.keras.layers.Conv2D(64, 3, activation=\"relu\")(x)\n", - " x = tf.keras.layers.Flatten()(x)\n", - " # smaller embeddings will have faster lookup times while a larger embedding will improve the accuracy up to a point.\n", - " outputs = tfsim.layers.MetricEmbedding(64)(x)\n", - " return tfsim.models.SimilarityModel(inputs, outputs)" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "a2177b12", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "model = get_model()\n", - "model.summary()" - ] - }, - { - "cell_type": "markdown", - "id": "defb3961", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - 
"### ArcFace Loss definition\n", - "\n", - "Overall what makes Metric losses different from tradional losses is that:\n", - "- **They expect different inputs.** Instead of having the prediction equal the true values, they expect embeddings as `y_preds` and the id (as an int32) of the class as `y_true`. \n", - "- **They require a distance.** You need to specify which `distance` function to use to compute the distance between embeddings. `cosine` is usually a great starting point and the default.\n", - "\n", - "ArcFace Loss takes inputs as number of classes which labels includes, and embedding size which we define in model `MetricEmbedding()` layers." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "13b0d745", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "distance = \"cosine\" " - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "c22d10cc", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "num_classes = np.unique(y_train).size\n", - "embedding_size = model.get_layer('metric_embedding').output.shape[1]" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "d5b8e426", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "loss = tfsim.losses.ArcFaceLoss(num_classes= num_classes, embedding_size=embedding_size, name=\"ArcFaceLoss\")" - ] - }, - { - "cell_type": "markdown", - "id": "b6eaf9c8", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### Compilation\n", - "\n", - "Tensorflow similarity use an extended `compile()` method that allows you to optionally specify `distance_metrics` (metrics that are computed over the distance between the embeddings), and the distance to use for the indexer.\n", - "\n", - "By default the `compile()` method tries to infer what type of distance you are using by looking at the first loss specified. 
If you use multiple losses, and the distance loss is not the first one, then you need to specify the distance function used as `distance=` parameter in the compile function." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "673f986f", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "LR = 0.0005 # @param {type:\"number\"}\n", - "model.compile(optimizer=tf.keras.optimizers.SGD(LR), loss=loss, distance=distance)" - ] - }, - { - "cell_type": "markdown", - "id": "15961601", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "## Training\n", - "\n", - "Similarity models are trained like normal models. " - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "147a6863", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "EPOCHS = 10 # @param {type:\"integer\"}\n", - "history = model.fit(x_train, y_train, epochs=EPOCHS, validation_data=(x_test, y_test))" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "88e1ee4d", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "plt.plot(history.history[\"loss\"])\n", - "plt.plot(history.history[\"val_loss\"])\n", - "plt.legend([\"loss\", \"val_loss\"])\n", - "plt.title(f\"Loss: {loss.name}\")\n", - "plt.show()" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "a5404906", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [] - }, - { - "cell_type": "markdown", - "id": "5ad4ba20", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "## Prediction\n", - "\n", - "Let's predict some features and visualiza them." 
- ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "a1936264", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "embedded_features = model.predict(x_test, verbose=1)\n", - "embedded_features /= np.linalg.norm(embedded_features, axis=1, keepdims=True)" - ] - }, - { - "cell_type": "markdown", - "id": "7c0df63b", - "metadata": { - "pycharm": { - "name": "#%% md\n" - } - }, - "source": [ - "### 3D-Visualization of ArcFace Loss" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "5aac5d98", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [ - "fig = plt.figure()\n", - "ax = Axes3D(fig)\n", - "for c in range(len(np.unique(y_test))):\n", - " ax.plot(embedded_features[y_test==c, 0], embedded_features[y_test==c, 1], embedded_features[y_test==c, 2], '.', alpha=0.1)\n", - "plt.title('ArcFace')\n", - "plt.show()" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "8889f840", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "fef529d9", - "metadata": { - "pycharm": { - "name": "#%%\n" - } - }, - "outputs": [], - "source": [] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3 (ipykernel)", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.9.12" - } - }, - "nbformat": 4, - "nbformat_minor": 5 -} \ No newline at end of file +{ + "cells": [ + { + "cell_type": "markdown", + "id": "28956aa1", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "Copyright 2022 The TensorFlow Similarity Authors." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "24eda1a6", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "# @title Licensed under the Apache License, Version 2.0 (the \"License\");\n", + "# you may not use this file except in compliance with the License.\n", + "# You may obtain a copy of the License at\n", + "#\n", + "# https://www.apache.org/licenses/LICENSE-2.0\n", + "#\n", + "# Unless required by applicable law or agreed to in writing, software\n", + "# distributed under the License is distributed on an \"AS IS\" BASIS,\n", + "# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.\n", + "# See the License for the specific language governing permissions and\n", + "# limitations under the License." + ] + }, + { + "cell_type": "markdown", + "id": "7ca9d025", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "# TensorFlow Similarity ArcFace Loss Example" + ] + }, + { + "cell_type": "markdown", + "id": "d072628f", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "A Total Angular Margin Loss (ArcFace) calculates the geodetic distance in the hypersphere instead of the euclidean distance to improve the discriminatory strength of the facial recognition model and stabilize the training process. Rails are used to measure all distances in geodetic space. The geodetic trace is the path taken between two places. It specifies the geodetic distance, which is the shortest distance between two places.\n", + "\n", + "ArcFace loss determines the angle between the current feature and the target weight using the arc-cosine function since the dot product between the DCNN feature and the last fully connected layer after feature and weight normalization matches the cosine distance. The target logit is then returned by multiplying the goal angle by an additional angular margin and using the cosine function. 
After that, we continue as before and rescale all logits to a certain feature norm, just like with softmax loss." + ] + }, + { + "cell_type": "markdown", + "id": "808ac087", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Notebook goal\n", + "\n", + "This notebook demonstrates how to use ArcFaceLoss implementation of TensorFlow Similarity with standalone usage and to train a `SimilarityModel()` on a fraction of the MNIST classes.\n", + "\n", + "You are going to learn about the main features offered by the `ArcFaceLoss()` and will:\n", + "\n", + " 1. Standalone usage of ArcFaceLoss\n", + "\n", + " 2. Usage with `model.compile()`\n", + "\n", + " 3. 3D-Visualization of ArcFaceLoss \n", + "\n", + "### Things to try \n", + "\n", + "Along the way you can try the following things to improve the model performance:\n", + "- Adding more \"seen\" classes at training time.\n", + "- Use a larger embedding by increasing the size of the output.\n", + "- Add data augmentation pre-processing layers to the model.\n", + "- Include more examples in the index to give the models more points to choose from.\n", + "- Try a more challenging dataset, such as Fashion MNIST." + ] + }, + { + "cell_type": "markdown", + "id": "078c53c0", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Notebook goal\n", + "\n", + "This notebook demonstrates how to use ArcFaceLoss implementation of TensorFlow Similarity with standalone usage and to train a `SimilarityModel()` on a fraction of the MNIST classes.\n", + "\n", + "You are going to learn about the main features offered by the `ArcFaceLoss()` and will:\n", + "\n", + " 1. Standalone usage of ArcFaceLoss\n", + "\n", + " 2. Usage with `model.compile()`\n", + "\n", + " 3. 
3D-Visualization of ArcFaceLoss \n", + "\n", + "### Things to try \n", + "\n", + "Along the way you can try the following things to improve the model performance:\n", + "- Adding more \"seen\" classes at training time.\n", + "- Use a larger embedding by increasing the size of the output.\n", + "- Add data augmentation pre-processing layers to the model.\n", + "- Include more examples in the index to give the models more points to choose from.\n", + "- Try a more challenging dataset, such as Fashion MNIST." + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "id": "8fd63f16", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "import gc\n", + "import os\n", + "\n", + "import numpy as np\n", + "from matplotlib import pyplot as plt\n", + "from tabulate import tabulate\n", + "from mpl_toolkits.mplot3d import Axes3D\n", + "\n", + "# INFO messages are not printed.\n", + "# This must be run before loading other modules.\n", + "os.environ[\"TF_CPP_MIN_LOG_LEVEL\"] = \"1\"" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "80af5fc0", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "import tensorflow as tf" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "8ba8caf7", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "Your CPU supports instructions that this binary was not compiled to use: SSE3 SSE4.1 SSE4.2 AVX AVX2\n", + "For maximum performance, you can install NMSLIB from sources \n", + "pip install --no-binary :all: nmslib\n" + ] + } + ], + "source": [ + "# install TF similarity if needed\n", + "try:\n", + " import tensorflow_similarity as tfsim # main package\n", + "except ModuleNotFoundError:\n", + " !pip install tensorflow_similarity\n", + " import tensorflow_similarity as tfsim" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": 
"2484bd72", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "tfsim.utils.tf_cap_memory()" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "id": "3fe0344e", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "# Clear out any old model state.\n", + "gc.collect()\n", + "tf.keras.backend.clear_session()" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "id": "99d9bef9", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "TensorFlow: 2.8.0\n", + "TensorFlow Similarity 0.17.0.dev10\n" + ] + } + ], + "source": [ + "print(\"TensorFlow:\", tf.__version__)\n", + "print(\"TensorFlow Similarity\", tfsim.__version__)" + ] + }, + { + "cell_type": "markdown", + "id": "1d534ad3", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "# Standalone Usage of ArcFaceLoss\n", + "\n", + "ArcFace loss alone can be used as follows when it is desired to calculate the additive angular margin loss of the existing data set." 
+ ] + }, + { + "cell_type": "markdown", + "id": "68d526da", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Initialize Loss function as ArcFaceLoss" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "id": "bebf6ef0", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "loss_fn = tfsim.losses.ArcFaceLoss(num_classes=8, embedding_size=10)" + ] + }, + { + "cell_type": "markdown", + "id": "d2ccfd7d", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Create own simple random dataset" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "id": "1d1ec43a", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "labels = tf.Variable([0, 1, 2, 3, 4, 5, 6, 7])\n", + "embeddings = tf.Variable(tf.random.uniform(shape=[8, 10]))" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "id": "73d0c1c6", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + " \n" + ] + } + ], + "source": [ + "print(\"\", embeddings)" + ] + }, + { + "cell_type": "markdown", + "id": "d65b3085", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Calculate loss" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "id": "cdf7c30c", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "loss = loss_fn(labels, embeddings)" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "id": "16745b7d", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "loss : tf.Tensor(48.764076, shape=(), dtype=float32)\n" + ] + } + ], + "source": [ + "print(\"loss : \" , loss)" + ] + }, + { + "cell_type": "markdown", + "id": "11ef5236", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": 
[ + "## Data preparation\n", + "\n", + "We are going to load the MNIST dataset to showcase how the model is able to find similar examples from classes unseen during training. The model's ability to generalize the matching to unseen classes, without retraining, is one of the main reasons you would want to use metric learning.\n", + "\n", + "\n", + "**WARNING**: TensorFlow Similarity expects `y_train` to be an IntTensor containing the class ids for each example instead of the standard categorical encoding traditionally used for multi-class classification." + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "id": "97152229", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "(x_train, y_train), (x_test, y_test) = tf.keras.datasets.mnist.load_data()" + ] + }, + { + "cell_type": "markdown", + "id": "08b766d8", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "## Model setup" + ] + }, + { + "cell_type": "markdown", + "id": "3eac2da7", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Model definition\n", + "\n", + "`SimilarityModel()` models extend `tensorflow.keras.models.Model` with additional features and functionality that allow you to index and search for similar looking examples.\n", + "\n", + "As visible in the model definition below, similarity models output a 64 dimensional float embedding using the `MetricEmbedding()` layers. This layer is a Dense layer with L2 normalization. Thanks to the loss, the model learns to minimize the distance between similar examples and maximize the distance between dissimilar examples. As a result, the distance between examples in the embedding space is meaningful; the smaller the distance the more similar the examples are. \n", + "\n", + "Being able to use a distance as a meaningful proxy for how similar two examples are, is what enables the fast ANN (approximate nearest neighbor) search. 
Using a sub-linear ANN search instead of a standard quadratic NN search is what allows deep similarity search to scale to millions of items. The built in memory index used in this notebook scales to a million indexed examples very easily... if you have enough RAM :)" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "id": "a003c971", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "def get_model():\n", + " inputs = tf.keras.layers.Input(shape=(28, 28, 1))\n", + " x = tf.keras.layers.experimental.preprocessing.Rescaling(1 / 255)(inputs)\n", + " x = tf.keras.layers.Conv2D(32, 3, activation=\"relu\")(x)\n", + " x = tf.keras.layers.Conv2D(32, 3, activation=\"relu\")(x)\n", + " x = tf.keras.layers.MaxPool2D()(x)\n", + " x = tf.keras.layers.Conv2D(64, 3, activation=\"relu\")(x)\n", + " x = tf.keras.layers.Conv2D(64, 3, activation=\"relu\")(x)\n", + " x = tf.keras.layers.Flatten()(x)\n", + " # smaller embeddings will have faster lookup times while a larger embedding will improve the accuracy up to a point.\n", + " outputs = tfsim.layers.MetricEmbedding(64)(x)\n", + " return tfsim.models.SimilarityModel(inputs, outputs)" + ] + }, + { + "cell_type": "code", + "execution_count": 17, + "id": "a2177b12", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Model: \"similarity_model\"\n", + "_________________________________________________________________\n", + " Layer (type) Output Shape Param # \n", + "=================================================================\n", + " input_1 (InputLayer) [(None, 28, 28, 1)] 0 \n", + " \n", + " rescaling (Rescaling) (None, 28, 28, 1) 0 \n", + " \n", + " conv2d (Conv2D) (None, 26, 26, 32) 320 \n", + " \n", + " conv2d_1 (Conv2D) (None, 24, 24, 32) 9248 \n", + " \n", + " max_pooling2d (MaxPooling2D (None, 12, 12, 32) 0 \n", + " ) \n", + " \n", + " conv2d_2 (Conv2D) (None, 10, 10, 64) 18496 \n", + " 
\n", + " conv2d_3 (Conv2D) (None, 8, 8, 64) 36928 \n", + " \n", + " flatten (Flatten) (None, 4096) 0 \n", + " \n", + " metric_embedding (MetricEmb (None, 64) 262208 \n", + " edding) \n", + " \n", + "=================================================================\n", + "Total params: 327,200\n", + "Trainable params: 327,200\n", + "Non-trainable params: 0\n", + "_________________________________________________________________\n" + ] + } + ], + "source": [ + "model = get_model()\n", + "model.summary()" + ] + }, + { + "cell_type": "markdown", + "id": "defb3961", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### ArcFace Loss definition\n", + "\n", + "Overall what makes Metric losses different from traditional losses is that:\n", + "- **They expect different inputs.** Instead of having the prediction equal the true values, they expect embeddings as `y_preds` and the id (as an int32) of the class as `y_true`. \n", + "- **They require a distance.** You need to specify which `distance` function to use to compute the distance between embeddings. `cosine` is usually a great starting point and the default.\n", + "\n", + "ArcFace Loss takes as inputs the number of classes present in the labels and the embedding size, which is defined by the model's `MetricEmbedding()` layer." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 18, + "id": "13b0d745", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "distance = \"cosine\" " + ] + }, + { + "cell_type": "code", + "execution_count": 19, + "id": "c22d10cc", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "num_classes = np.unique(y_train).size\n", + "embedding_size = model.get_layer('metric_embedding').output.shape[1]" + ] + }, + { + "cell_type": "code", + "execution_count": 20, + "id": "d5b8e426", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "loss = tfsim.losses.ArcFaceLoss(num_classes=num_classes, embedding_size=embedding_size, name=\"ArcFaceLoss\")" + ] + }, + { + "cell_type": "markdown", + "id": "b6eaf9c8", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### Compilation\n", + "\n", + "TensorFlow Similarity uses an extended `compile()` method that allows you to optionally specify `distance_metrics` (metrics that are computed over the distance between the embeddings), and the distance to use for the indexer.\n", + "\n", + "By default the `compile()` method tries to infer what type of distance you are using by looking at the first loss specified. If you use multiple losses, and the distance loss is not the first one, then you need to specify the distance function used as the `distance=` parameter in the compile function." + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "id": "673f986f", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [], + "source": [ + "LR = 0.0005 # @param {type:\"number\"}\n", + "model.compile(optimizer=tf.keras.optimizers.SGD(LR), loss=loss, distance=distance)" + ] + }, + { + "cell_type": "markdown", + "id": "15961601", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "## Training\n", + "\n", + "Similarity models are trained like normal models. 
" + ] + }, + { + "cell_type": "code", + "execution_count": 22, + "id": "147a6863", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Epoch 1/10\n", + "1875/1875 [==============================] - 11s 4ms/step - loss: 5.2161 - val_loss: 1.8907\n", + "Epoch 2/10\n", + "1875/1875 [==============================] - 7s 4ms/step - loss: 1.8353 - val_loss: 1.6826\n", + "Epoch 3/10\n", + "1875/1875 [==============================] - 7s 4ms/step - loss: 1.3566 - val_loss: 1.1404\n", + "Epoch 4/10\n", + "1875/1875 [==============================] - 7s 4ms/step - loss: 1.1160 - val_loss: 1.0936\n", + "Epoch 5/10\n", + "1875/1875 [==============================] - 7s 4ms/step - loss: 0.9555 - val_loss: 1.0854\n", + "Epoch 6/10\n", + "1875/1875 [==============================] - 7s 4ms/step - loss: 0.8343 - val_loss: 1.0062\n", + "Epoch 7/10\n", + "1875/1875 [==============================] - 7s 4ms/step - loss: 0.7546 - val_loss: 0.9062\n", + "Epoch 8/10\n", + "1875/1875 [==============================] - 7s 4ms/step - loss: 0.6776 - val_loss: 0.8000\n", + "Epoch 9/10\n", + "1875/1875 [==============================] - 7s 4ms/step - loss: 0.6194 - val_loss: 0.8160\n", + "Epoch 10/10\n", + "1875/1875 [==============================] - 7s 4ms/step - loss: 0.5676 - val_loss: 0.7515\n" + ] + } + ], + "source": [ + "EPOCHS = 10 # @param {type:\"integer\"}\n", + "history = model.fit(x_train, y_train, epochs=EPOCHS, validation_data=(x_test, y_test))" + ] + }, + { + "cell_type": "code", + "execution_count": 23, + "id": "88e1ee4d", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [ + { + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "plt.plot(history.history[\"loss\"])\n", + "plt.plot(history.history[\"val_loss\"])\n", + "plt.legend([\"loss\", \"val_loss\"])\n", + "plt.title(f\"Loss: {loss.name}\")\n", + "plt.show()" + ] + }, + { + "cell_type": "markdown", + "id": "5ad4ba20", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "## Prediction\n", + "\n", + "Let's predict some features and visualize them." + ] + }, + { + "cell_type": "code", + "execution_count": 28, + "id": "a1936264", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "313/313 [==============================] - 1s 2ms/step\n" + ] + } + ], + "source": [ + "embedded_features = model.predict(x_test, verbose=1)" + ] + }, + { + "cell_type": "markdown", + "id": "7c0df63b", + "metadata": { + "pycharm": { + "name": "#%% md\n" + } + }, + "source": [ + "### 3D-Visualization of ArcFace Loss" + ] + }, + { + "cell_type": "code", + "execution_count": 38, + "id": "5aac5d98", + "metadata": { + "pycharm": { + "name": "#%%\n" + } + }, + "outputs": [ + { + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "fig = plt.figure()\n", + "ax = Axes3D(fig, auto_add_to_figure=False)\n", + "fig.add_axes(ax)\n", + "for c in range(len(np.unique(y_test))):\n", + " ax.plot(\n", + " embedded_features[y_test==c, 0], \n", + " embedded_features[y_test==c, 1], \n", + " embedded_features[y_test==c, 2], \n", + " '.', \n", + " alpha=0.1,\n", + " )\n", + "plt.title('ArcFace')\n", + "plt.show()" + ] + } + ], + "metadata": { + "environment": { + "kernel": "python3", + "name": "tf2-gpu.2-8.m91", + "type": "gcloud", + "uri": "gcr.io/deeplearning-platform-release/tf2-gpu.2-8:m91" + }, + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.7.12" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} From 8093f1f7587e4557303c6cb2c57818e17c38eaa2 Mon Sep 17 00:00:00 2001 From: Owen Vallis Date: Wed, 12 Oct 2022 15:41:42 +0000 Subject: [PATCH 25/25] Fix formatting errors. --- benchmark/supervised/components/__init__.py | 4 ++-- benchmark/supervised/train.py | 2 +- tensorflow_similarity/retrieval_metrics/map_at_k.py | 2 +- 3 files changed, 4 insertions(+), 4 deletions(-) diff --git a/benchmark/supervised/components/__init__.py b/benchmark/supervised/components/__init__.py index 0eda9b56..e1093a0b 100644 --- a/benchmark/supervised/components/__init__.py +++ b/benchmark/supervised/components/__init__.py @@ -1,6 +1,6 @@ +from . import metrics # noqa +from . import utils # noqa from .architectures import make_architecture # noqa from .augmentations import make_augmentations # noqa from .losses import make_loss # noqa -from . import metrics # noqa from .optimizers import make_optimizer # noqa -from . 
import utils # noqa diff --git a/benchmark/supervised/train.py b/benchmark/supervised/train.py index 474506dc..5db82487 100644 --- a/benchmark/supervised/train.py +++ b/benchmark/supervised/train.py @@ -106,7 +106,7 @@ def run(config): version, dataset_name, architecture_name, - aconf['embedding'], + aconf["embedding"], loss_name, opt_name, fold, diff --git a/tensorflow_similarity/retrieval_metrics/map_at_k.py b/tensorflow_similarity/retrieval_metrics/map_at_k.py index 0fed2e2e..8c074365 100644 --- a/tensorflow_similarity/retrieval_metrics/map_at_k.py +++ b/tensorflow_similarity/retrieval_metrics/map_at_k.py @@ -157,7 +157,7 @@ def compute( avg_p_at_k = tf.map_fn( lambda x: tf.math.reduce_sum(x[0][: x[1][0]]) / tf.cast(x[1], dtype="float"), elems, - fn_output_signature="float" + fn_output_signature="float", ) else: avg_p_at_k = tf.math.divide(