utils.py

# Copyright 2021 DeepMind Technologies Limited. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
import jax
from jax import numpy as jnp


def reduce_fn(x, mode):
    """Reduce fn for various losses."""
    if mode == 'none' or mode is None:
        return jnp.asarray(x)
    elif mode == 'sum':
        return jnp.sum(x)
    elif mode == 'mean':
        return jnp.mean(x)
    else:
        raise ValueError('Unsupported reduction option.')


def softmax_cross_entropy(logits, labels, reduction='sum'):
    """Computes softmax cross entropy given logits and one-hot class labels.
  Args:
    logits: Logit output values.
    labels: Ground truth one-hot-encoded labels.
    reduction: Type of reduction to apply to loss.
  Returns:
    Loss value. If `reduction` is `none`, this has the same shape as `labels`;
    otherwise, it is scalar.
  Raises:
    ValueError: If the type of `reduction` is unsupported.
  """
    loss = -jnp.sum(labels * jax.nn.log_softmax(logits), axis=-1)
    return reduce_fn(loss, reduction)


def topk_correct(logits, labels, mask=None, prefix='', topk=(1, 5)):
    """Calculate top-k error for multiple k values."""
    metrics = {}
    argsorted_logits = jnp.argsort(logits)
    for k in topk:
        pred_labels = argsorted_logits[..., -k:]
        # Get the number of examples where the label is in the top-k predictions
        correct = any_in(pred_labels, labels).any(axis=-1).astype(jnp.float32)
        if mask is not None:
            correct *= mask
        metrics[f'{prefix}top_{k}_acc'] = correct
    return metrics


@jax.vmap
def any_in(prediction, target):
    """For each row in a and b, checks if any element of a is in b."""
    return jnp.isin(prediction, target)


def to_bf16(x):
    if x.dtype == jnp.float32:
        return x.astype(jnp.bfloat16)
    return x


def from_bf16(x):
    if x.dtype == jnp.bfloat16:
        return x.astype(jnp.float32)
    return x