-
-
Notifications
You must be signed in to change notification settings - Fork 50.4k
Expand file tree
/
Copy pathlabel_smoothing.py
More file actions
178 lines (138 loc) · 5.71 KB
/
label_smoothing.py
File metadata and controls
178 lines (138 loc) · 5.71 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
"""
Label Smoothing is a regularization technique used during training of
classification models. Instead of using hard one-hot encoded targets
(e.g. [0, 0, 1, 0]), it softens the labels by distributing a small
amount of probability mass (epsilon) uniformly across all classes.
This prevents the model from becoming overconfident and improves
generalization, especially when training data is noisy or limited.
Formula:
smoothed_label = (1 - epsilon) * one_hot + epsilon / num_classes
Reference:
Szegedy et al., "Rethinking the Inception Architecture for Computer
Vision", https://arxiv.org/abs/1512.00567
Example usage:
>>> import numpy as np
>>> smoother = LabelSmoother(num_classes=4, epsilon=0.1)
>>> smoother.smooth(2)
array([0.025, 0.025, 0.925, 0.025])
"""
import numpy as np
class LabelSmoother:
    """
    Produce label-smoothed target distributions for classification.

    A smoothed target reserves ``1 - epsilon`` probability mass for the
    true class and spreads the remaining ``epsilon`` uniformly over all
    classes, which discourages overconfident predictions.

    Attributes:
        num_classes: Total number of classes.
        epsilon: Smoothing factor in the range [0.0, 1.0).
            0.0 means no smoothing (standard one-hot).

    >>> smoother = LabelSmoother(num_classes=3, epsilon=0.0)
    >>> smoother.smooth(1)
    array([0., 1., 0.])
    >>> smoother = LabelSmoother(num_classes=3, epsilon=0.3)
    >>> smoother.smooth(0)
    array([0.8, 0.1, 0.1])
    """

    def __init__(self, num_classes: int, epsilon: float = 0.1) -> None:
        """
        Validate and store the smoothing configuration.

        Args:
            num_classes: Number of target classes (must be >= 2).
            epsilon: Smoothing factor. Must satisfy 0.0 <= epsilon < 1.0.

        Raises:
            ValueError: If num_classes < 2 or epsilon is out of range.

        >>> LabelSmoother(num_classes=1, epsilon=0.1)
        Traceback (most recent call last):
            ...
        ValueError: num_classes must be at least 2.
        >>> LabelSmoother(num_classes=3, epsilon=1.0)
        Traceback (most recent call last):
            ...
        ValueError: epsilon must be in [0.0, 1.0).
        """
        if num_classes < 2:
            raise ValueError("num_classes must be at least 2.")
        if epsilon < 0.0 or epsilon >= 1.0:
            raise ValueError("epsilon must be in [0.0, 1.0).")
        self.num_classes = num_classes
        self.epsilon = epsilon

    def smooth(self, true_class: int) -> np.ndarray:
        """
        Return a smoothed label vector for the given true class index.

        Args:
            true_class: The index of the correct class (0-indexed).

        Returns:
            A numpy array of shape (num_classes,) with smoothed
            probabilities that sum to 1.0.

        Raises:
            ValueError: If true_class is out of range.

        >>> smoother = LabelSmoother(num_classes=4, epsilon=0.1)
        >>> smoother.smooth(2)
        array([0.025, 0.025, 0.925, 0.025])
        >>> smoother.smooth(0)
        array([0.925, 0.025, 0.025, 0.025])
        >>> float(round(smoother.smooth(1).sum(), 10))
        1.0
        >>> smoother.smooth(5)
        Traceback (most recent call last):
            ...
        ValueError: true_class index 5 is out of range for 4 classes.
        """
        if true_class < 0 or true_class >= self.num_classes:
            raise ValueError(
                f"true_class index {true_class} is out of range "
                f"for {self.num_classes} classes."
            )
        # Interpolate between the hard one-hot vector and the uniform
        # distribution: (1 - eps) * one_hot + eps / num_classes.
        one_hot = np.zeros(self.num_classes)
        one_hot[true_class] = 1.0
        return (1.0 - self.epsilon) * one_hot + self.epsilon / self.num_classes

    def smooth_batch(self, true_classes: list[int]) -> np.ndarray:
        """
        Return smoothed label vectors for a batch of true class indices.

        Args:
            true_classes: List of true class indices.

        Returns:
            A numpy array of shape (batch_size, num_classes).

        >>> smoother = LabelSmoother(num_classes=3, epsilon=0.3)
        >>> smoother.smooth_batch([0, 2])
        array([[0.8, 0.1, 0.1],
               [0.1, 0.1, 0.8]])
        """
        rows = [self.smooth(index) for index in true_classes]
        return np.array(rows)
def cross_entropy_loss(
    smoothed_labels: np.ndarray, predicted_probs: np.ndarray
) -> float:
    """
    Compute cross-entropy loss between smoothed labels and predicted
    probability distribution.

    Args:
        smoothed_labels: Target distribution, shape (num_classes,).
        predicted_probs: Predicted probabilities, shape (num_classes,).
            Values must be in (0, 1] and sum to 1.

    Returns:
        Scalar cross-entropy loss value.

    >>> import numpy as np
    >>> labels = np.array([0.025, 0.025, 0.925, 0.025])
    >>> preds = np.array([0.01, 0.01, 0.97, 0.01])
    >>> round(cross_entropy_loss(labels, preds), 4)
    0.3736
    """
    # Floor the probabilities at a tiny positive value so log() never
    # receives zero.
    safe_probs = np.clip(predicted_probs, 1e-12, 1.0)
    log_probs = np.log(safe_probs)
    return float(-(smoothed_labels * log_probs).sum())
if __name__ == "__main__":
    import doctest

    # Run all embedded doctests before the demo output.
    doctest.testmod(verbose=True)

    print("\n--- Label Smoothing Demo ---")
    soft = LabelSmoother(num_classes=5, epsilon=0.1)
    no_smoothing = LabelSmoother(num_classes=5, epsilon=0.0)

    print("\nHard one-hot (no smoothing, epsilon=0.0):")
    print(f" Class 2 -> {no_smoothing.smooth(2)}")

    print("\nSmoothed labels (epsilon=0.1):")
    print(f" Class 2 -> {soft.smooth(2)}")

    print("\nBatch smoothing for classes [0, 2, 4]:")
    print(soft.smooth_batch([0, 2, 4]))

    print("\nCross-entropy loss with smoothed target vs confident prediction:")
    target = soft.smooth(2)
    prediction = np.array([0.01, 0.01, 0.96, 0.01, 0.01])
    print(f" Loss = {cross_entropy_loss(target, prediction):.4f}")