Merge pull request #1 from THEGAMECHANGER416/THEGAMECHANGER416-patch-1

THEGAMECHANGER416 · web-flow · commit dc3129bd5ee8 · 2023-10-09T12:00:01.000+05:30
Create categorical_cross_entropy.py
diff --git a/machine_learning/loss_functions/categorical_cross_entropy.py b/machine_learning/loss_functions/categorical_cross_entropy.py
@@ -0,0 +1,55 @@
+"""
+Categorical Cross-Entropy Loss
+
+This function calculates the Categorical Cross-Entropy Loss between true class
+labels and predicted class probabilities.
+
+Formula:
+Categorical Cross-Entropy Loss = -Σ(y_true * log(y_pred))
+
+Resources:
+- [Wikipedia - Cross entropy](https://en.wikipedia.org/wiki/Cross_entropy)
+"""
+
+import numpy as np
+
+def categorical_crossentropy(
+    y_true: np.ndarray, y_pred: np.ndarray, epsilon: float = 1e-15
+) -> float:
+    """
+    Calculate Categorical Cross-Entropy Loss between true class labels and
+    predicted class probabilities.
+
+    Parameters:
+    - y_true: True class labels (one-hot encoded) as a NumPy array.
+    - y_pred: Predicted class probabilities as a NumPy array.
+    - epsilon: Small constant to avoid numerical instability.
+
+    Returns:
+    - ce_loss: Categorical Cross-Entropy Loss as a floating-point number.
+
+    Example:
+    >>> true_labels = np.array([[1, 0, 0], [0, 1, 0], [0, 0, 1]])
+    >>> pred_probs = np.array([[0.9, 0.1, 0.0], [0.2, 0.7, 0.1], [0.0, 0.1, 0.9]])
+    >>> categorical_crossentropy(true_labels, pred_probs)
+    0.18913199175146167
+
+    >>> y_true = np.array([[1, 0], [0, 1]])
+    >>> y_pred = np.array([[0.9, 0.1, 0.0], [0.2, 0.7, 0.1]])
+    >>> categorical_crossentropy(y_true, y_pred)
+    Traceback (most recent call last):
+        ...
+    ValueError: Input arrays must have the same length.
+    """
+    if y_true.shape != y_pred.shape:
+        raise ValueError("Input arrays must have the same length.")
+    
+    # Clip predicted probabilities to avoid log(0)
+    y_pred = np.clip(y_pred, epsilon, 1 - epsilon)
+
+    # Calculate categorical cross-entropy loss
+    return -np.sum(y_true * np.log(y_pred)) / len(y_true)
+
+if __name__ == "__main__":
+    import doctest
+    doctest.testmod()