Spaces:

Jensen-holm
/

Numpy-Neuron

Build error

App Files Files Community

Jensen Holm committed on Jul 26, 2024

Commit

d7ea050

1 Parent(s): ff1254a

loss functions now just have staticmethods

Browse files

Files changed (5) hide show

numpyneuron/__init__.py +6 -0
numpyneuron/activation.py +2 -2
numpyneuron/loss.py +17 -20
test/{test_activation.py → test_activation_fns.py} +0 -0
test/test_loss_fns.py +0 -0

numpyneuron/__init__.py CHANGED Viewed

@@ -8,3 +8,9 @@ ACTIVATIONS: dict[str, Activation] = {
     "TanH": TanH(),
     "SoftMax": SoftMax(),
 }

     "TanH": TanH(),
     "SoftMax": SoftMax(),
 }
+LOSSES: dict[str, Loss] = {
+    "MSE": MSE(),
+    "CrossEntropy": CrossEntropy(),
+    "CrossEntropyWithLogitsLoss": CrossEntropyWithLogits(),
+}

numpyneuron/activation.py CHANGED Viewed

@@ -4,11 +4,11 @@ from abc import abstractmethod, ABC
 class Activation(ABC):
     @abstractmethod
-    def forward(self, X: np.ndarray) -> np.ndarray:
         pass
     @abstractmethod
-    def backward(self, X: np.ndarray) -> np.ndarray:
         pass

 class Activation(ABC):
     @abstractmethod
+    def forward(X: np.ndarray) -> np.ndarray:
         pass
     @abstractmethod
+    def backward(X: np.ndarray) -> np.ndarray:
         pass

numpyneuron/loss.py CHANGED Viewed

@@ -4,12 +4,14 @@ import numpy as np
 class Loss(ABC):
     @abstractmethod
-    def forward(self, y_hat: np.ndarray, y_true: np.ndarray) -> np.ndarray:
         pass
     @abstractmethod
-    def backward(self, y_hat: np.ndarray, y_true: np.ndarray) -> np.ndarray:
         pass
@@ -18,19 +20,22 @@ class LogitsLoss(Loss):
 class MSE(Loss):
-    def forward(self, y_hat: np.ndarray, y_true: np.ndarray) -> np.ndarray:
         return np.sum(np.square(y_hat - y_true)) / y_true.shape[0]
-    def backward(self, y_hat: np.ndarray, y_true: np.ndarray) -> np.ndarray:
         return (y_hat - y_true) * (2 / y_true.shape[0])
 class CrossEntropy(Loss):
-    def forward(self, y_hat: np.ndarray, y_true: np.ndarray) -> np.ndarray:
         y_hat = np.asarray(y_hat)
         y_true = np.asarray(y_true)
         m = y_true.shape[0]
-        p = self._softmax(y_hat)
         eps = 1e-15  # to prevent log(0)
         log_likelihood = -np.log(
             np.clip(p[range(m), y_true.argmax(axis=1)], a_min=eps, a_max=None)
@@ -38,19 +43,17 @@ class CrossEntropy(Loss):
         loss = np.sum(log_likelihood) / m
         return loss
-    def backward(self, y_hat: np.ndarray, y_true: np.ndarray) -> np.ndarray:
         y_hat = np.asarray(y_hat)
         y_true = np.asarray(y_true)
         grad = y_hat - y_true
         return grad / y_true.shape[0]
-    @staticmethod
-    def _softmax(X: np.ndarray) -> np.ndarray:
-        return SoftMax().forward(X)
 class CrossEntropyWithLogits(LogitsLoss):
-    def forward(self, y_hat: np.ndarray, y_true: np.ndarray) -> np.ndarray:
         # Apply the log-sum-exp trick for numerical stability
         max_logits = np.max(y_hat, axis=1, keepdims=True)
         log_sum_exp = np.log(np.sum(np.exp(y_hat - max_logits), axis=1, keepdims=True))
@@ -59,17 +62,11 @@ class CrossEntropyWithLogits(LogitsLoss):
         loss = -np.sum(log_probs * y_true) / y_true.shape[0]
         return loss
-    def backward(self, y_hat: np.ndarray, y_true: np.ndarray) -> np.ndarray:
         # Compute softmax probabilities
         exps = np.exp(y_hat - np.max(y_hat, axis=1, keepdims=True))
         probs = exps / np.sum(exps, axis=1, keepdims=True)
         # Subtract the one-hot encoded labels from the probabilities
         grad = (probs - y_true) / y_true.shape[0]
         return grad
-LOSSES: dict[str, Loss] = {
-    "MSE": MSE(),
-    "CrossEntropy": CrossEntropy(),
-    "CrossEntropyWithLogitsLoss": CrossEntropyWithLogits(),
-}

 class Loss(ABC):
+    @staticmethod
     @abstractmethod
+    def forward(y_hat: np.ndarray, y_true: np.ndarray) -> np.ndarray:
         pass
+    @staticmethod
     @abstractmethod
+    def backward(y_hat: np.ndarray, y_true: np.ndarray) -> np.ndarray:
         pass
 class MSE(Loss):
+    @staticmethod
+    def forward(y_hat: np.ndarray, y_true: np.ndarray) -> np.ndarray:
         return np.sum(np.square(y_hat - y_true)) / y_true.shape[0]
+    @staticmethod
+    def backward(y_hat: np.ndarray, y_true: np.ndarray) -> np.ndarray:
         return (y_hat - y_true) * (2 / y_true.shape[0])
 class CrossEntropy(Loss):
+    @staticmethod
+    def forward(y_hat: np.ndarray, y_true: np.ndarray) -> np.ndarray:
         y_hat = np.asarray(y_hat)
         y_true = np.asarray(y_true)
         m = y_true.shape[0]
+        p = SoftMax().forward(y_hat)
         eps = 1e-15  # to prevent log(0)
         log_likelihood = -np.log(
             np.clip(p[range(m), y_true.argmax(axis=1)], a_min=eps, a_max=None)
         loss = np.sum(log_likelihood) / m
         return loss
+    @staticmethod
+    def backward(y_hat: np.ndarray, y_true: np.ndarray) -> np.ndarray:
         y_hat = np.asarray(y_hat)
         y_true = np.asarray(y_true)
         grad = y_hat - y_true
         return grad / y_true.shape[0]
 class CrossEntropyWithLogits(LogitsLoss):
+    @staticmethod
+    def forward(y_hat: np.ndarray, y_true: np.ndarray) -> np.ndarray:
         # Apply the log-sum-exp trick for numerical stability
         max_logits = np.max(y_hat, axis=1, keepdims=True)
         log_sum_exp = np.log(np.sum(np.exp(y_hat - max_logits), axis=1, keepdims=True))
         loss = -np.sum(log_probs * y_true) / y_true.shape[0]
         return loss
+    @staticmethod
+    def backward(y_hat: np.ndarray, y_true: np.ndarray) -> np.ndarray:
         # Compute softmax probabilities
         exps = np.exp(y_hat - np.max(y_hat, axis=1, keepdims=True))
         probs = exps / np.sum(exps, axis=1, keepdims=True)
         # Subtract the one-hot encoded labels from the probabilities
         grad = (probs - y_true) / y_true.shape[0]
         return grad

test/{test_activation.py → test_activation_fns.py} RENAMED Viewed

File without changes

test/test_loss_fns.py ADDED Viewed

File without changes