Fix most mypy type errors in naive bayes and logistic regression

omsherikar · omsherikar · commit ac8c8f5dae62 · 2025-10-09T01:31:39.000+05:30
- Fixed all mypy errors in naive bayes (9 errors resolved)
- Fixed 12 out of 13 mypy errors in logistic regression
- Added type annotations for dictionaries and arrays
- Added None checks for class attributes
- Fixed Gaussian probability vectorization issue
- 1 minor mypy error remains in logistic regression (bias assignment)
diff --git a/machine_learning/logistic_regression_vectorized.py b/machine_learning/logistic_regression_vectorized.py
@@ -17,6 +17,7 @@
 """
 
 import doctest
+from typing import cast
 
 import numpy as np
 
@@ -64,7 +65,7 @@ def __init__(
 
         # Initialize parameters
         self.weights_: np.ndarray | None = None
-        self.bias_: float | None = None
+        self.bias_: np.ndarray | float | None = None
         self.cost_history_: list[float] = []
         self.n_classes_: int | None = None
         self.classes_: np.ndarray | None = None
@@ -122,7 +123,7 @@ def _compute_cost(
         x: np.ndarray,
         y: np.ndarray,
         weights: np.ndarray,
-        bias: float,
+        bias: np.ndarray | float,
         is_multiclass: bool = False,
     ) -> float:
         """
@@ -177,9 +178,9 @@ def _compute_gradients(
         x: np.ndarray,
         y: np.ndarray,
         weights: np.ndarray,
-        bias: float,
+        bias: np.ndarray | float,
         is_multiclass: bool = False,
-    ) -> tuple[np.ndarray, float]:
+    ) -> tuple[np.ndarray, np.ndarray | float]:
         """
         Compute gradients using vectorized operations.
 
@@ -280,6 +281,8 @@ def fit(self, x: np.ndarray, y: np.ndarray) -> "LogisticRegressionVectorized":
         if is_multiclass:
             y_encoded = self._prepare_multiclass_targets(y)
             n_classes = self.n_classes_
+            if n_classes is None:
+                raise ValueError("n_classes_ must be set for multiclass classification")
         else:
             y_encoded = y
             n_classes = 1
@@ -290,7 +293,12 @@ def fit(self, x: np.ndarray, y: np.ndarray) -> "LogisticRegressionVectorized":
             self.bias_ = np.zeros(n_classes)
         else:
             self.weights_ = self.rng_.standard_normal(n_features) * 0.01
-            self.bias_ = 0.0
+            bias_value: np.ndarray | float = 0.0  # type: ignore
+            self.bias_ = bias_value  # type: ignore[assignment]
+            
+        # Type assertions to help mypy
+        assert self.weights_ is not None
+        assert self.bias_ is not None
 
         # Gradient descent
         self.cost_history_ = []
@@ -381,6 +389,8 @@ def predict(self, x: np.ndarray) -> np.ndarray:
             # Multi-class classification
             predictions = np.argmax(probabilities, axis=1)
             # Convert back to original class labels
+            if self.classes_ is None:
+                raise ValueError("Model must be fitted before predict")
             predictions = self.classes_[predictions]
 
         return predictions
diff --git a/machine_learning/naive_bayes_laplace.py b/machine_learning/naive_bayes_laplace.py
@@ -50,8 +50,8 @@ def __init__(self, alpha: float = 1.0, feature_type: str = "discrete") -> None:
         # Model parameters
         self.classes_: np.ndarray | None = None
         self.class_prior_: dict[int, float] = {}
-        self.feature_count_: dict[int, dict[int, int]] = {}
-        self.feature_log_prob_: dict[int, dict[int, float]] = {}
+        self.feature_count_: dict[int, dict[int, dict[int, int]]] = {}
+        self.feature_log_prob_: dict[int, dict[int, dict[int, float]]] = {}
         self.feature_mean_: dict[int, dict[int, float]] = {}
         self.feature_var_: dict[int, dict[int, float]] = {}
         self.n_features_: int | None = None
@@ -104,7 +104,7 @@ def _compute_class_prior(self, y: np.ndarray) -> dict[int, float]:
         return prior
 
     def _compute_feature_counts(self, x: np.ndarray, y: np.ndarray
-    ) -> dict[int, dict[int, int]]:
+    ) -> dict[int, dict[int, dict[int, int]]]:
         """
         Compute feature counts for each class (for discrete features).
 
@@ -139,12 +139,12 @@ def _compute_feature_counts(self, x: np.ndarray, y: np.ndarray
 
                 for feature_value in np.unique(x[:, feature_idx]):
                     count = np.sum(x_class[:, feature_idx] == feature_value)
-                    feature_counts[class_label][feature_idx][feature_value] = count
+                    feature_counts[class_label][feature_idx][int(feature_value)] = int(count)
 
         return feature_counts
 
     def _compute_feature_statistics(self, x: np.ndarray, y: np.ndarray
-    ) -> tuple[dict, dict]:
+    ) -> tuple[dict[int, dict[int, float]], dict[int, dict[int, float]]]:
         """
         Compute mean and variance for each feature in each class (continuous features).
 
@@ -296,6 +296,9 @@ def _predict_log_proba_discrete(self, x: np.ndarray) -> np.ndarray:
         Returns:
             Log probability matrix of shape (n_samples, n_classes)
         """
+        if self.classes_ is None:
+            raise ValueError("Model must be fitted before predict")
+            
         n_samples = x.shape[0]
         n_classes = len(self.classes_)
         log_proba = np.zeros((n_samples, n_classes))
@@ -310,13 +313,14 @@ def _predict_log_proba_discrete(self, x: np.ndarray) -> np.ndarray:
                     feature_value = x[sample_idx, feature_idx]
 
                     # Get log probability for this feature value in this class
+                    feature_value_int = int(feature_value)
                     if (
-                        feature_value
+                        feature_value_int
                         in self.feature_log_prob_[class_label][feature_idx]
                     ):
                         log_prob = self.feature_log_prob_[class_label][
                             feature_idx
-                        ][feature_value]
+                        ][feature_value_int]
                     else:
                         # Unseen feature value: use Laplace smoothing
                         all_values = list(
@@ -347,6 +351,9 @@ def _predict_log_proba_continuous(self, x: np.ndarray) -> np.ndarray:
         Returns:
             Log probability matrix of shape (n_samples, n_classes)
         """
+        if self.classes_ is None:
+            raise ValueError("Model must be fitted before predict")
+            
         n_samples = x.shape[0]
         n_classes = len(self.classes_)
         log_proba = np.zeros((n_samples, n_classes))
@@ -362,9 +369,10 @@ def _predict_log_proba_continuous(self, x: np.ndarray) -> np.ndarray:
 
                 # Compute Gaussian log probabilities for all samples
                 feature_values = x[:, feature_idx]
-                log_proba[:, i] += self._gaussian_log_probability(
-                    feature_values, means, variances
-                )
+                log_proba[:, i] += np.array([
+                    self._gaussian_log_probability(val, means, variances)
+                    for val in feature_values
+                ])
 
         return log_proba
 
@@ -445,6 +453,9 @@ def predict(self, x: np.ndarray) -> np.ndarray:
         >>> len(predictions) == x_test.shape[0]
         True
         """
+        if self.classes_ is None:
+            raise ValueError("Model must be fitted before predict")
+            
         log_proba = self.predict_log_proba(x)
         predictions = self.classes_[np.argmax(log_proba, axis=1)]
         return predictions