Source code for mightypy.ml._linear

"""
Linear Models of Machine Learning
"""

from typing import Union, Tuple
import numpy as np
from mightypy.ml._error_fxs import calculate_mse_cost, calculate_entropy_cost
from mightypy.ml._utils import sigmoid

__author__ = "Nishant Baheti"
__copyright__ = "Nishant Baheti"
__license__ = "MIT"



[docs]
class LinearRegression:
    """Linear Regression Model Class

    Args:
        alpha (float, optional): learning rate. Defaults to 0.01.
        iterations (int, optional): number of iteratons. Defaults to 10000.

    References:
        https://machinelearningexploration.readthedocs.io/en/latest/LinearRegression/Explore.html
    """

    def __init__(self, alpha: float = 0.01, iterations: int = 10000):
        """Constructor"""
        self.alpha = alpha
        self.iterations = iterations
        self._theta = None
        self._X = None
        self._y = None
        self._theta_history = None
        self._cost_history = None
        self._n = None
        self._m = None

    def _format_x_for_theta_0(self, x_i: np.ndarray) -> np.ndarray:
        """format X matrix for linear model

        put 1's in the first column as feature for theta_0

        Args:
            x_i (np.ndarray): input x matrix

        Returns:
            np.ndarray: formatted x matrix
        """
        x_i = x_i.copy()
        if len(x_i.shape) == 1:
            x_i = x_i.reshape(-1, 1)

        if False in (x_i[..., 0] == 1):
            return np.hstack(tup=(np.ones(shape=(x_i.shape[0], 1)), x_i))
        else:
            return x_i

    @property
    def X(self) -> Union[np.ndarray, None]:
        """property X

        Returns:
            Union[np.ndarray, None]: X matrix
        """
        return self._X

    @property
    def y(self) -> Union[np.ndarray, None]:
        """property y

        Returns:
            Union[np.ndarray, None]: y matrix
        """
        return self._y

    @property
    def theta(self) -> Union[np.ndarray, None]:
        """property theta

        Returns:
            Union[np.ndarray, None]: theta matrix
        """
        return self._theta

    @property
    def theta_history(self) -> Union[list, None]:
        """theta training history

        Returns:
            Union[list, None]: theta history list
        """
        return self._theta_history

    @property
    def cost_history(self) -> Union[list, None]:
        """cost learning history

        Returns:
            Union[list, None]: cost history list
        """
        return self._cost_history


[docs]
    def predict(self, X: np.ndarray) -> np.ndarray:
        """generate prediction

        Args:
            X (np.ndarray): input feature matrix

        Raises:
            ValueError: if shape is not proper for the input feature
            Warning: if model is not trained yet

        Returns:
            np.ndarray: predicted values
        """

        if self._theta is not None:
            format_x = self._format_x_for_theta_0(X)
            if format_x.shape[1] == self._theta.shape[0]:
                y_pred = format_x @ self._theta  # (m,1) = (m,n) * (n,1)
                return y_pred
            elif format_x.shape[1] == self._theta.shape[1]:
                y_pred = format_x @ self._theta.T  # (m,1) = (m,n) * (n,1)
                return y_pred
            else:
                raise ValueError("Shape is not proper.")
        else:
            raise Warning("Model is not trained yet. Theta is None.")



[docs]
    def train(
        self,
        X: np.ndarray,
        y: np.ndarray,
        verbose: bool = True,
        method: str = "SGD",
        theta_precision: float = 0.001,
        batch_size: int = 30,
    ) -> None:
        """train model /theta estimator

        Args:
            X (np.ndarray): X matrix/feature matrix.
            y (np.ndarray): y matrix/target matrix.
            verbose (bool, optional): print things. Defaults to True.
            method (str, optional): training method. Defaults to "SGD".

                    Available-
                        "BGD"(Batch Graident Descent),
                        "SGD"(Stochastic Gradient Descent),
                        "NORMAL"(Normal Equation)

            theta_precision (float, optional): theta initialization value precision. Defaults to 0.001.
            batch_size (int, optional): batch size only for BGD. Defaults to 30.
        """

        self._X = self._format_x_for_theta_0(X)
        self._y = y

        # number of features+1 because of theta_0
        self._n = self._X.shape[1]
        self._m = self._y.shape[0]

        self._theta_history = []
        self._cost_history = []

        if method == "BGD":
            self._theta = np.random.rand(1, self._n) * theta_precision
            if verbose:
                print("random initial θ value :", self._theta)

            for iteration in range(self.iterations):
                # calculate y_pred
                y_pred = self.predict(self._X)

                # new θ to replace old θ
                new_theta = None

                # simultaneous operation
                gradient = np.mean((y_pred - self._y) * self._X, axis=0)  # type: ignore
                new_theta = self._theta - (self.alpha * gradient)

                if np.isnan(np.sum(new_theta)) or np.isinf(np.sum(new_theta)):
                    print("breaking. found inf or nan.")
                    break
                # override with new θ
                self._theta = new_theta

                # calculate cost to put in history
                cost = calculate_mse_cost(y_pred=self.predict(X=self._X), y=self._y)
                self._cost_history.append(cost)

                # calcualted theta in history
                self._theta_history.append(self._theta[0])

        elif method == "SGD":  # stochastic gradient descent
            self._theta = np.random.rand(1, self._n) * theta_precision
            if verbose:
                print("random initial θ value :", self._theta)

            for iteration in range(self.iterations):

                # creating indices for batches
                indices = np.random.randint(0, self._m, size=batch_size)

                # creating batch for this iteration
                # X_batch = np.take(self._X, indices, axis=0)
                # y_batch = np.take(self._y, indices, axis=0)
                X_batch = self._X[indices, :]
                y_batch = self._y[indices, :]

                # calculate y_pred
                y_pred = self.predict(X_batch)
                # new θ to replace old θ
                new_theta = None

                # simultaneous operation
                gradient = np.mean((y_pred - y_batch) * X_batch, axis=0)  # type: ignore
                new_theta = self._theta - (self.alpha * gradient)

                if np.isnan(np.sum(new_theta)) or np.isinf(np.sum(new_theta)):
                    print("breaking. found inf or nan.")
                    break
                # override with new θ
                self._theta = new_theta

                # calculate cost to put in history
                cost = calculate_mse_cost(y_pred=self.predict(X=X_batch), y=y_batch)
                self._cost_history.append(cost)

                # calcualted theta in history
                self._theta_history.append(self._theta[0])

        elif method == "NORMAL":
            self._theta = np.linalg.inv(self._X.T @ self._X) @ self._X.T @ self._y

        else:
            print("No Method Defined.")





[docs]
class RidgeRegression:
    """Ridge Regression Model Class (L2 Regularization)

    Args:
        alpha (float, optional): learning rate. Defaults to 0.01.
        iterations (int, optional): number of iteratons. Defaults to 10000.

    References:
        https://machinelearningexploration.readthedocs.io/en/latest/LinearRegression/Explore.html#Ridge(L2-Regularization)-Regression
    """

    def __init__(self, alpha: float = 0.01, iterations: int = 10000):
        """Constructor"""
        self.alpha = alpha
        self.iterations = iterations
        self._theta = None
        self._X = None
        self._y = None
        self._theta_history = None
        self._cost_history = None
        self._n = None
        self._m = None

    def _format_x_for_theta_0(self, x_i: np.ndarray) -> np.ndarray:
        """format X matrix for linear model

        put 1's in the first column as feature for theta_0

        Args:
            x_i (np.ndarray): input x matrix

        Returns:
            np.ndarray: formatted x matrix
        """
        x_i = x_i.copy()
        if len(x_i.shape) == 1:
            x_i = x_i.reshape(-1, 1)

        if False in (x_i[..., 0] == 1):
            return np.hstack(tup=(np.ones(shape=(x_i.shape[0], 1)), x_i))
        else:
            return x_i

    @property
    def X(self) -> Union[np.ndarray, None]:
        """property X

        Returns:
            Union[np.ndarray, None]: X matrix
        """
        return self._X

    @property
    def y(self) -> Union[np.ndarray, None]:
        """property y

        Returns:
            Union[np.ndarray, None]: y matrix
        """
        return self._y

    @property
    def theta(self) -> Union[np.ndarray, None]:
        """property theta

        Returns:
            Union[np.ndarray, None]: theta matrix
        """
        return self._theta

    @property
    def theta_history(self) -> Union[list, None]:
        """theta training history

        Returns:
            Union[list, None]: theta history list
        """
        return self._theta_history

    @property
    def cost_history(self) -> Union[list, None]:
        """cost learning history

        Returns:
            Union[list, None]: cost history list
        """
        return self._cost_history


[docs]
    def predict(self, X: np.ndarray) -> np.ndarray:
        """generate prediction

        Args:
            X (np.ndarray): input feature matrix

        Raises:
            ValueError: if shape is not proper for the input feature
            Warning: if model is not trained yet

        Returns:
            np.ndarray: predicted values
        """

        if self._theta is not None:
            format_x = self._format_x_for_theta_0(X)
            if format_x.shape[1] == self._theta.shape[0]:
                y_pred = format_x @ self._theta  # (m,1) = (m,n) * (n,1)
                return y_pred
            elif format_x.shape[1] == self._theta.shape[1]:
                y_pred = format_x @ self._theta.T  # (m,1) = (m,n) * (n,1)
                return y_pred
            else:
                raise ValueError("Shape is not proper.")
        else:
            raise Warning("Model is not trained yet. Theta is None.")



[docs]
    def train(
        self,
        X: np.ndarray,
        y: np.ndarray,
        verbose: bool = True,
        method: str = "SGD",
        theta_precision: float = 0.001,
        penalty: Union[float, int] = 1.0,
        batch_size: int = 30,
    ) -> None:
        """train model /theta estimator

        Args:
            X (np.ndarray): X matrix/feature matrix.
            y (np.ndarray): y matrix/target matrix.
            verbose (bool, optional): print things. Defaults to True.
            method (str, optional): training method. Defaults to "SGD".

                    Available-
                        "BGD"(Batch Graident Descent),
                        "SGD"(Stochastic Gradient Descent),
                        "NORMAL"(Normal Equation)

            theta_precision (float, optional): theta initialization value precision. Defaults to 0.001.
            penalty (Union[float, int], optional): regularization penalty. Defaults to 1.0.
            batch_size (int, optional): batch size only for BGD. Defaults to 30.
        """

        self._X = self._format_x_for_theta_0(X)
        self._y = y

        # number of features+1 because of theta_0
        self._n = self._X.shape[1]
        self._m = self._y.shape[0]

        self._theta_history = []
        self._cost_history = []

        if method == "BGD":
            self._theta = np.random.rand(1, self._n) * theta_precision
            if verbose:
                print("random initial θ value :", self._theta)

            for iteration in range(self.iterations):
                # calculate y_pred
                y_pred = self.predict(self._X)
                # new θ to replace old θ
                new_theta = None

                # simultaneous operation
                ######################################################

                gradient = np.mean((y_pred - self._y) * self._X, axis=0)  # type: ignore

                # theta_0 will not be effected by penalty
                new_theta_0 = self._theta[:, [0]] - (self.alpha * gradient[0])  # type: ignore
                # rest of theta's will be effected by it
                new_theta_rest = self._theta[:, range(1, self._n)] * (1 - (penalty / self._m)) - (self.alpha * gradient[1:])  # type: ignore

                new_theta = np.hstack((new_theta_0, new_theta_rest))

                if np.isnan(np.sum(new_theta)) or np.isinf(np.sum(new_theta)):
                    print("breaking. found inf or nan.")
                    break
                # override with new θ
                self._theta = new_theta

                # calculate cost to put in history
                cost = calculate_mse_cost(y_pred=self.predict(X=self._X), y=self._y)
                self._cost_history.append(cost)

                # calcualted theta in history
                self._theta_history.append(self._theta[0])
        elif method == "SGD":
            self._theta = np.random.rand(1, self._n) * theta_precision
            if verbose:
                print("random initial θ value :", self._theta)

            for iteration in range(self.iterations):

                indices = np.random.randint(0, self._m, size=batch_size)

                # X_batch = np.take(self._X, indices, axis=0)
                # y_batch = np.take(self._y, indices, axis=0)

                X_batch = self._X[indices, :]
                y_batch = self._y[indices, :]

                # calculate y_pred
                y_pred = self.predict(X_batch)
                # new θ to replace old θ
                new_theta = None

                # simultaneous operation
                gradient = np.mean((y_pred - y_batch) * X_batch, axis=0)  # type: ignore
                new_theta_0 = self._theta[:, [0]] - (self.alpha * gradient[0])  # type: ignore
                new_theta_rest = self._theta[:, range(1, self._n)] * (1 - (penalty / self._m)) - (self.alpha * gradient[1:])  # type: ignore

                new_theta = np.hstack((new_theta_0, new_theta_rest))

                if np.isnan(np.sum(new_theta)) or np.isinf(np.sum(new_theta)):
                    print("breaking. found inf or nan.")
                    break
                # override with new θ
                self._theta = new_theta

                # calculate cost to put in history
                cost = calculate_mse_cost(y_pred=self.predict(X=X_batch), y=y_batch)
                self._cost_history.append(cost)

                # calcualted theta in history
                self._theta_history.append(self._theta[0])

        elif method == "NORMAL":
            self._theta = (
                np.linalg.inv(self._X.T @ self._X + (penalty * np.identity(self._n)))

[docs]
                @ self._X.T
                @ self._y
            )

        else:
            print("No Method Defined.")




class LassoRegression:
    """Lasso Regression Model Class (L1 Regularization)

    Args:
        alpha (float, optional): learning rate. Defaults to 0.01.
        iterations (int, optional): number of iteratons. Defaults to 10000.

    References:
        https://machinelearningexploration.readthedocs.io/en/latest/LinearRegression/Explore.html#Lasso(L1-Regularization)-Regression
    """

    def __init__(self, alpha: float = 0.01, iterations: int = 10000):
        """Constructor"""
        self.alpha = alpha
        self.iterations = iterations
        self._theta = None
        self._X = None
        self._y = None
        self._theta_history = None
        self._cost_history = None
        self._n = None
        self._m = None

    def _format_x_for_theta_0(self, x_i: np.ndarray) -> np.ndarray:
        """format X matrix for linear model

        put 1's in the first column as feature for theta_0

        Args:
            x_i (np.ndarray): input x matrix

        Returns:
            np.ndarray: formatted x matrix
        """
        x_i = x_i.copy()
        if len(x_i.shape) == 1:
            x_i = x_i.reshape(-1, 1)

        if False in (x_i[..., 0] == 1):
            return np.hstack(tup=(np.ones(shape=(x_i.shape[0], 1)), x_i))
        else:
            return x_i

    @property
    def X(self) -> Union[np.ndarray, None]:
        """property X

        Returns:
            Union[np.ndarray, None]: X matrix
        """
        return self._X

    @property
    def y(self) -> Union[np.ndarray, None]:
        """property y

        Returns:
            Union[np.ndarray, None]: y matrix
        """
        return self._y

    @property
    def theta(self) -> Union[np.ndarray, None]:
        """property theta

        Returns:
            Union[np.ndarray, None]: theta matrix
        """
        return self._theta

    @property
    def theta_history(self) -> Union[list, None]:
        """theta training history

        Returns:
            Union[list, None]: theta history list
        """
        return self._theta_history

    @property
    def cost_history(self) -> Union[list, None]:
        """cost learning history

        Returns:
            Union[list, None]: cost history list
        """
        return self._cost_history


[docs]
    def predict(self, X: np.ndarray) -> np.ndarray:
        """generate prediction

        Args:
            X (np.ndarray): input feature matrix

        Raises:
            ValueError: if shape is not proper for the input feature
            Warning: if model is not trained yet

        Returns:
            np.ndarray: predicted values
        """

        if self._theta is not None:
            format_x = self._format_x_for_theta_0(X)
            if format_x.shape[1] == self._theta.shape[0]:
                y_pred = format_x @ self._theta  # (m,1) = (m,n) * (n,1)
                return y_pred
            elif format_x.shape[1] == self._theta.shape[1]:
                y_pred = format_x @ self._theta.T  # (m,1) = (m,n) * (n,1)
                return y_pred
            else:
                raise ValueError("Shape is not proper.")
        else:
            raise Warning("Model is not trained yet. Theta is None.")



[docs]
    def train(
        self,
        X: np.ndarray,
        y: np.ndarray,
        verbose: bool = True,
        method: str = "SGD",
        theta_precision: float = 0.001,
        penalty: Union[int, float] = 1.0,
        batch_size: int = 30,
    ) -> None:
        """train model /theta estimator

        Args:
            X (np.ndarray): X matrix/feature matrix.
            y (np.ndarray): y matrix/target matrix.
            verbose (bool, optional): print things. Defaults to True.
            method (str, optional): training method. Defaults to "SGD".

                    Available-
                        "BGD"(Batch Graident Descent),
                        "SGD"(Stochastic Gradient Descent)

            theta_precision (float, optional): theta initialization value precision. Defaults to 0.001.
            penalty (Union[float, int], optional): regularization penalty. Defaults to 1.0.
            batch_size (int, optional): batch size only for BGD. Defaults to 30.
        """

        self._X = self._format_x_for_theta_0(X)
        self._y = y

        # number of features+1 because of theta_0
        self._n = self._X.shape[1]
        self._m = self._y.shape[0]

        self._theta_history = []
        self._cost_history = []

        if method == "BGD":
            self._theta = np.random.rand(1, self._n) * theta_precision
            if verbose:
                print("random initial θ value :", self._theta)

            for iteration in range(self.iterations):
                # calculate y_pred
                y_pred = self.predict(self._X)
                # new θ to replace old θ
                new_theta = np.zeros_like(self._theta)

                # simultaneous operation
                ################################################################################################################

                gradient = np.mean((y_pred - self._y) * self._X, axis=0)  # type: ignore
                new_theta_0 = self._theta[:, [0]] - (self.alpha * gradient[0])  # type: ignore
                new_theta_rest = self._theta[:, range(1, self._n)] - (self.alpha * gradient[1:]) - (penalty / self._m)  # type: ignore

                new_theta = np.hstack((new_theta_0, new_theta_rest))

                if np.isnan(np.sum(new_theta)) or np.isinf(np.sum(new_theta)):
                    print("breaking. found inf or nan.")
                    break
                # override with new θ
                self._theta = new_theta

                # calculate cost to put in history
                cost = calculate_mse_cost(y_pred=self.predict(X=self._X), y=self._y)
                self._cost_history.append(cost)

                # calcualted theta in history
                self._theta_history.append(self._theta[0])

        elif method == "SGD":
            self._theta = np.random.rand(1, self._n) * theta_precision
            if verbose:
                print("random initial θ value :", self._theta)

            for iteration in range(self.iterations):

                indices = np.random.randint(0, self._m, size=batch_size)

                # X_batch = np.take(self._X, indices, axis=0)
                # y_batch = np.take(self._y, indices, axis=0)
                X_batch = self._X[indices, :]
                y_batch = self._y[indices, :]

                # calculate y_pred
                y_pred = self.predict(X_batch)
                # new θ to replace old θ
                new_theta = None

                # simultaneous operation
                ################################################################################################################

                gradient = np.mean((y_pred - y_batch) * X_batch, axis=0)  # type: ignore
                new_theta_0 = self._theta[:, [0]] - (self.alpha * gradient[0])  # type: ignore
                new_theta_rest = self._theta[:, range(1, self._n)] - (self.alpha * gradient[1:]) - (penalty / self._m)  # type: ignore

                new_theta = np.hstack((new_theta_0, new_theta_rest))

                if np.isnan(np.sum(new_theta)) or np.isinf(np.sum(new_theta)):
                    print("breaking. found inf or nan.")
                    break
                # override with new θ
                self._theta = new_theta

                # calculate cost to put in history
                cost = calculate_mse_cost(y_pred=self.predict(X=X_batch), y=y_batch)
                self._cost_history.append(cost)

                # calcualted theta in history
                self._theta_history.append(self._theta[0])

        else:
            print("No Method Defined.")





[docs]
class LogisticRegression:
    """Logisitic Regression Model Class

    Args:
        alpha (float, optional): [description]. Defaults to 0.01.
        iterations (int, optional): [description]. Defaults to 10000.

    References:
        https://machinelearningexploration.readthedocs.io/en/latest/LogisticRegression/Explore.html
    """

    def __init__(self, alpha: float = 0.01, iterations: int = 10000):
        self.alpha = alpha
        self.iterations = iterations
        self._theta = None
        self._X = None
        self._y = None
        self._theta_history = None
        self._cost_history = None
        self._n = None
        self._m = None

    def _format_x_for_theta_0(self, x_i: np.ndarray) -> np.ndarray:
        """format X matrix for linear model

        put 1's in the first column as feature for theta_0

        Args:
            x_i (np.ndarray): input x matrix

        Returns:
            np.ndarray: formatted x matrix
        """

        x_i = x_i.copy()
        if len(x_i.shape) == 1:
            x_i = x_i.reshape(-1, 1)

        if False in (x_i[..., 0] == 1):
            return np.hstack(tup=(np.ones(shape=(x_i.shape[0], 1)), x_i))
        else:
            return x_i

    @property
    def X(self) -> Union[np.ndarray, None]:
        """property X

        Returns:
            Union[np.ndarray, None]: X matrix
        """
        return self._X

    @property
    def y(self) -> Union[np.ndarray, None]:
        """property y

        Returns:
            Union[np.ndarray, None]: y matrix
        """
        return self._y

    @property
    def theta(self) -> Union[np.ndarray, None]:
        """property theta

        Returns:
            Union[np.ndarray, None]: theta matrix
        """
        return self._theta

    @property
    def theta_history(self) -> Union[list, None]:
        """theta training history

        Returns:
            Union[list, None]: theta history list
        """
        return self._theta_history

    @property
    def cost_history(self) -> Union[list, None]:
        """cost learning history

        Returns:
            Union[list, None]: cost history list
        """
        return self._cost_history


[docs]
    def predict(self, X: np.ndarray) -> np.ndarray:
        """generate prediction

        Args:
            X (np.ndarray): input feature matrix

        Raises:
            ValueError: if shape is not proper for the input feature
            Warning: if model is not trained yet

        Returns:
            np.ndarray: predicted values
        """
        if self._theta is not None:
            format_X = self._format_x_for_theta_0(X)

            if format_X.shape[1] == self._theta.shape[0]:
                y_pred = sigmoid(format_X @ self._theta)  # (m,1) = (m,n) * (n,1)
                return y_pred
            elif format_X.shape[1] == self._theta.shape[1]:
                y_pred = sigmoid(format_X @ self._theta.T)  # (m,1) = (m,n) * (n,1)
                return y_pred
            else:
                raise ValueError("Shape is not proper.")
        else:
            raise Warning("Model is not trained yet. Theta is None.")



[docs]
    def train(
        self,
        X: np.ndarray,
        y: np.ndarray,
        verbose: bool = True,
        method: str = "SGD",
        theta_precision: float = 0.001,
        batch_size: int = 30,
        regularization: bool = False,
        penalty: Union[float, int] = 1.0,
    ) -> None:
        """train theta / estimator

        Args:
            X (np.ndarray): X matrix/feature matrix.
            y (np.ndarray): y matrix/target matrix.
            verbose (bool, optional): print things. Defaults to True.
            method (str, optional): training method. Defaults to "SGD".

                    Available-
                        "BGD"(Batch Graident Descent),
                        "SGD"(Stochastic Gradient Descent)

            theta_precision (float, optional): theta initialization value precision. Defaults to 0.001.
            batch_size (int, optional): batch size only for BGD. Defaults to 30.
            regularization (bool, optional): Apply Regularization. Defaults to False.
            penalty (Union[float, int], optional): regularization penalty only works for regularization=True. Defaults to 1.0.
        """

        self._X = self._format_x_for_theta_0(X)
        self._y = y

        # number of features+1 because of theta_0
        self._n = self._X.shape[1]
        self._m = self._y.shape[0]

        self._theta_history = []
        self._cost_history = []

        if method == "BGD":
            self._theta = np.random.rand(1, self._n) * theta_precision
            if verbose:
                print("random initial θ value :", self._theta)

            for iteration in range(self.iterations):
                # calculate y_pred
                y_pred = self.predict(self._X)

                # new θ to replace old θ
                new_theta = None

                # simultaneous operation

                if regularization:
                    gradient = np.mean((y_pred - self._y) * self._X, axis=0)
                    new_theta_0 = self._theta[:, [0]] - (self.alpha * gradient[0])
                    new_theta_rest = self._theta[:, range(1, self._n)] * (
                        1 - (penalty / self._m)
                    ) - (self.alpha * gradient[1:])
                    new_theta = np.hstack((new_theta_0, new_theta_rest))

                else:
                    gradient = np.mean((y_pred - self._y) * self._X, axis=0)
                    new_theta = self._theta - (self.alpha * gradient)

                if np.isnan(np.sum(new_theta)) or np.isinf(np.sum(new_theta)):
                    print("breaking. found inf or nan.")
                    break
                # override with new θ
                self._theta = new_theta

                # calculate cost to put in history
                cost = calculate_entropy_cost(y_pred=self.predict(X=self._X), y=self._y)
                self._cost_history.append(cost)

                # calcualted theta in history
                self._theta_history.append(self._theta[0])

        elif method == "SGD":  # stochastic gradient descent
            self._theta = np.random.rand(1, self._n) * theta_precision
            if verbose:
                print("random initial θ value :", self._theta)

            for iteration in range(self.iterations):

                # creating indices for batches
                indices = np.random.randint(0, self._m, size=batch_size)

                # creating batch for this iteration
                # X_batch = np.take(self._X, indices, axis=0)
                # y_batch = np.take(self._y, indices, axis=0)
                X_batch = self._X[indices, :]
                y_batch = self._y[indices, :]

                # calculate y_pred
                y_pred = self.predict(X_batch)
                # new θ to replace old θ
                new_theta = None

                # simultaneous operation
                if regularization:
                    gradient = np.mean((y_pred - y_batch) * X_batch, axis=0)
                    new_theta_0 = self._theta[:, [0]] - (self.alpha * gradient[0])
                    new_theta_rest = self._theta[:, range(1, self._n)] * (
                        1 - (penalty / self._m)
                    ) - (self.alpha * gradient[1:])
                    new_theta = np.hstack((new_theta_0, new_theta_rest))

                else:
                    gradient = np.mean((y_pred - y_batch) * X_batch, axis=0)
                    new_theta = self._theta - (self.alpha * gradient)

                if np.isnan(np.sum(new_theta)) or np.isinf(np.sum(new_theta)):
                    print("breaking. found inf or nan.")
                    break
                # override with new θ
                self._theta = new_theta

                # calculate cost to put in history
                cost = calculate_entropy_cost(y_pred=self.predict(X=X_batch), y=y_batch)
                self._cost_history.append(cost)

                # calcualted theta in history
                self._theta_history.append(self._theta[0])

        else:
            print("No Method Defined.")





[docs]
def polynomial_regression(
    x: np.ndarray, y: np.ndarray, degree: int
) -> Tuple[np.ndarray, np.ndarray, np.ndarray]:
    """
    fit Regression line with polynomial degree.

    Args:
        x (np.ndarray): independent variable.
        y (np.ndarray): dependent variable.
        degree (int): polynomial degree.

    Returns:
        Tuple[np.ndarray, np.ndarray, np.ndarray]: slope, residual, fitline.

    Examples:
        >>> import matplotlib.pyplot as plt
        >>> x = np.arange(-10, 10)
        >>> y = x**2 + x**3
        >>> s, r, l = polynomial_regression(x, y, 3)
        >>> plt.plot(x, y, 'ko', label='original')
        >>> plt.plot(x, l, '.-',  label='regression line')
        >>> plt.legend()
        >>> plt.show()
    """
    a = np.polynomial.Polynomial.fit(x, y, deg=degree).convert().coef

    if len(a) == 1:
        slope = a
        resid = np.array([0])
    else:
        slope = a[1:]
        resid = a[0]
    fit_line = (
        np.array([(x ** (degree - i)) * slope[i] for i in range(0, degree)]).sum(axis=0)
        + resid
    )
    return slope, resid, fit_line




[docs]
def trend(x: np.ndarray, y: np.ndarray) -> Tuple[np.ndarray, np.ndarray, np.ndarray]:
    """
    get trend of the data.

    Args:
        x (np.ndarray): independent variable.
        y (np.ndarray): dependent variable.

    Returns:
        Tuple[np.ndarray, np.ndarray, np.ndarray]: slope, residual, trendline.

    Examples;
        >>> import matplotlib.pyplot as plt
        >>> x = np.array([1, 2, 3, 4, 5, 6, 7, 8])
        >>> y = np.array([1, 2, 3, 3, 4, 5, 7, 10])
        >>> s, r, t = trend(x, y)
        >>> plt.plot(x, y, 'o', label='original')
        >>> plt.plot(x, t, '.-',  label='regression line')
        >>> plt.legend()
        >>> plt.show()
    """
    return polynomial_regression(x, y, 1)



if __name__ == "__main__":
    import matplotlib.pyplot as plt
    import matplotlib

    x = np.array([1, 2, 3, 4, 5, 6, 7, 8])
    y = np.array([1, 2, 3, 3, 4, 5, 7, 10])
    s, r, t = trend(x, y)
    plt.plot(x, y, "o", label="original", alpha=0.6)
    plt.plot(x, t, ".-", label="regression line")
    plt.legend()
    plt.show(block=True)

    x = np.arange(1, 10)
    y = x**2 + x**3
    s, r, l = polynomial_regression(x, y, 1)

    plt.plot(x, y, "ko", label="original", alpha=0.6)
    plt.plot(x, l, ".-", label="regression line")
    plt.legend()
    plt.show()

    # pass