author: daodeiv (David Stankov) daodavid

Logistic Regression

Logistic regression estimates the probability of an event occurring, such as voted or didn't vote, based on a given dataset of independent variables. Since the outcome is a probability, the dependent variable is bounded between 0 and 1. The best way to think about logistic regression is that it is linear regression, but for classification problems. Logistic regression essentially uses the logistic function defined below to model a binary output variable (Tolles & Meurer, 2016). The primary difference between linear regression and logistic regression is that the range of logistic regression is bounded between 0 and 1. In addition, unlike linear regression, logistic regression does not require a linear relationship between the inputs and the output variable.

Log-odds or Logit function

The odds of an event $A$ is the probability that $A$ occurs divided by the probability that it does not occur:

$$1) \; \; \; odds(p) = \frac{p(A)}{1-p(A)} $$ where $p(A)\in [0,1)$. Let's see the graph of the function.
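As a small sketch (assuming NumPy and matplotlib are available, and using a grid of probabilities that excludes the endpoints to avoid division by zero), the odds function can be plotted like this:

```python
import numpy as np
import matplotlib.pyplot as plt

# grid of probabilities, excluding the endpoints to avoid division by zero
p = np.linspace(0.01, 0.99, 200)
odds = p / (1 - p)

plt.plot(p, odds)
plt.xlabel("p", size=20)
plt.ylabel("odds", size=20)
plt.show()
```

Note how the odds blow up as $p(A)$ approaches 1.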

We can transform the odds function into another one that is more convenient for interpretation, without losing the underlying information. It is called the log-odds or logit function:


$$2)\; \; \; logit(P) = \log(odds)=\log{ \frac{P(A)}{1- P(A)} } $$

```python
# reuse p and odds defined above
plt.plot(p, np.log(odds))   # log-odds (logit) as a function of p
plt.xlabel("p", size=20)
plt.ylabel("log-odds", size=20)
plt.show()
```

The properties of the log-odds(p) function that we should point out:

- it is defined for $p \in (0, 1)$ and its range is the whole real line $(-\infty, +\infty)$;
- it is monotonically increasing in $p$;
- $logit(0.5) = 0$: even odds correspond to a log-odds of zero;
- it is antisymmetric around $p = 0.5$: $logit(1-p) = -logit(p)$.

The mathematical origin of the sigmoid function

Logistic regression is based on the assumption that the log-odds is a linear function of the feature values of the dataset.

$$ 3) \; \; log(\frac{p^i}{1-p^i})=h(x^i)$$


where
$$h(x^i)= \vartheta_0 + \vartheta_1 x^i_{1} + \vartheta_2 x^i_{2}+ \dots + \vartheta_p x^i_{p} $$

where $i$ is the index of the observation, $x^i_m$ are the feature values, $\vartheta_0$ is the intercept and $\vartheta_{m}$ is the weight (slope coefficient) of each explanatory variable.
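As a small illustration (the names X, theta0 and theta below are our own, not from the original text), $h$ is just an affine function of the features and can be evaluated for all observations at once:

```python
import numpy as np

# toy design matrix: 4 observations, 2 features
X = np.array([[1.0, 2.0],
              [2.0, 0.5],
              [0.3, 1.7],
              [1.5, 1.5]])

theta0 = -1.0                  # intercept
theta = np.array([0.8, -0.4])  # one weight per feature

# h(x^i) = theta0 + theta1*x1^i + theta2*x2^i for every row i
h = theta0 + X @ theta
print(h)
```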

Let's do some math

If we exponentiate both sides of eq. 3) with base $e$:

$$e^{log(\frac{p^i}{1-p^i})} = e^{h(x^i)} \Leftrightarrow $$

$$ \frac{p^i}{1-p^i} = e^{h(x^i)} \Leftrightarrow $$

$$ p^i = e^{h(x^i)}-p^i e^{h(x^i)} \Leftrightarrow $$

$$ p^i(1+e^{h(x^i)} ) = e^{h(x^i)} \Leftrightarrow $$

$$p^i= \frac {e^{h(x^i)}} {1 +e^{h(x^i)}} \Leftrightarrow $$

$$ p^i= \frac {e^{h(x^i)}e^{-h(x^i)}} {(1 +e^{h(x^i)})e^{-h(x^i)}} \Leftrightarrow $$



$$p^i= \frac{1}{1 +e^{-h(x^i)} } $$

Usually $p^i$ is written as $\sigma^i$ or $\sigma_i$, and this function is called the sigmoid:

$$\sigma^i= \frac{1}{1 +e^{-h(x^i)} } $$
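A minimal NumPy sketch of the sigmoid (the function name sigmoid is our own choice):

```python
import numpy as np

def sigmoid(h):
    """Map the linear score h(x) to a probability in (0, 1)."""
    return 1.0 / (1.0 + np.exp(-h))

print(sigmoid(0.0))   # 0.5
print(sigmoid(4.0))   # close to 1
print(sigmoid(-4.0))  # close to 0
```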

Properties and Identities Of Sigmoid Function

The sigmoid function has very interesting properties. Let's check out, for example: $$\sigma =\frac{1}{1 +e^{-(2x + 4)} }$$

The graph of the sigmoid function is an S-shaped curve. Its main properties are:

- its range is the open interval $(0, 1)$, so its output can be interpreted as a probability;
- $\sigma(0) = 0.5$;
- it is monotonically increasing;
- $\sigma(-x) = 1 - \sigma(x)$;
- its derivative can be expressed through the function itself, $\sigma'(x) = \sigma(x)(1 - \sigma(x))$, an identity we will use below.
Using the sigmoid function we can model a binary output: if $\sigma(x) < 0.5$ the predicted class is $0$ ('False'), otherwise it is $1$ ('True').
Let's see the sigmoid with different weights $\vartheta_{0}$ and $\vartheta_{1}$.
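Below is a small matplotlib sketch (the chosen weight values are arbitrary, our own) showing how the intercept $\vartheta_0$ shifts the S-curve along the x-axis and the slope $\vartheta_1$ controls its steepness:

```python
import numpy as np
import matplotlib.pyplot as plt

x = np.linspace(-10, 10, 400)

# a few (intercept, slope) pairs to compare
for theta0, theta1 in [(0, 1), (0, 3), (2, 1), (-2, 0.5)]:
    sigma = 1.0 / (1.0 + np.exp(-(theta0 + theta1 * x)))
    plt.plot(x, sigma, label=f"$\\vartheta_0$={theta0}, $\\vartheta_1$={theta1}")

plt.xlabel("x", size=20)
plt.ylabel("$\\sigma(x)$", size=20)
plt.legend()
plt.show()
```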

The purpose of logistic regression is to find the curve that fits the given dataset as well as possible.

Maximum Likelihood of Logistic regression, Cross-entropy loss

The logistic regression model is literally a model for the $p$ parameter of a binomial distribution.

$$P(y_i|X,\theta) = \frac{n!}{y_i!(n-y_i)!} \sigma_i^{y_i}(1 - \sigma_i )^{n-y_i} $$

when $n=1$

$$P(y_i|x_i,\theta) =\sigma_i^{y_i}(1 - \sigma_i )^{1-y_i}$$

so that the probability reduces to $\sigma_i$ when $y_i = 1$ and to $1-\sigma_i$ when $y_i = 0$.

Maximum Likelihood Estimation, or MLE for short, is a probabilistic framework for estimating the parameters of a model. In MLE we wish to maximize the conditional probability of the observed data given a specific probability distribution and its parameters $(\theta)$, stated formally as $P(y|X,\theta)$. Because the $y_i$ are independent, we can write it as a joint probability:

$$ \arg\max_{\Theta} P(y|X,\theta) = \arg\max_{\Theta} P(y_1|x_1,\theta)P(y_2|x_2,\theta)\cdots P(y_m|x_m,\theta)= \arg\max_{\Theta} \prod_{i=1}^{m}\sigma_i^{y_i}(1 - \sigma_i )^{1-y_i}$$

where $\sigma_i$ is the sigmoid, i.e. the probability of class $1$ that our model predicts for observation $i$.

As with linear regression, we can maximize the log-likelihood instead, because the logarithm is a monotonic function: $$\log \big(\prod_{i=1}^{m}\sigma_i^{y_i}(1 - \sigma_i )^{1-y_i} \big) = \sum_{i=1}^m \big (y^i\log\sigma^i + (1-y^i)\log{(1 -\sigma^i)}\big)$$

If we take the log-likelihood above with a minus sign, then instead of maximizing we can minimize that function:

$$\Theta = \arg\max_{\Theta}\log \big(\prod_{i=1}^{m}\sigma_i^{y_i}(1 - \sigma_i )^{1-y_i} \big) = \arg\min_{\Theta}\Big(-\log\big(\prod_{i=1}^{m}\sigma_i^{y_i}(1 - \sigma_i )^{1-y_i} \big)\Big) $$

Our purpose is to minimize $$4) \; \; \; \mathcal{L} = -\frac{1}{m}\sum_{i=1}^m \big (y^i\log\sigma^i + (1-y^i)\log{(1 -\sigma^i)}\big)$$ where the $\frac{1}{m}$ factor averages the loss over the observations and does not change the location of the minimum.

This equation is called the $cross\text{-}entropy \; loss$. The next step is to optimize it in order to find its minimum.
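A minimal NumPy sketch of eq. 4) (the function name cross_entropy and the eps clipping are our own additions, the latter to avoid $\log(0)$):

```python
import numpy as np

def cross_entropy(y, sigma, eps=1e-12):
    """Average cross-entropy loss between labels y and predicted probabilities sigma."""
    sigma = np.clip(sigma, eps, 1 - eps)
    return -np.mean(y * np.log(sigma) + (1 - y) * np.log(1 - sigma))

y = np.array([1, 0, 1, 1])
sigma = np.array([0.9, 0.2, 0.7, 0.6])
print(cross_entropy(y, sigma))
```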

Mathematical derivation of the cross-entropy loss gradient. Gradient Descent

Gradient descent updates each weight in the direction opposite to the gradient of the loss: $$5) \; \; \theta_m = \theta_m - \eta\,\nabla_{\theta_m} \mathcal{L}(\Theta)$$ where $\eta$ is the learning rate (step size).

Let's find the partial derivative $\frac{\partial \mathcal{L} (\Theta)}{\partial \theta_k}$:

$\; \;\frac{\partial \mathcal{L} (\Theta)}{\partial \theta_k} = -\frac{1}{m}\sum_i^m\big(y^i\frac{\partial \log(\sigma^i)}{\partial \theta_k}+ (1-y^i)\frac{\partial \log(1-\sigma^i)}{\partial \theta_k}\big) $

$= -\frac{1}{m}\sum_i^m\big(y^i \frac{d\log(\sigma^i)}{d\sigma^i}\frac{\partial \sigma^i}{\partial \theta_k}+ (1-y^i) \frac{d\log(1- \sigma^i)}{d\sigma^i}\frac{\partial \sigma^i}{\partial \theta_k}\big) $

$= -\frac{1}{m}\sum_i^m\big(y^i \frac{1}{\sigma^i}\frac{\partial \sigma^i}{\partial \theta_k}+ (1-y^i) \frac{1 }{1- \sigma^i}\frac{-\partial \sigma^i}{\partial \theta_k}\big) $

Let's calculate $\frac{\partial \sigma^i}{\partial \theta_k} = \frac{d}{dh(x^i)}\Big(\frac{1}{1 +e^{-h(x^i)}}\Big)\frac{\partial h(x^i)}{\partial \theta_k} =\frac{e^{-h(x^i)}}{(1+e^{-h(x^i)})^2}\frac{\partial h(x^i)}{\partial \theta_k} =\frac{1}{1+e^{- h(x^i)}}\Big(1 -\frac{1}{1+e^{-h(x^i)}}\Big)\frac{\partial h(x^i)}{\partial \theta_k} = \sigma^i (1 - \sigma^i)\frac{\partial h(x^i)}{\partial \theta_k} $, and applying it above we obtain

$\; \; \frac{\partial \mathcal{L} (\Theta)}{\partial \theta_k} = -\frac{1}{m}\sum_i^m\big(y^i \frac{1}{\sigma^i}\sigma^i (1 - \sigma^i) \frac{\partial h(x^i)}{\partial \theta_k} + (1-y^i) \frac{1 }{1- \sigma^i}\big(-\sigma^i(1 - \sigma^i)\big)\frac{\partial h(x^i)}{\partial \theta_k}\big) $

$= -\frac{1}{m}\sum_i^m\big(y^i\frac{\partial h(x^i)}{\partial \theta_k} -y^i \sigma^i\frac{\partial h(x^i)}{\partial \theta_k} +y^i\sigma^i\frac{\partial h(x^i)}{\partial \theta_k}- \sigma^i\frac{\partial h(x^i)}{\partial \theta_k}\big)$

$= -\frac{1}{m}\sum_i^m\big(y^i\frac{\partial h(x^i)}{\partial \theta_k}- \sigma^i\frac{\partial h(x^i)}{\partial \theta_k}\big)= -\frac{1}{m}\sum_i^m\big(y^i - \sigma^i\big) \frac{\partial h(x^i)}{\partial \theta_k}$

Since $h(x^i) = \theta_m x^i_m$ (with summation over the repeated index $m$ implied), we have $\frac{\partial h(x^i)}{\partial \theta_k} = \frac{\partial (\theta_m x^i_m)}{\partial \theta_k} = \delta_{mk}x^i_m = x^i_k$. Applying this result above (and renaming the index $k$ back to $m$) we obtain

$$\frac{\partial \mathcal{L}(\Theta)}{\partial \theta_m} = - \frac{1}{m}\sum_i^m\big(y^i - \sigma^i\big)x^i_m$$

Collecting the partial derivatives for all weights, we can write the result above in matrix form, suitable for NumPy computation:

$$ \nabla_{\Theta} \mathcal{L} = -\frac{1}{m} X^T(Y - \sigma) = \frac{1}{m} X^T(\sigma - Y)$$
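A NumPy sketch of this formula (the function name gradient is our own; X is assumed to already contain a column of ones for the intercept):

```python
import numpy as np

def gradient(theta, X, y):
    """Gradient of the average cross-entropy loss: (1/m) * X^T (sigma - y)."""
    m = X.shape[0]
    sigma = 1.0 / (1.0 + np.exp(-(X @ theta)))
    return X.T @ (sigma - y) / m
```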

Implementation of BinaryLogisticRegression using numpy
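Below is a minimal sketch of such an implementation, trained with batch gradient descent according to eqs. 4) and 5) (the class interface, default learning rate and iteration count are our own assumptions, not necessarily the original code):

```python
import numpy as np

class BinaryLogisticRegression:
    """Binary logistic regression trained with batch gradient descent."""

    def __init__(self, learning_rate=0.1, n_iterations=5000):
        self.learning_rate = learning_rate
        self.n_iterations = n_iterations
        self.theta = None

    @staticmethod
    def _sigmoid(h):
        return 1.0 / (1.0 + np.exp(-h))

    @staticmethod
    def _add_intercept(X):
        # prepend a column of ones so that theta[0] plays the role of the intercept
        return np.hstack([np.ones((X.shape[0], 1)), X])

    def fit(self, X, y):
        X = self._add_intercept(np.asarray(X, dtype=float))
        y = np.asarray(y, dtype=float)
        m, n = X.shape
        self.theta = np.zeros(n)
        for _ in range(self.n_iterations):
            sigma = self._sigmoid(X @ self.theta)
            grad = X.T @ (sigma - y) / m          # (1/m) X^T (sigma - y)
            self.theta -= self.learning_rate * grad
        return self

    def predict_proba(self, X):
        X = self._add_intercept(np.asarray(X, dtype=float))
        return self._sigmoid(X @ self.theta)

    def predict(self, X):
        # class 1 if the predicted probability is at least 0.5
        return (self.predict_proba(X) >= 0.5).astype(int)
```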

We will test our implementation on the banknote authentication dataset.
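A usage sketch, assuming the UCI banknote authentication data has been downloaded locally as data_banknote_authentication.txt (four numeric features and the class label in the last column):

```python
import numpy as np

# columns: variance, skewness, curtosis, entropy, class
data = np.loadtxt("data_banknote_authentication.txt", delimiter=",")
X, y = data[:, :-1], data[:, -1]

# simple hold-out split
rng = np.random.default_rng(0)
idx = rng.permutation(len(y))
split = int(0.8 * len(y))
train, test = idx[:split], idx[split:]

model = BinaryLogisticRegression(learning_rate=0.1, n_iterations=5000)
model.fit(X[train], y[train])

accuracy = (model.predict(X[test]) == y[test]).mean()
print(f"test accuracy: {accuracy:.3f}")
```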

References

[1] What is logistic regression?
[2] Maximum Likelihood and Logistic Regression
[3] Scott A. Czepiel, Maximum Likelihood Estimation of Logistic Regression Models: Theory and Implementation