Skip to content
Merged
Changes from 6 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
65 changes: 63 additions & 2 deletions machine_learning/logistic_regression.py
Original file line number Diff line number Diff line change
Expand Up @@ -27,7 +27,7 @@
# classification problems


def sigmoid_function(z):
def sigmoid_function(z: np.ndarray) -> np.ndarray:
"""
Also known as Logistic Function.

Expand All @@ -42,11 +42,68 @@ def sigmoid_function(z):

@param z: input to the function
@returns: returns value in the range 0 to 1

Examples:
>>> sigmoid_function(4)
0.9820137900379085
>>> sigmoid_function(np.array([-3, 3]))
array([0.04742587, 0.95257413])
>>> sigmoid_function(np.array([-3, 3, 1]))
array([0.04742587, 0.95257413, 0.73105858])
>>> sigmoid_function(np.array([-0.01, -2, -1.9]))
array([0.49750002, 0.11920292, 0.13010847])
>>> sigmoid_function(np.array([-1.3, 5.3, 12]))
array([0.21416502, 0.9950332 , 0.99999386])
>>> sigmoid_function(np.array([0.01, 0.02, 4.1]))
array([0.50249998, 0.50499983, 0.9836975 ])
>>> sigmoid_function(np.array([0.8]))
array([0.68997448])
"""
return 1 / (1 + np.exp(-z))


def cost_function(h, y):
def cost_function(h: np.ndarray, y: np.ndarray) -> int:
"""
Cost function quantifies the error between predicted and expected values.
The cost function used in Logistic Regression is called Log Loss
or Cross Entropy Function.

J(θ) = (1/m) * Σ [ -y * log(hθ(x)) - (1 - y) * log(1 - hθ(x)) ]

Where:
- J(θ) is the cost that we want to minimize during training
- m is the number of training examples
- Σ represents the summation over all training examples
- y is the actual binary label (0 or 1) for a given example
- hθ(x) is the predicted probability that x belongs to the positive class

@param h: the output of sigmoid function. It is the estimated probability
that the input example 'x' belongs to the positive class

@param y: the actual binary label associated with input example 'x'

Examples:
>>> estimations = np.array([
... sigmoid_function(0.3), sigmoid_function(-4.3), sigmoid_function(8.1)
... ])
>>> cost_function(h=estimations, y=np.array([1, 0, 1]))
0.18937868932131605
>>> estimations = np.array([
... sigmoid_function(4), sigmoid_function(3), sigmoid_function(1)
... ])
>>> cost_function(h=estimations, y=np.array([1, 0, 0]))
1.459999655669926
>>> estimations = np.array([
... sigmoid_function(4), sigmoid_function(-3), sigmoid_function(-1)
... ])
>>> cost_function(h=estimations, y=np.array([1, 0, 0]))
0.1266663223365915
>>> cost_function(h=np.array([sigmoid_function(0)]), y=np.array([1]))
0.6931471805599453

References:
- https://en.wikipedia.org/wiki/Logistic_regression
"""
return (-y * np.log(h) - (1 - y) * np.log(1 - h)).mean()


Expand Down Expand Up @@ -75,6 +132,10 @@ def logistic_reg(alpha, x, y, max_iterations=70000):
# In[68]:

if __name__ == "__main__":
import doctest

doctest.testmod()

iris = datasets.load_iris()
x = iris.data[:, :2]
y = (iris.target != 0) * 1
Expand Down