import numpy as np # numeric operations

def generate_data(samples=1000, features=3, seed=None):
    """Generate a synthetic binary classification dataset.

    Features are standard-normal values with a little Gaussian noise added.
    Labels come from a randomly drawn linear model (weights + bias) whose
    noisy output is passed through a sigmoid and thresholded at 0.5.

    Args:
        samples: number of rows to generate.
        features: number of feature columns per row.
        seed: optional seed. When given, a private ``RandomState`` is used so
            the result is reproducible and the global NumPy random state is
            left untouched. When ``None`` (default), the global ``np.random``
            state is used, exactly as before.

    Returns:
        Tuple ``(X, y)`` where ``X`` has shape ``(samples, features)`` and
        ``y`` is an integer array of 0/1 labels with shape ``(samples, 1)``.
    """
    # Fall back to the global generator so callers that rely on
    # np.random.seed(...) keep getting the same stream.
    rng = np.random if seed is None else np.random.RandomState(seed)

    X = rng.randn(samples, features)                    # base features
    X += rng.normal(0, 0.1, X.shape)                    # feature noise
    true_weights = rng.randn(features, 1)               # hidden weights of the generating model
    true_bias = rng.randn()                             # hidden bias of the generating model
    combination = X.dot(true_weights) + true_bias       # linear score per sample
    combination += rng.normal(0, 0.1, (samples, 1))     # noise on the score, so labels are not perfectly separable
    probabilities = 1 / (1 + np.exp(-combination))      # sigmoid of the noisy score
    y = (probabilities > 0.5).astype(int)               # hard 0/1 labels
    return X, y

X, y = generate_data()  # generate synthetic data using the defaults (1000 samples, 3 features)

def split_data(X, y, test_size=0.2):
    """Randomly partition features and labels into train and test subsets.

    Rows are shuffled with NumPy's global random state, then the first
    ``int(n * (1 - test_size))`` shuffled rows become the training set and
    the remainder the test set.

    Args:
        X: feature array indexed by row along the first axis.
        y: label array with one entry (or row) per row of ``X``.
        test_size: fraction of the rows to hold out for testing.

    Returns:
        ``(X_train, X_test, y_train, y_test)``; both label arrays are
        flattened to 1-D.
    """
    n_samples = X.shape[0]

    # Random row order shared by features and labels so pairs stay aligned.
    order = np.arange(n_samples)
    np.random.shuffle(order)

    # Position in the shuffled order where training rows end.
    cutoff = int(n_samples * (1 - test_size))
    train_rows, test_rows = order[:cutoff], order[cutoff:]

    return (
        X[train_rows],              # training features
        X[test_rows],               # testing features
        y[train_rows].flatten(),    # training labels
        y[test_rows].flatten(),     # testing labels
    )

X_train, X_test, y_train, y_test = split_data(X, y) # shuffle and split features/labels into train and test sets (default test_size=0.2)

def sigmoid(z):
    """Return the logistic sigmoid ``1 / (1 + exp(-z))`` of ``z``, element-wise.

    Computed as ``exp(-log(1 + exp(-z)))`` via ``np.logaddexp``, which is
    mathematically identical but never evaluates ``exp`` of a large positive
    number, so very negative inputs do not trigger overflow warnings.

    Args:
        z: scalar or array-like of real values.

    Returns:
        Value(s) in the range [0, 1] with the same shape as ``z``.
    """
    # logaddexp(0, -z) == log(exp(0) + exp(-z)) == log(1 + exp(-z))
    return np.exp(-np.logaddexp(0.0, np.negative(z)))

def compute_loss(y, probs):
    """Return the mean binary cross-entropy between labels and probabilities.

    Args:
        y: array of 0/1 labels.
        probs: array of predicted probabilities for the positive class.

    Returns:
        Average of ``-(y*log(p) + (1-y)*log(1-p))`` over all entries.
    """
    tiny = 1e-15
    # Keep probabilities strictly inside (0, 1) so neither log sees 0.
    safe = np.clip(probs, tiny, 1 - tiny)
    per_sample = y * np.log(safe) + (1 - y) * np.log(1 - safe)
    return -np.mean(per_sample)

def predict_proba(X, weights, bias):
    """Return the predicted positive-class probability for each row of ``X``.

    Args:
        X: feature array.
        weights: model weights, combined with ``X`` via ``np.dot``.
        bias: scalar offset added to every linear score.

    Returns:
        ``sigmoid(np.dot(X, weights) + bias)``.
    """
    logits = bias + np.dot(X, weights)  # linear score per sample
    return sigmoid(logits)              # squash scores into probabilities

def parameter_initialization(X):
    """Create the starting parameters for training.

    Args:
        X: 2-D feature array; only its column count is used.

    Returns:
        ``(weights, bias)`` where ``weights`` is a 1-D array of zeros with
        one entry per feature column and ``bias`` is ``0.0``.
    """
    n_features = X.shape[1]
    return np.zeros(n_features), 0.0

weights, bias = parameter_initialization(X_train)   # start from zero weights (one per feature column) and a zero bias

def train(X, y, weights, bias, epochs = 1000, learning_rate = 0.1):
    """Fit logistic-regression parameters with batch gradient descent.

    Each epoch predicts probabilities for all samples, records the
    cross-entropy loss and the mean signed error, and moves the weights and
    bias one step against the gradient.

    Args:
        X: training features, one row per sample.
        y: training labels with one entry per sample; its shape must match
            the output of ``predict_proba(X, weights, bias)``.
        weights: initial weights. They are copied, so the caller's array is
            not modified.
        bias: initial scalar bias.
        epochs: number of full passes over the data.
        learning_rate: step size applied to both gradients.

    Returns:
        ``(weights, bias, loss_history, error_history)`` where the two
        histories are lists with one entry per epoch. ``error_history`` holds
        the mean of ``probs - y``, a signed value in which positive and
        negative errors can cancel.
    """
    # Work on a private float copy: the in-place updates below would otherwise
    # overwrite the caller's array, and would fail for integer-typed weights.
    weights = np.array(weights, dtype=float)

    loss_history = []   # loss recorded before each parameter update
    error_history = []  # mean signed error recorded before each update

    # Progress is printed every tenth of the run; 0 disables printing for
    # runs shorter than 10 epochs (and avoids a modulo by zero).
    report_every = epochs // 10 if epochs >= 10 else 0

    for epoch in range(epochs):
        # forward pass
        probs = predict_proba(X, weights, bias)

        # loss and error for this epoch
        loss = compute_loss(y, probs)
        error = probs - y
        average_error = np.mean(error)

        loss_history.append(loss)
        error_history.append(average_error)

        # gradients of the mean cross-entropy loss
        gradient_weights = np.dot(X.T, error) / len(y)
        gradient_bias = average_error   # d(loss)/d(bias) is the mean error

        # gradient-descent step
        weights -= learning_rate * gradient_weights
        bias -= learning_rate * gradient_bias

        if report_every and epoch % report_every == 0:
            print(f"Epoch {epoch}, Loss: {loss:.2f}")

    return weights, bias, loss_history, error_history

learned_weights, learned_bias, loss_history, error_history = train(X_train, y_train, weights, bias) # train on the training split with the default epochs and learning rate

Epoch 0, Loss: 0.69
Epoch 100, Loss: 0.27
Epoch 200, Loss: 0.21
Epoch 300, Loss: 0.18
Epoch 400, Loss: 0.16
Epoch 500, Loss: 0.14
Epoch 600, Loss: 0.13
Epoch 700, Loss: 0.13
Epoch 800, Loss: 0.12
Epoch 900, Loss: 0.12

def predict(X, weights, bias, threshold = 0.5):
    """Predict hard 0/1 labels for each row of ``X``.

    Args:
        X: feature array.
        weights: trained model weights.
        bias: trained scalar bias.
        threshold: probability at or above which a sample is labelled 1.

    Returns:
        Integer array of 0/1 labels, one per probability returned by
        ``predict_proba``.
    """
    # Reuse the shared probability helper instead of repeating the
    # linear-combination + sigmoid steps here.
    probability = predict_proba(X, weights, bias)
    return (probability >= threshold).astype(int)

predictions = predict(X_test, learned_weights, learned_bias)    # predict 0/1 labels for the held-out test features (default threshold 0.5)

def score(predictions, actual):
    """Return classification accuracy: the fraction of matching labels.

    Both inputs are converted to flat NumPy arrays first, so plain lists are
    compared element-wise and a column vector ``(n, 1)`` compared with a flat
    ``(n,)`` array is not silently broadcast into an ``(n, n)`` comparison.

    Args:
        predictions: predicted labels (array-like).
        actual: true labels (array-like) with the same number of entries.

    Returns:
        Proportion of positions where the two inputs are equal.

    Raises:
        ValueError: if the inputs contain a different number of labels.
    """
    predicted = np.asarray(predictions).ravel()
    expected = np.asarray(actual).ravel()
    if predicted.shape != expected.shape:
        raise ValueError(
            f"predictions and actual must have the same number of labels, "
            f"got {predicted.size} and {expected.size}"
        )
    return np.mean(predicted == expected)

accuracy = score(predictions, y_test)           # proportion of test predictions that equal the true labels
print(f"Accuracy Score: {accuracy*100:.2f}%")   # report accuracy as a percentage with two decimals

Accuracy Score: 96.00%

import matplotlib.pyplot as plt # for making graphs

plt.plot(loss_history)          # plot the loss recorded at each training epoch
plt.title("Loss vs Epoch")      # add title
plt.ylabel("Loss")              # y axis label
plt.xlabel("Epoch")             # x axis label
plt.show()                      # display plot

plt.plot(error_history)             # plot the mean signed error (probs - y) recorded at each epoch
plt.title("Average Error vs Epoch") # add title
plt.ylabel("Average Error")         # y axis label
plt.xlabel("Epoch")                 # x axis label
plt.show()                          # display plot

Logistic Regression From Scratch

Background

Step 1: Data Preparation

Step 2: Training Functions

Step 3: Model Training

Step 4: Predict

Step 5: Evaluate

Author and License