Simple Perceptron Implementation¶
by Mihai Dan Nadăș (mihai.nadas@ubbcluj.ro), January 2025
This notebook implements a version of the perceptron as introduced in Frank Rosenblatt's 1958 paper, "The Perceptron: A Probabilistic Model for Information Storage and Organization in the Brain."
We will utilize basic math concepts, minimizing linear algebra (vectors and matrices) where possible.
Introduction to the Perceptron¶
A perceptron is a simple computational model of a neuron. It forms the foundation of neural networks and works by taking weighted inputs and applying a threshold function to produce an output. This notebook showcases how perceptrons can be used for classifying linearly separable data.
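To make the mechanics concrete before we build anything, here is a minimal sketch (added for illustration, with arbitrary example values) of the computation a single perceptron performs: a weighted sum of its inputs plus a bias, passed through a step function.
# Minimal sketch of a perceptron's forward pass (illustrative values only)
inputs = [2.0, 3.0]  # one value per input feature
weights = [0.5, -0.25]  # one weight per input
bias = 0.1
weighted_sum = sum(w * x for w, x in zip(weights, inputs)) + bias
output = 1 if weighted_sum >= 0 else 0  # step (threshold) activation
print(weighted_sum, output)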
Objective¶
The objective is to train a model with two weights, $w_1$ and $w_2$, one for each coordinate of a point $(x_1, x_2)$, along with a bias $b$. Setting the weighted sum $w_1x_1 + w_2x_2 + b$ to zero and solving for $x_2$ recovers the familiar slope-intercept form of a line, $y = mx + c$.
The model will address a simple classification task on a linearly separable dataset based on the following function:
$ f: \mathbb{N} \to \mathbb{N}, \quad f(x) = \begin{cases} x, & \text{if } x \bmod 2 = 0, \\ 2x, & \text{if } x \bmod 2 = 1. \end{cases} $
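For reference, the labeling function $f$ can be restated directly in Python; this small sketch (added for illustration, not used by the dataset generator below) simply mirrors the definition above.
# f(x) = x when x is even, 2x when x is odd (restating the definition above)
def f(x):
    return x if x % 2 == 0 else 2 * x

print(f(4), f(7))  # an even input maps to itself, an odd input is doubled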
Dataset¶
We will generate a dataset using only the Python Standard Library. Each point is $(x_1, f(x_1))$, labeled Class 0 when $x_1$ is even (so the two coordinates are equal) and Class 1 when $x_1$ is odd. This gives us a linearly separable, two-class dataset on which to train our perceptron classifier.
import random
def generate_dataset(num_items=20, start=0, stop=100):
random.seed(42)
dataset = []
x1_values = set()
while len(dataset) < num_items:
x1 = random.randint(start, stop)
if x1 in x1_values:
continue
x1_values.add(x1)
x2 = x1 if x1 % 2 == 0 else 2 * x1
y = (
0 if x1 == x2 else 1
) # (x1, x2) is labeled as Class 0 if x1 is even, and Class 1 otherwise
dataset.append((x1, x2, y))
return dataset
dataset = generate_dataset()
# let's now split the dataset into training and test sets
train_ratio = 0.8
num_train = int(len(dataset) * train_ratio)
dataset_train, dataset_test = dataset[:num_train], dataset[num_train:]
print(f"Training set (n={len(dataset_train)}): {dataset_train}")
print(f"Test set (n={len(dataset_test)}): {dataset_test}")
Training set (n=16): [(81, 162, 1), (14, 14, 0), (3, 6, 1), (94, 94, 0), (35, 70, 1), (31, 62, 1), (28, 28, 0), (17, 34, 1), (13, 26, 1), (86, 86, 0), (69, 138, 1), (11, 22, 1), (75, 150, 1), (54, 54, 0), (4, 4, 0), (27, 54, 1)]
Test set (n=4): [(29, 58, 1), (64, 64, 0), (77, 154, 1), (71, 142, 1)]
Visual Representation¶
Using Matplotlib and pandas, we will visually represent the training and test datasets. This will help us understand how our data is distributed and observe how the two classes might be separated. Let's proceed by plotting the data points with distinct markers and colors for each class and dataset type.
import matplotlib.pyplot as plt
import pandas as pd
def plot_datasets(train_dataset, test_dataset):
# Combine datasets into a DataFrame for easier handling
train_df = pd.DataFrame(train_dataset, columns=["x1", "x2", "class"])
train_df["set"] = "Train"
test_df = pd.DataFrame(test_dataset, columns=["x1", "x2", "class"])
test_df["set"] = "Test"
combined_df = pd.concat([train_df, test_df], ignore_index=True)
# Define colors and markers
colors = {0: "blue", 1: "red"}
markers = {"Train": "o", "Test": "x"}
# Plot each group using Matplotlib
fig, ax = plt.subplots()
for (dataset, cls), group in combined_df.groupby(["set", "class"]):
ax.scatter(
group["x1"],
group["x2"],
color=colors[cls],
label=f"{dataset} Dataset, Class {cls}",
s=30,
marker=markers[dataset],
)
# Manage legend and labels
handles, labels = ax.get_legend_handles_labels()
by_label = dict(zip(labels, handles))
ax.legend(by_label.values(), by_label.keys(), title="Dataset and Class", loc="best")
ax.set_xlabel("x1")
ax.set_ylabel("x2")
ax.set_title("Training and Test Datasets")
ax.grid(True)
plot_datasets(dataset_train, dataset_test)
plt.show()
Defining a Linear Classifier¶
With our dataset prepared, we now focus on the mathematical foundation enabling our model to classify inputs $x_{1}$ and $x_{2}$ into classes $0$ or $1$. Mathematically, this can be represented as:
$ c: \mathbb{R}^2 \to \{0,1\}, \quad c(x_{1}, x_{2}) = \begin{cases} 1, & \text{if } (x_{1}, x_{2}) \in \text{Class 1}, \\ 0, & \text{if } (x_{1}, x_{2}) \in \text{Class 0}. \end{cases} $
This classification uses the algebraic representation of a line in a Cartesian coordinate system, described by:
$ z(x_{1}, x_{2}) = w_{1}x_{1} + w_{2}x_{2} + b, $
where:
- $w_{1}$ and $w_{2}$ are weights that determine the orientation of the line; on the boundary $z = 0$, the slope with respect to the $x_1$-axis is $-w_{1}/w_{2}$ (assuming $w_{2} \neq 0$).
- $b$ is the bias (intercept term); it shifts the line, which crosses the $x_2$-axis at $-b/w_{2}$.
From the plotted graph above, the two classes are visibly linearly separable, justifying the use of a linear decision boundary. Training the weights $w_{1}$ and $w_{2}$ using the Perceptron algorithm provides an ideal approach to establish this boundary.
To illustrate, consider a line defined by $w_{1}=-1.5$, $w_{2}=1.1$, and $b=-10$ (in the code below, the bias parameter is named c). Plotting this line over the previous graph shows how well it separates our classes.
zx = lambda x1, x2, w1, w2, c: w1 * x1 + w2 * x2 + c
def plot_zx(w1, w2, c):
x2 = lambda x1: (
(-w1 * x1 - c) / w2 if w2 != 0 else -c / w1 if w1 != 0 else c
) # this is because the equation of the line is w1*x1 + w2*x2 + c = 0, hence x2 = (-w1*x1 - c) / w2
x1_values = range(0, 101)
x2_values = [x2(x1) for x1 in x1_values]
plt.plot(x1_values, x2_values, label=f"{w1}x1+{w2}x2+{c}=0")
plt.legend(loc="best")
def plot_datasets_and_zx(w1, w2, c):
plot_datasets(dataset_train, dataset_test)
plot_zx(w1, w2, c)
plot_datasets_and_zx(-1.5, 1.1, -10)
In this configuration, the decision boundary separates most of the data points well (though, as we will quantify shortly, not all of them). Other choices of $w_{1},\ w_{2},$ and $c$ separate the classes far less effectively. For instance, setting $w_{1}=0.1,\ w_{2}=0.1,$ and $c=0.5$ yields a much poorer decision boundary.
plot_datasets_and_zx(0.1, 0.1, 0.5)
In this particular case, $z = 0.1x_{1} + 0.1x_{2} + 0.5$ is positive for every point in our dataset, so the boundary lies entirely below the data and the classifier assigns every point to Class 1.
Evaluating the Performance of the Classifier¶
With $z = w_{1}x_{1} + w_{2}x_{2} + c$ defining our classifier's decision boundary, we have seen visually that some hand-picked values separate the classes reasonably well while others do not. Now, let's quantify that performance with the accuracy metric.
Defining the Classifier¶
Before evaluating the classifier's performance, let's clearly define it:
$ c: \mathbb{R}^2 \to \{0,1\}, \quad c(x_{1},x_{2}) = \begin{cases} 1, & \text{if } z(x_{1}, x_{2}) \geq 0, \\ 0, & \text{if } z(x_{1}, x_{2}) < 0. \end{cases} $
In essence, this means if a point $(x_1, x_2)$ is on or above the decision boundary $z(x_1, x_2)$, it is classified as $1$ (Class 1); otherwise, it is classified as $0$ (Class 0).
Let's implement the classifier in code, and then discuss how we can evaluate its performance effectively.
cx = lambda x1, x2, w1, w2, c: 1 if zx(x1, x2, w1, w2, c) >= 0 else 0
def accuracy(dataset, w1, w2, c):
print(f"Calculating accuracy on training set using w1={w1}, w2={w2}, c={c}")
correct = 0
for x1, x2, y in dataset:
if y == cx(x1, x2, w1, w2, c):
correct += 1
print(
f"Resulting accuracy: {correct}/{len(dataset)}, or {correct/len(dataset)*100:.2f}%"
)
return correct / len(dataset)
# Accuracy on the training set using the weights and bias from the first example above
accuracy(dataset_train, -1.5, 1.1, -10)
# Accuracy on the training set using the weights and bias from the second example above
accuracy(dataset_train, 0.1, 0.1, 0.5)
Calculating accuracy on training set using w1=-1.5, w2=1.1, c=-10
Resulting accuracy: 13/16, or 81.25%
Calculating accuracy on training set using w1=0.1, w2=0.1, c=0.5
Resulting accuracy: 10/16, or 62.50%
0.625
Discussion on Accuracy¶
Earlier, we observed how modifying the weights and bias affects the accuracy of our perceptron model. This variation occurs because each set of weights and bias defines a unique decision boundary, which impacts the model's ability to classify data points correctly. The primary goal is to determine the "optimal" values for these parameters, a process achieved through model training.
Model Training¶
Based on our analysis, we will train our perceptron model iteratively, fine-tuning the weights and bias. This training involves adjustment over multiple epochs—learning cycles through the dataset—allowing the model to incrementally improve accuracy. The idea is to iteratively update these parameters to better suit our classification task and dataset characteristics, ultimately enhancing the model's overall performance.
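Concretely, the training loop below uses the classic perceptron learning rule: for each training point it computes a prediction $\hat{y}$, and whenever the prediction is wrong it nudges the parameters in the direction of the error, scaled by the learning rate $\eta$ (learning_rate in the code):
$ w_{1} \leftarrow w_{1} + \eta\,(y - \hat{y})\,x_{1}, \qquad w_{2} \leftarrow w_{2} + \eta\,(y - \hat{y})\,x_{2}, \qquad c \leftarrow c + \eta\,(y - \hat{y}). $
When the prediction is correct, $y - \hat{y} = 0$ and the parameters are left untouched.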
# First, let's initialize the weights and bias to zero
w1, w2, c = 0, 0, 0
# Let's now define the learning rate
learning_rate = 0.1
# Let's now define the number of epochs
num_epochs = 5
# Create a DataFrame to store the details of the epochs
epoch_data = []
# Let's now start the training loop
for epoch in range(num_epochs):
print(f"Epoch {epoch+1}")
error = 0
for x1, x2, y in dataset_train:
z = zx(x1, x2, w1, w2, c)
y_hat = 1 if z >= 0 else 0
if y != y_hat:
error += 1 # Count the number of errors
w1 += learning_rate * (y - y_hat) * x1
w2 += learning_rate * (y - y_hat) * x2
c += learning_rate * (y - y_hat)
print(f" x1={x1}, x2={x2}, y={y}, z={z:.2f}, y_hat={y_hat}, w1={w1:.2f}, w2={w2:.2f}, c={c:.2f}")
# Append the details to the DataFrame
epoch_data.append({
"epoch": epoch + 1,
"x1": x1,
"x2": x2,
"y": y,
"z": z,
"y_hat": y_hat,
"w1": w1,
"w2": w2,
"c": c,
"err": error
})
epoch_details = pd.DataFrame(epoch_data)
# Display the DataFrame
epoch_details.head()
Epoch 1
x1=81, x2=162, y=1, z=0.00, y_hat=1, w1=0.00, w2=0.00, c=0.00
x1=14, x2=14, y=0, z=0.00, y_hat=1, w1=-1.40, w2=-1.40, c=-0.10
x1=3, x2=6, y=1, z=-12.70, y_hat=0, w1=-1.10, w2=-0.80, c=0.00
x1=94, x2=94, y=0, z=-178.60, y_hat=0, w1=-1.10, w2=-0.80, c=0.00
x1=35, x2=70, y=1, z=-94.50, y_hat=0, w1=2.40, w2=6.20, c=0.10
x1=31, x2=62, y=1, z=458.90, y_hat=1, w1=2.40, w2=6.20, c=0.10
x1=28, x2=28, y=0, z=240.90, y_hat=1, w1=-0.40, w2=3.40, c=0.00
x1=17, x2=34, y=1, z=108.80, y_hat=1, w1=-0.40, w2=3.40, c=0.00
x1=13, x2=26, y=1, z=83.20, y_hat=1, w1=-0.40, w2=3.40, c=0.00
x1=86, x2=86, y=0, z=258.00, y_hat=1, w1=-9.00, w2=-5.20, c=-0.10
x1=69, x2=138, y=1, z=-1338.70, y_hat=0, w1=-2.10, w2=8.60, c=0.00
x1=11, x2=22, y=1, z=166.10, y_hat=1, w1=-2.10, w2=8.60, c=0.00
x1=75, x2=150, y=1, z=1132.50, y_hat=1, w1=-2.10, w2=8.60, c=0.00
x1=54, x2=54, y=0, z=351.00, y_hat=1, w1=-7.50, w2=3.20, c=-0.10
x1=4, x2=4, y=0, z=-17.30, y_hat=0, w1=-7.50, w2=3.20, c=-0.10
x1=27, x2=54, y=1, z=-29.80, y_hat=0, w1=-4.80, w2=8.60, c=0.00
Epoch 2
x1=81, x2=162, y=1, z=1004.40, y_hat=1, w1=-4.80, w2=8.60, c=0.00
x1=14, x2=14, y=0, z=53.20, y_hat=1, w1=-6.20, w2=7.20, c=-0.10
x1=3, x2=6, y=1, z=24.50, y_hat=1, w1=-6.20, w2=7.20, c=-0.10
x1=94, x2=94, y=0, z=93.90, y_hat=1, w1=-15.60, w2=-2.20, c=-0.20
x1=35, x2=70, y=1, z=-700.20, y_hat=0, w1=-12.10, w2=4.80, c=-0.10
x1=31, x2=62, y=1, z=-77.60, y_hat=0, w1=-9.00, w2=11.00, c=0.00
x1=28, x2=28, y=0, z=56.00, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=17, x2=34, y=1, z=78.10, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=13, x2=26, y=1, z=59.70, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=86, x2=86, y=0, z=-309.70, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=69, x2=138, y=1, z=317.30, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=11, x2=22, y=1, z=50.50, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=75, x2=150, y=1, z=344.90, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=54, x2=54, y=0, z=-194.50, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=4, x2=4, y=0, z=-14.50, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=27, x2=54, y=1, z=124.10, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
Epoch 3
x1=81, x2=162, y=1, z=372.50, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=14, x2=14, y=0, z=-50.50, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=3, x2=6, y=1, z=13.70, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=94, x2=94, y=0, z=-338.50, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=35, x2=70, y=1, z=160.90, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=31, x2=62, y=1, z=142.50, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=28, x2=28, y=0, z=-100.90, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=17, x2=34, y=1, z=78.10, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=13, x2=26, y=1, z=59.70, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=86, x2=86, y=0, z=-309.70, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=69, x2=138, y=1, z=317.30, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=11, x2=22, y=1, z=50.50, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=75, x2=150, y=1, z=344.90, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=54, x2=54, y=0, z=-194.50, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=4, x2=4, y=0, z=-14.50, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=27, x2=54, y=1, z=124.10, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
Epoch 4
x1=81, x2=162, y=1, z=372.50, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=14, x2=14, y=0, z=-50.50, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=3, x2=6, y=1, z=13.70, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=94, x2=94, y=0, z=-338.50, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=35, x2=70, y=1, z=160.90, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=31, x2=62, y=1, z=142.50, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=28, x2=28, y=0, z=-100.90, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=17, x2=34, y=1, z=78.10, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=13, x2=26, y=1, z=59.70, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=86, x2=86, y=0, z=-309.70, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=69, x2=138, y=1, z=317.30, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=11, x2=22, y=1, z=50.50, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=75, x2=150, y=1, z=344.90, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=54, x2=54, y=0, z=-194.50, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=4, x2=4, y=0, z=-14.50, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=27, x2=54, y=1, z=124.10, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
Epoch 5
x1=81, x2=162, y=1, z=372.50, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=14, x2=14, y=0, z=-50.50, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=3, x2=6, y=1, z=13.70, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=94, x2=94, y=0, z=-338.50, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=35, x2=70, y=1, z=160.90, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=31, x2=62, y=1, z=142.50, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=28, x2=28, y=0, z=-100.90, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=17, x2=34, y=1, z=78.10, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=13, x2=26, y=1, z=59.70, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=86, x2=86, y=0, z=-309.70, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=69, x2=138, y=1, z=317.30, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=11, x2=22, y=1, z=50.50, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=75, x2=150, y=1, z=344.90, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
x1=54, x2=54, y=0, z=-194.50, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=4, x2=4, y=0, z=-14.50, y_hat=0, w1=-11.80, w2=8.20, c=-0.10
x1=27, x2=54, y=1, z=124.10, y_hat=1, w1=-11.80, w2=8.20, c=-0.10
| | epoch | x1 | x2 | y | z | y_hat | w1 | w2 | c | err |
|---|---|---|---|---|---|---|---|---|---|---|
| 0 | 1 | 27 | 54 | 1 | -29.8 | 0 | -4.8 | 8.6 | 0.0 | 8 |
| 1 | 2 | 27 | 54 | 1 | 124.1 | 1 | -11.8 | 8.2 | -0.1 | 5 |
| 2 | 3 | 27 | 54 | 1 | 124.1 | 1 | -11.8 | 8.2 | -0.1 | 0 |
| 3 | 4 | 27 | 54 | 1 | 124.1 | 1 | -11.8 | 8.2 | -0.1 | 0 |
| 4 | 5 | 27 | 54 | 1 | 124.1 | 1 | -11.8 | 8.2 | -0.1 | 0 |
Interpreting the Results¶
After training our model, let's examine the results. Notice how the weights $w_1$ and $w_2$, along with the bias $c$, change with each epoch. These adjustments demonstrate the perceptron's learning as it becomes more adept at classifying data points. Each iteration helps minimize classification errors, thereby enhancing the model's predictive accuracy.
We track the number of misclassified points in each epoch to gauge the learning process; the err column in the DataFrame records this progression. As the model learns, the misclassifications decline, showing that it is getting better at separating the two classes. In fact, by the end of the second epoch the weights and bias classify every training point correctly, and they remain unchanged from the third epoch onward.
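The accuracy above was measured only on the training set. As an additional sanity check (a sketch added here, not part of the original run), the same helper can be applied to the held-out test set with the trained parameters:
# Evaluate the trained parameters on the held-out test set (added sketch; note that
# the helper's print message says "training set" regardless of the dataset passed in)
accuracy(dataset_test, w1, w2, c)
accuracy(dataset_train, w1, w2, c)  # for comparison, accuracy on the training set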
Visualizing the Decision Boundary¶
With the finalized weights and bias, we can plot the decision boundary—a line modeled by the equation $z = w_{1}x_{1} + w_{2}x_{2} + c$. This plot illustrates how the perceptron separates different classes in the dataset. Interactive visualizations below enhance understanding by showing how tweaks in weights and bias affect the decision boundary.
plot_datasets_and_zx(w1, w2, c)
As we can see, the decision boundary effectively separates the two classes in the dataset, indicating that the model has learnt to classify the data points based on the values of $w_{1}$, $w_{2}$, and $c$. Isn't that fascinating?
Interactive Visualization¶
To reinforce this understanding, let's build an interactive visualization. This will allow us to see how altering the weights and the bias shifts the decision boundary. Such an interactive component will enhance our grasp of how the model distinguishes between the two classes.
from ipywidgets import interact
trained_w1 = w1
trained_w2 = w2
trained_c = c
print(f"Trained weights: w1={trained_w1}, w2={trained_w2}, c={trained_c}")
def plot_dynamic_line(w1=trained_w1, w2=trained_w2, c=trained_c):
plot_datasets(dataset_train, dataset_test)
plot_zx(w1, w2, c)
# This will display an interactive plot that allows you to change the weights and bias. The default values are the trained weights and bias.
interact(plot_dynamic_line, w1=(-20, 20, 0.5), w2=(-20, 20, 0.5), c=(-50, 50, 0.5))
Trained weights: w1=-11.800000000000002, w2=8.2, c=-0.1
interactive(children=(FloatSlider(value=-11.800000000000002, description='w1', max=20.0, min=-20.0, step=0.5),…
<function __main__.plot_dynamic_line(w1=-11.800000000000002, w2=8.2, c=-0.1)>
Play with the "knobs" $w_1, w_2$, and $c$ to see how the decision boundary changes. As you adjust the weights and bias, the line's position and angle will change, offering a hands-on way to visualize how the model makes classifications based on these parameters.
Conclusion¶
This notebook presented an introductory implementation of a perceptron model with a focus on young learners. We generated and visualized a dataset, developed a linear classifier, evaluated its performance, and iteratively trained the model to refine its accuracy. By analyzing the performance improvements, it became evident that the error rate decreased over time, highlighting the model’s capability to learn effectively by the second epoch.
Limitations and Future Work¶
Though the perceptron is effective for linearly separable data, it cannot correctly classify datasets that no single straight line can divide; the classic counterexample is XOR (see the sketch at the end of this notebook). For non-linearly separable data, more complex models are required. Future endeavors might include exploring:
- The Adaptive Linear Neuron (Adaline), leveraging continuous linear activations.
- Logistic regression models using sigmoid activations.
- Multi-layer Perceptrons (MLPs) for more complex datasets.
- Convolutional Neural Networks (CNNs) for image data.
- Recurrent Neural Networks (RNNs) for sequence data.
- Generative Adversarial Networks (GANs) for creating data samples.
- Transformer models for diverse natural language processing tasks including encoder-only, decoder-only, and encoder-decoder configurations.
These projects promise further learning and exploration, so stay tuned for future advancements!
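To make the linear-separability limitation concrete, the short sketch below (an addition, reusing this notebook's update rule under the same assumptions) tries to fit the XOR labeling. Because no single line can separate XOR's two classes, the per-epoch error count never reaches zero, no matter how long we train.
# Sketch: the perceptron update rule from this notebook applied to XOR (not linearly separable)
xor_data = [(0, 0, 0), (0, 1, 1), (1, 0, 1), (1, 1, 0)]
xw1, xw2, xc = 0.0, 0.0, 0.0  # separate names so the trained w1, w2, c above stay untouched
eta = 0.1
for epoch in range(50):
    errors = 0
    for x1, x2, y in xor_data:
        y_hat = 1 if xw1 * x1 + xw2 * x2 + xc >= 0 else 0
        if y != y_hat:
            errors += 1
            xw1 += eta * (y - y_hat) * x1
            xw2 += eta * (y - y_hat) * x2
            xc += eta * (y - y_hat)
print(f"Misclassifications in the final epoch: {errors}")  # stays above zero for XOR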