LearningFromData/perceptron.py at master · monkey0105/LearningFromData · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
# -*- coding: utf-8 -*-
__author__ = 'wangjz'

import random
import numpy as np

"""
Learning From Data
HW 1
The Perceptron Learning Algorithm
NOTE: the main function in this directory currently does not work.

In this problem, you will create your own target function f and data set D to see how the
Perceptron Learning Algorithm works. Take d = 2 so you can visualize the problem,
and assume X = [−1, 1] × [−1, 1] with uniform probability of picking each x∈X.
In each run, choose a random line in the plane as your target function f
(do this by taking two random, uniformly distributed points in [−1, 1] × [−1, 1] and
taking the line passing through them), where one side of the line maps to +1 and the other maps to −1.
Choose the inputs xn of the data set as random points (uniformly in X ), and evaluate the target function on each xn
to get the corresponding output yn. Now, in each run, use the Perceptron Learning Algorithm to find g.
Start the PLA with the weight vector w being all zeros, and at each iteration have the algorithm
choose a point randomly from the set of misclassified points. We are interested in two quantities:
the number of iterations that PLA takes to converge to g, and the disagreement between f and g which is
P[f(x) ≠ g(x)] (the probability that f and g will disagree on their classification of a random point).
You can either calculate this probability exactly, or approximate it by generating a sufficiently large,
separate set of points to estimate it. In order to get a reliable estimate for these two quantities, you should
repeat the experiment for 1000 runs (each run as specified above) and take the average over these runs.
"""


def update_w(w, item):
    """Apply one perceptron update step and return the new weights.

    Args:
        w: Current weights. Expected to be a column vector of shape (d, 1)
            so that the addition below is element-wise.
        item: A sample given as an ``(x, y)`` pair, where ``x`` holds the d
            input features and ``y`` is the sample's label.

    Returns:
        ``w + y * x`` with ``x`` treated as a (d, 1) column vector.
    """
    x, y = item[0], item[1]
    # reshape() hands back a new view instead of rewriting the caller's
    # array shape in place, and -1 infers the feature count rather than
    # hard-coding it to 3.
    x_column = np.asarray(x).reshape(-1, 1)
    return w + y * x_column


def dot_prodcut(a1, a2):
    """Return the sum of a1[i] * a2[i] taken over every index i of a1."""
    return sum(a1[pos] * a2[pos] for pos in range(len(a1)))


def sign(a1, a2):
    """Classify by the dot product of a1 and a2.

    Returns 1 when np.dot(a1, a2) is greater than or equal to zero and
    -1 otherwise.
    """
    projection = np.dot(a1, a2)
    if projection >= 0:
        return 1
    return -1


class Perceptron:
    """Perceptron Learning Algorithm trained on a labelled data set.

    Attributes:
        num_iterations: Number of weight updates made by the most recent
            call to gd_algorithm().
        w: Current weight vector, stored as a (d, 1) column.
    """

    def __init__(self, training_X, training_Y, init_w=None):
        """Store the training set and the starting weights.

        Args:
            training_X: (N, d) array-like, one sample per row.
            training_Y: Labels for the N samples, either as an (N, 1)
                column or as a flat sequence of length N.
            init_w: Starting weights with d entries. When omitted (or
                empty) the weights start as all zeros.
        """
        training_X = np.asarray(training_X)
        self.__N = training_X.shape[0]
        self.__training_X = training_X
        # Labels are read below as training_Y[index, 0], so keep a column.
        self.__training_Y = np.asarray(training_Y).reshape(-1, 1)
        self.num_iterations = 0
        # A shared mutable default ([]) is avoided; an empty weight vector
        # cannot be dotted with a sample, so fall back to zeros instead.
        if init_w is None or np.size(init_w) == 0:
            init_w = np.zeros((training_X.shape[1], 1))
        self.w = np.asarray(init_w).reshape(-1, 1)

    def gd_algorithm(self, max_iterations=None):
        """Update the weights until no training sample is misclassified.

        Every pass collects the samples whose sign(x, w) differs from their
        label, stops if there are none, and otherwise applies update_w() to
        one of them chosen uniformly at random. The results are stored in
        self.w and self.num_iterations.

        Args:
            max_iterations: Optional cap on the number of weight updates.
                With the default (None) the loop only ends once every
                sample is classified correctly.
        """
        weights = self.w
        num_iteration = 0
        while True:
            # Find misclassified points. Rows are sliced afresh on every
            # pass rather than cached, so nothing done to a previously
            # chosen sample carries over to the next pass.
            mis_classify = []
            for index in range(self.__N):
                x = self.__training_X[index, :]
                y = self.__training_Y[index, 0]
                if sign(x, weights) != y:
                    mis_classify.append((x, y))
            if not mis_classify:
                break
            if max_iterations is not None and num_iteration >= max_iterations:
                break
            num_iteration += 1

            # Randomly choose a misclassified point and apply the update.
            mis_item = random.choice(mis_classify)
            weights = update_w(weights, mis_item)

        self.num_iterations = num_iteration
        self.w = weights


def generate_training_date(n):
    """Generate a random linear target function and n points labelled by it.

    The target is the line through two points drawn uniformly from
    [-1, 1] x [-1, 1], expressed as x1 + w[1] * x2 + w[2] = 0.

    Args:
        n: Number of training points to generate.

    Returns:
        A ``(training_data, w)`` pair. ``training_data`` is a list of n rows
        ``[label, x1, x2, 1]`` where label is the result of ``sign(w, p)``
        for ``p = [x1, x2, 1]``; ``w`` is the list ``[1, w1, w2]``.
    """
    # Generate the target function (represented by vector w).
    while True:
        p1 = [random.uniform(-1, 1), random.uniform(-1, 1)]
        p2 = [random.uniform(-1, 1), random.uniform(-1, 1)]
        # w is normalised so that w[0] == 1, which divides by
        # (p1[1] - p2[1]). Redraw when both points share a y-coordinate
        # instead of raising ZeroDivisionError.
        if p1[1] != p2[1]:
            break
    w = [1, 0, 0]
    w[1] = (p2[0] - p1[0]) / (p1[1] - p2[1])
    w[2] = - (p1[0] * w[0] + p1[1] * w[1])

    # Generate n random points in [-1, 1] x [-1, 1]; the trailing 1 is the
    # constant coordinate that multiplies w[2].
    training_data = []
    for _ in range(n):
        p = [random.uniform(-1, 1), random.uniform(-1, 1), 1]
        p = [sign(w, p)] + p  # prepend the label
        training_data.append(p)

    return training_data, w


def main():
    """Run the PLA experiment and print summary statistics.

    For each run a fresh target function and training set are generated, a
    Perceptron is trained from all-zero weights, and the agreement between
    the target f and the learned g is estimated on random test points.
    Prints, in order: the max, min and mean number of iterations, then the
    max, min and mean agreement rate.
    """
    # Let's do the experiment
    num_points = 100
    num_random_test = 100
    num_runs = 1000
    iter_list = []
    p_agree = []

    for _ in range(num_runs):
        td, f = generate_training_date(num_points)
        # Each row of td is [label, x1, x2, 1]; Perceptron takes the
        # features and the labels as separate 2-D arrays.
        data = np.array(td, dtype=float)
        features = data[:, 1:]
        labels = data[:, :1]
        perce = Perceptron(features, labels, np.zeros((features.shape[1], 1)))
        perce.gd_algorithm()
        iter_list.append(perce.num_iterations)
        g = perce.w

        agree = 0
        for _ in range(num_random_test):
            ran_p = [random.uniform(-1, 1), random.uniform(-1, 1), 1]
            if sign(ran_p, f) == sign(ran_p, g):
                agree += 1

        p_agree.append(1.0 * agree / num_random_test)

    # Single-argument print(...) behaves the same under Python 2 and 3.
    print(max(iter_list))
    print(min(iter_list))
    print(1.0 * sum(iter_list) / len(iter_list))

    print(max(p_agree))
    print(min(p_agree))
    print(1.0 * sum(p_agree) / len(p_agree))

# Run the experiment only when this file is executed as a script, not when
# it is imported as a module.
if __name__ == "__main__":
    main()