python - 如何在 Python 中实现感知机？-6ren

python - 如何在 Python 中实现感知机？

转载作者：太空宇宙更新时间：2023-11-04 04:55:18

我正在努力学习 Daume 的书

http://ciml.info/dl/v0_99/ciml-v0_99-ch04.pdf (第 43 页)。

我想只使用 numpy、不使用 scikit-learn 库，在 Python 中拟合普通（vanilla）感知机模型。

书上给出了算法

我们如何在实践中实现该模型？

到目前为止，我已经学会了如何读取数据和标签:

def read_data(infile):
    """Load a numeric text table and split it into features and labels.

    infile: file name or file-like object handed to ``np.loadtxt``; every
            row holds the feature values followed by the label.

    Returns (X, Y): X is the 2-D array of all columns but the last,
    Y is the 1-D array holding the last column.
    """
    # ndmin=2 keeps a single-row file two-dimensional; without it loadtxt
    # returns a 1-D array and the column slicing below raises IndexError.
    data = np.loadtxt(infile, ndmin=2)
    X = data[:, :-1]
    Y = data[:, -1]

    return X, Y

如能得到帮助，我将不胜感激！！

最佳答案

我想到的一种方法是:

(随时欢迎更好的想法!!)

#!python
# -*- coding: utf-8 -*-#
"""
Perceptron Algorithm.

@author: Bhishan Poudel

@date:  Oct 31, 2017

"""
# Imports
import numpy as np
import matplotlib.pyplot as plt
from numpy.linalg import norm
import os, shutil
np.random.seed(100)

def read_data(infile):
    """Load a numeric text table and split it into features and labels.

    infile: file name or file-like object handed to ``np.loadtxt``; every
            row holds the feature values followed by the label.

    Returns (X, Y): X is the 2-D array of all columns but the last,
    Y is the 1-D array holding the last column.
    """
    # ndmin=2 keeps a single-row file two-dimensional; without it loadtxt
    # returns a 1-D array and the column slicing below raises IndexError.
    data = np.loadtxt(infile, ndmin=2)
    X = data[:, :-1]
    Y = data[:, -1]

    return X, Y

def plot_boundary(X,Y,w,epoch):
    """Scatter-plot a two-class 2-D data set together with the decision boundary.

    X: data matrix without bias column; its first two columns are plotted.
    Y: labels, -1 for the negative class and 1 for the positive class.
    w: weight vector. Length 3 is read as [bias, w_x, w_y] (bias first, the
       layout produced by perceptron_sgd) and drawn as the line
       bias + w_x*x + w_y*y = 0. Length 2 is drawn as two arrows orthogonal
       to w, anchored at the point (w[0], w[1]).
    epoch: number shown in the plot title.
    """
    try:
        plt.style.use('seaborn-darkgrid')
    except (OSError, ValueError):
        # The style may be unavailable in the installed matplotlib;
        # keep the default look instead of failing.
        pass

    # Split the samples by class label
    labels = np.array(Y)
    XN = X[np.where(labels == -1)]
    XP = X[np.where(labels == 1)]

    # Plot limits; computed up front because the boundary line spans them
    x_min, x_max = X[:, 0].min() - 1, X[:, 0].max() + 1
    y_min, y_max = X[:, 1].min() - 1, X[:, 1].max() + 1

    # Plot the two classes
    plt.scatter(XN[:,0],XN[:,1],c='b', marker='_', label="Negative class")
    plt.scatter(XP[:,0],XP[:,1],c='r', marker='+', label="Positive class")
    plt.title("Perceptron Algorithm iteration: {}".format(epoch))

    # Decision boundary: the set of points where bias + w_x*x + w_y*y == 0
    if len(w) == 3:
        bias, w_x, w_y = w
        if w_y != 0:
            # Draw across the whole visible x range rather than between the
            # axis intercepts, which degenerate when bias == 0 or w_x == 0.
            xs = np.array([x_min, x_max])
            ys = -(bias + w_x * xs) / w_y
            plt.plot(xs, ys, '--g', label='Decision Boundary')
        elif w_x != 0:
            # w_y == 0: the boundary is the vertical line x = -bias / w_x
            x_cut = -bias / w_x
            plt.plot([x_cut, x_cut], [y_min, y_max], '--g',
                     label='Decision Boundary')
        # w_x == w_y == 0 defines no line, so nothing is drawn.

    if len(w) == 2:
        # Two arrows starting at (w[0], w[1]) and pointing along
        # (-w[1], w[0]) and (w[1], -w[0]), i.e. orthogonal to w.
        x2=[ w[0],  w[1],  -w[1],  w[0]]
        x3=[ w[0],  w[1],   w[1], -w[0]]

        x2x3 =np.array([x2,x3])
        XX,YY,U,V = list(zip(*x2x3))
        ax = plt.gca()
        ax.quiver(XX,YY,U,V,scale=1, color='g')

    # Axis labels
    plt.xlabel('X')
    plt.ylabel('Y')

    # Apply the limits
    plt.xlim(x_min,x_max)
    plt.ylim(y_min,y_max)

    # Faint lines through the origin
    plt.axhline(y=0, color='k', linestyle='--',alpha=0.2)
    plt.axvline(x=0, color='k', linestyle='--',alpha=0.2)
    plt.grid(True)
    plt.legend(loc=1)
    plt.show()

    # Always close the plot
    plt.close()


def predict(X,w):
    """Return the sign (-1, 0 or 1) of the linear score of X under weights w."""
    scores = np.dot(X, w)
    return np.sign(scores)

def plot_contour(X, Y, w, mesh_stepsize, outfile="Perceptron.png"):
    """Plot both classes on top of the regions predicted for each label.

    X: data matrix without bias column; its first two columns are plotted.
    Y: labels, -1 for the negative class and 1 for the positive class.
    w: weight vector [bias, w_x, w_y], matching the (1, x, y) rows that are
       built for the mesh points below.
    mesh_stepsize: spacing of the grid on which the prediction is evaluated.
    outfile: path the figure is saved to before it is shown.
    """
    try:
        plt.style.use('seaborn-darkgrid')
    except (OSError, ValueError):
        # The style may be unavailable in the installed matplotlib;
        # keep the default look instead of failing.
        pass

    # Split the samples by class label
    labels = np.array(Y)
    XN = X[np.where(labels == -1)]
    XP = X[np.where(labels == 1)]

    # Plot the two classes with + and - markers
    fig, ax = plt.subplots()
    ax.set_title('Perceptron Algorithm')
    plt.xlabel("X")
    plt.ylabel("Y")
    plt.plot(XN[:,0],XN[:,1],'b_', markersize=8, label="Negative class")
    plt.plot(XP[:,0],XP[:,1],'y+', markersize=8, label="Positive class")
    plt.legend()

    # Build a rectangular mesh one unit wider than the data on every side,
    # predict a label for each mesh point and colour the plane accordingly.
    x_min, x_max = X[:, 0].min() - 1, X[:, 0].max() + 1
    y_min, y_max = X[:, 1].min() - 1, X[:, 1].max() + 1
    xx, yy = np.meshgrid(np.arange(x_min, x_max, mesh_stepsize),
                         np.arange(y_min, y_max, mesh_stepsize))

    # Flatten the grid so every mesh point becomes one (1, x, y) row
    xxr = xx.ravel()
    yyr = yy.ravel()
    ones = np.ones(len(xxr))

    # Predicted sign for each mesh point
    Xvals  = np.c_[ones, xxr, yyr]
    scores = predict(Xvals, w)

    # Back to the grid shape expected by contourf
    scores = scores.reshape(xx.shape)
    ax.contourf(xx, yy, scores, cmap=plt.cm.Paired)

    # Save, show and release the figure
    plt.savefig(outfile)
    plt.show()
    plt.close()

def perceptron_sgd(X, Y,epochs):
    """
    Train a perceptron by sweeping over the samples in their given order.

    X: data matrix without bias.
    Y: target; used as a signed multiplier in the update (e.g. -1 / +1).
    epochs: maximum number of sweeps over the data.

    Returns (w, final_iter). w carries the bias weight in position 0.
    final_iter is the index of the first sweep without any update, or
    `epochs` when every sweep updated w at least once.
    """
    # Prepend a column of ones so that w[0] acts as the bias term
    bias_column = np.ones((X.shape[0], 1))
    augmented = np.concatenate((bias_column, X), axis=1)

    w = np.zeros(augmented.shape[1])

    for epoch in range(epochs):
        print("\n")
        print("epoch: {} {}".format(epoch, '-'*30))

        n_updates = 0
        for idx, sample in enumerate(augmented):
            target = Y[idx]
            margin = np.dot(sample, w)*target
            wrong = margin <= 0

            if not wrong:
                print('misclassified? no  w: {}'.format(w))
                continue

            # Zero or negative margin: shift w by target * sample
            w = w + sample*target
            n_updates += 1
            print('misclassified? yes  w: {} '.format(w))

        # A sweep without updates means nothing more will change
        if n_updates == 0:
            return w, epoch

    return w, epochs

def gen_lin_separable_data(data, data_tr, data_ts, data_size, n_test=20):
    """Write a two-class 2-D Gaussian toy data set to three text files.

    Each class gets int(data_size/2) samples: label 1 is centred at (0, 2)
    and label -1 at (2, 0), both with the same covariance. Rows are written
    as "x y label", alternating between the positive and the negative class.

    data: path that receives all rows.
    data_tr: path that receives the training rows (all but the last
             `n_test` samples of each class).
    data_ts: path that receives the test rows (the last `n_test` samples
             of each class).
    data_size: total number of samples requested over both classes.
    n_test: samples per class reserved for the test file. It is clamped to
            the number of samples per class, so small data sets no longer
            produce negative indices (duplicated rows or IndexError).

    NOTE(review): the two clouds are random draws, so despite the function
    name a given sample is not guaranteed to be linearly separable.
    """
    per_class = int(data_size/2)
    mean1 = np.array([0, 2])
    mean2 = np.array([2, 0])
    cov = np.array([[0.8, 0.6], [0.6, 0.8]])
    # Draw order (positive class first) is kept so seeded runs are unchanged
    X1 = np.random.multivariate_normal(mean1, cov, size=per_class)
    X2 = np.random.multivariate_normal(mean2, cov, size=per_class)

    # One formatted row per sample, positive and negative interleaved
    row_fmt = '{:5.2f} {:5.2f} {:5.0f} \n'
    rows = []
    for pos, neg in zip(X1, X2):
        rows.append(row_fmt.format(pos[0], pos[1], 1.0))
        rows.append(row_fmt.format(neg[0], neg[1], -1.0))

    # Two rows per sample pair, hence the factor 2 in the split position
    n_test = max(0, min(n_test, per_class))
    split = 2 * (per_class - n_test)

    with open(data,'w') as fo, \
         open(data_tr,'w') as fo1, \
         open(data_ts,'w') as fo2:
        fo.writelines(rows)
        fo1.writelines(rows[:split])
        fo2.writelines(rows[split:])

def main():
    """Generate the toy data, train the perceptron and plot the outcome."""

    # Write the full, training and test sets (200 samples in total)
    all_path, train_path, test_path = 'data.txt', 'data_train.txt', 'data_test.txt'
    gen_lin_separable_data(all_path, train_path, test_path, 200)

    # Load the train / test splits back from disk
    X_train, Y_train = read_data(train_path)
    X_test, Y_test = read_data(test_path)

    # Fit with at most 20 sweeps over the training data
    weights, stop_epoch = perceptron_sgd(X_train, Y_train, 20)
    print('w = ', weights)

    # Boundary plot, then the filled-region plot on a 0.01 mesh
    plot_boundary(X_test, Y_test, weights, stop_epoch)
    plot_contour(X_test, Y_test, weights, 0.01)

# Run the demo only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()

决策边界如下所示:

关于python - 如何在 Python 中实现感知机？，我们在Stack Overflow上找到一个类似的问题： https://stackoverflow.com/questions/47213847/

文章推荐： python - 环境 : ‘jupyter’ : No such file or directory

文章推荐： javascript - Javascript 中的 XMLRPC 客户端

文章推荐： c - 如何在 32 位和 64 位机器的头文件中获得相同的结构？

JavaFX DPI 感知
晚安，我正在与一些合作伙伴使用 javaFx 制作一个应用程序；我们的想法是它将在 Windows 和 Linux 中使用。我们进行了一些测试，发现应用程序在两种操作系统中的显示有所不同。我们正在使
winapi - 意外处理 DPI 感知
我有一项服务，可通过 CreateProcessAsUser 将可执行文件启动到用户 session 中，并在 STARTUPINFO 参数中指定桌面。它运行良好。我的可执行文件没有显示出来，也没有
hadoop 管道写入和 Rack 感知
当每个文件写入集群时，HDFS 会创建一个复制管道。假设有两个 Rack 1 和 5。根据 Rack 感知，第一个 block 将被保存到 Rack 1，其他两个复制 block 将被插入 Rack
python - 如何在不更改值的情况下使时间对象 TZ 感知？
我正在做一个 Django 项目，我对时区感到困惑。我有一个事件对象，它有 publish_start 和 publish_end 日期。控制台输出示例； campaingObject.publi
windows - 安装字体并让 Windows 感知
我在下面有一个函数，它通过将字体 (.ttf) 复制到 Windows 字体文件夹然后触发 WM_FONTCHANGE 消息将其安装到 Windows 中。但是，该字体不会立即在 Windows 资源
java - Stacktrace 感知 grep
是否有类似 grep 的 Unix/Linux 命令行工具可以理解由 log4j 或 logback 打印的日志文件中的 Java 堆栈跟踪？该工具应该理解堆栈跟踪由多行组成。典型的用例是在查看存储
Java 感知 merge 命令
每次我在我的 SCM 中看到诸如导入或方法签名更改(例如变量的重命名)之类的冲突时，我想知道是否有类似语言感知的 diff/merge 方法可以处理更烦人的小更改发生在共享项目上。有什么东西可以在 U
cassandra - token 感知 Astyanax 连接池在节点上连接而不在节点上分配连接
我使用 astyanax 连接池定义如下: ipSeeds = "LOAD_BALANCER_HOST:9160"; conPool.setSeeds(ipSeeds) .setDiscoveryTy
utf-8 - UTF8 感知 printf？
据我所知，OCaml 中的字符串只是简单的字节序列。他们没有编码的概念。这对于大多数用途来说都很好。但是，标准库的某些部分对以单字节字符集编码的字符串做出了假设，例如 printf 的对齐功能: #
utf-8 - UTF8 感知 printf？
据我所知，OCaml 中的字符串只是简单的字节序列。他们没有编码的概念。这对于大多数用途来说都很好。但是，标准库的某些部分对以单字节字符集编码的字符串做出了假设，例如 printf 的对齐功能: #
c# - 使用 Cookie 感知 WebClient
我正在使用 this enhanced version of WebClient登录网站: public class CookieAwareWebClient : WebClient {
android - ACL_ACCESS_DENIED 感知 API - Android
我正在尝试将 Awareness API 集成到一个新项目中，但我遇到了一条错误消息:ACL_ACCESS_DENIED 状态代码:7503。我也在其他项目中集成了 Awareness API，但上
java - session 感知 spring bean
有什么方法可以定义一个 spring bean，当 session 中的数据发生变化时，它会得到通知？如果可能的话，我还想知道纯 Java 解决方案。我想要的只是当我在 httpsession 中添
c++ - NUMA 感知 Cpp 容器
有没有方便有效的方式以 NUMA 感知方式使用 cpp 标准容器 API？我想在 cpp 环境中执行 OpenMP 并行稀疏矩阵 vector 乘法。要分配和初始化与 NUMA 域有关的 vecto
c++ - SetWindowPos() 跨进程 DPI 感知
我正在创建一个程序，它使用 SetWindowPos() 从另一个进程移动/调整窗口大小。我自己的程序是 PROCESS_PER_MONITOR_DPI_AWARE。其他程序可以是 PROCESS_D
java - JTA 感知 JDBC 连接池
我一直在研究许多 JDBC 连接池，但我有一个特定的要求，即池需要是 JTA 感知的，这给我留下了 Apache DBCP 和 OW2 XAPool 的简短列表。我查看的其他池(c3p0、Proxoo
php - 如何使 file_get_contents session 感知？
我有一个 php 脚本，可以在服务器上发出一系列请求。第一个请求将是登录请求。问题是 file_get_contents 似乎每次都创建一个新 session ，那么我怎样才能让它感知 sessio
numpy - 从整数创建 tz 感知 pandas 时间戳对象
我有一个整数，表示 unix 纪元之后的微秒数。 (格林威治标准时间) 如何使用 astype 将 1349863207154117 转换为 pandas.Timestamp("2012-10-10T
web-services - 如何使@WebService Spring 感知
我有一个 Web 服务，我正在尝试将变量 Autowiring 到其中。这是类(class): package com.xetius.isales.pr7.service; import java.u
wpf - 禁用 WPF 应用程序的 DPI 感知
再会! 我已经在 WPF 应用程序上工作了一段时间(作为一种学习体验，哦，天哪，这是一种学习体验)，它终于可以发布了。发布意味着将其安装在我的 HTPC 上，用于浏览我的电影收藏。我在运行 1920

太空宇宙

个人简介

我是一名优秀的程序员,十分优秀！

作者热门文章

滴滴打车优惠券免费领取

全站热门文章

首页

博学

6Ren·AI

商城

python - 如何在 Python 中实现感知机？