c - 感知器学习算法不收敛到 0-6ren

c - 感知器学习算法不收敛到 0

转载作者：太空狗更新时间：2023-10-29 16:16:52

这是我在 ANSI C 中的感知器实现:

#include <stdio.h>
#include <stdlib.h>
#include <math.h>
#include <time.h>

// Returns a pseudo-random float in the closed range [0, 1].
//
// The generator is seeded exactly once, on the first call. Reseeding with
// time(NULL) on every call restarts rand() from the same seed whenever two
// calls fall within the same clock second, which makes consecutive calls
// return the same value (and so gives both perceptron weights the same
// starting point).
float randomFloat()
{
    static int seeded = 0;

    if (!seeded)
    {
        srand((unsigned int)time(NULL));
        seeded = 1;
    }

    return (float)rand() / (float)RAND_MAX;
}

// Classifies the point (x, y) with a two-weight linear threshold:
// yields 1 when x*weights[0] + y*weights[1] is >= 0, and -1 otherwise.
int calculateOutput(float weights[], float x, float y)
{
    float activation = weights[0] * x + weights[1] * y;

    if (activation >= 0)
    {
        return 1;
    }
    return -1;
}

// Trains a two-weight perceptron on the samples stored in test1.txt.
//
// Each record of the file is "x y label"; a label of 0 is remapped to -1 so
// that it matches the +1/-1 values returned by calculateOutput().
// Training repeats full passes (epochs) over the samples until a pass makes
// no error or MAX_EPOCHS passes have been run, so data that this model
// cannot separate no longer causes an endless loop.
//
// Returns 0 after training, 1 if the file cannot be opened or yields no
// samples.
int main(int argc, char *argv[])
{
    enum { MAX_PATTERNS = 208, MAX_EPOCHS = 100 };

    // X, Y coordinates of the training set.
    float x[MAX_PATTERNS], y[MAX_PATTERNS];

    // Training set outputs.
    int outputs[MAX_PATTERNS];

    // Number of samples actually read from the file.
    int patternCount = 0;

    FILE *fp;

    (void)argc;
    (void)argv;

    if ((fp = fopen("test1.txt", "r")) == NULL)
    {
        printf("Cannot open file.\n");
        return 1;
    }

    // Stop at the array capacity and at the first record that does not parse
    // as three fields. Comparing against EOF alone never terminates on a
    // malformed record (fscanf returns 0 without consuming it) and writes
    // past the arrays when the file holds more than MAX_PATTERNS records.
    while (patternCount < MAX_PATTERNS &&
           fscanf(fp, "%f %f %d", &x[patternCount], &y[patternCount],
                  &outputs[patternCount]) == 3)
    {
        if (outputs[patternCount] == 0)
        {
            outputs[patternCount] = -1;
        }
        printf("%f   %f   %d\n", x[patternCount], y[patternCount], outputs[patternCount]);
        patternCount++;
    }
    fclose(fp);

    if (patternCount == 0)
    {
        printf("No training data.\n");
        return 1;
    }

    system("PAUSE");

    float weights[2];
    weights[0] = randomFloat();
    weights[1] = randomFloat();

    float learningRate = 0.1f;

    int iteration = 0; // completed epochs
    float globalError;

    do {
        globalError = 0;
        int p = 0; // iterator
        for (p = 0; p < patternCount; p++)
        {
            // Calculate output.
            int output = calculateOutput(weights, x[p], y[p]);

            // Calculate error: 0 when correct, +2 or -2 when misclassified.
            float localError = outputs[p] - output;

            if (localError != 0)
            {
                // Update weights: move each one along its own input.
                weights[0] += learningRate * localError * x[p];
                weights[1] += learningRate * localError * y[p];
            }

            // Accumulate the absolute error of this epoch.
            globalError += fabsf(localError);

            printf("Iteration %d Error %.2f %.2f\n", iteration, globalError, localError);
        }

        // Count whole passes over the data, not single samples.
        iteration++;

        system("PAUSE");

    } while (globalError != 0 && iteration < MAX_EPOCHS);

    if (globalError != 0)
    {
        printf("Stopped after %d iterations without converging.\n", iteration);
    }

    system("PAUSE");
    return 0;
}

我正在使用的训练集:Data Set

我已经删除了所有不相关的代码。基本上它现在所做的是读取 test1.txt 文件并将值从它加载到三个数组:x、y、outputs.

然后是一个感知器学习算法(perceptron learning algorithm)。由于某种原因，它没有收敛到 0(globalError 应该收敛到 0)，因此 do-while 循环永远不会结束。

当我使用较小的训练集(例如 5 个点)时，效果很好。有什么想法可能是问题所在吗？

我写的这个算法和这个 C# 感知器算法(C# Perceptron algorithm)非常相似:

编辑:

这是一个训练集较小的例子:

#include <stdio.h>
#include <stdlib.h>
#include <math.h>

// Scales the next value from rand() by RAND_MAX, giving a float in the
// closed range [0, 1]. This function does not seed the generator itself.
float randomFloat()
{
    const float scale = (float)RAND_MAX;

    return (float)rand() / scale;
}

// Sign-threshold unit over two inputs: the weighted sum
// x*weights[0] + y*weights[1] maps to 1 when it is >= 0 and to -1 otherwise.
int calculateOutput(float weights[], float x, float y)
{
    float weighted = weights[0] * x + weights[1] * y;
    int label = -1;

    if (weighted >= 0)
    {
        label = 1;
    }

    return label;
}

// Trains a two-weight perceptron on a built-in four-sample training set,
// then prints the class it assigns to every point of a 5x5 grid over
// [-1, 1] x [-1, 1], followed by the learned weights.
//
// Returns 0.
int main(int argc, char *argv[])
{
    (void)argc;
    (void)argv;

    srand(time(NULL));

    // X coordinates of the training set.
    float x[] = { -3.2, 1.1, 2.7, -1 };

    // Y coordinates of the training set.
    float y[] = { 1.5, 3.3, 5.12, 2.1 };

    // The training set outputs.
    int outputs[] = { 1, -1, -1, 1 };

    int i = 0; // iterator

    system("PAUSE");

    // Element count taken from the array's own element type, so it stays
    // correct even where sizeof(float) differs from sizeof(int).
    int patternCount = (int)(sizeof x / sizeof x[0]);

    float weights[2];
    weights[0] = randomFloat();
    weights[1] = randomFloat();

    float learningRate = 0.1;

    int iteration = 0;
    float globalError;

    // These four samples can be separated by a line through the origin
    // (for example weights (-1, 0)), so an error-free pass is reachable
    // even without a bias weight.
    do {
        globalError = 0;
        int p = 0; // iterator
        for (p = 0; p < patternCount; p++)
        {
            // Calculate output.
            int output = calculateOutput(weights, x[p], y[p]);

            // Calculate error: 0 when correct, +2 or -2 when misclassified.
            float localError = outputs[p] - output;

            if (localError != 0)
            {
                // Update weights.
                for (i = 0; i < 2; i++)
                {
                    float add = learningRate * localError;
                    if (i == 0)
                    {
                        add *= x[p];
                    }
                    else if (i == 1)
                    {
                        add *= y[p];
                    }
                    weights[i] +=  add;
                }
            }

            // Convert error to absolute value.
            globalError += fabs(localError);

            printf("Iteration %d Error %.2f\n", iteration, globalError);          
        }

        iteration++;

    } while (globalError != 0);

    // Display network generalisation.
    printf("X       Y     Output\n");
    float j, k;
    for (j = -1; j <= 1; j += .5)
    {
        // The inner loop must step k. Stepping j here left k uninitialised
        // and ended the outer loop after a single row.
        for (k = -1; k <= 1; k += .5)
        {
            // Calculate output.
            int output = calculateOutput(weights, j, k);
            printf("%.2f  %.2f  %s\n", j, k, (output == 1) ? "Blue" : "Red");
        }
    }

    // Display modified weights.
    printf("Modified weights: %.2f %.2f\n", weights[0], weights[1]);

    system("PAUSE");
    return 0;
}

最佳答案

在您当前的代码中，感知器成功学习了决策边界的方向，但无法平移它(即边界始终被迫经过原点)。

    y                              y
    ^                              ^
    |  - + \\  +                   |  - \\ +   +
    | -    +\\ +   +               | -   \\  + +   +
    | - -    \\ +                  | - -  \\    +
    | -  -  + \\  +                | -  -  \\ +   +
    ---------------------> x       --------------------> x
        stuck like this            need to get like this

(as someone pointed out, here is a more accurate version)

The problem lies in the fact that your perceptron has no bias term, i.e. a third weight component connected to an input of value 1.

       w0   -----
    x ---->|     |
           |  f  |----> output (+1/-1)
    y ---->|     |
       w1   -----
               ^ w2
    1(bias) ---|

The following is how I corrected the problem:

#include <stdio.h>
#include <stdlib.h>
#include <math.h>
#include <time.h>

#define LEARNING_RATE    0.1
#define MAX_ITERATION    100

/* Scales the next rand() value by RAND_MAX into the closed range [0, 1]. */
float randomFloat()
{
    float numerator = (float)rand();
    float denominator = (float)RAND_MAX;

    return numerator / denominator;
}

/*
 * Linear threshold unit with a bias term.
 *
 * weights[0] and weights[1] multiply x and y; weights[2] is added as the
 * bias. Returns 1 when the resulting sum is >= 0, and -1 otherwise.
 */
int calculateOutput(float weights[], float x, float y)
{
    float activation = weights[0] * x + weights[1] * y + weights[2];

    if (activation >= 0) {
        return 1;
    }
    return -1;
}

/*
 * Trains a perceptron with a bias weight on the samples in test1.txt.
 *
 * Each record of the file is "x y label"; a label of 0 is remapped to -1 to
 * match the +1/-1 values returned by calculateOutput().  After every pass
 * over the data the root mean squared error is printed; training stops when
 * a pass makes no error or after MAX_ITERATION passes.  The learned line
 * w0*x + w1*y + w2 = 0 is printed at the end.
 *
 * Returns 0 after training; exits with status 1 if the file cannot be
 * opened or yields no samples.
 */
int main(int argc, char *argv[])
{
    enum { MAX_PATTERNS = 208 };

    float x[MAX_PATTERNS], y[MAX_PATTERNS], weights[3], localError, globalError;
    int outputs[MAX_PATTERNS], patternCount, p, iteration, output;
    FILE *fp;

    (void)argc;
    (void)argv;

    srand((unsigned int)time(NULL));

    if ((fp = fopen("test1.txt", "r")) == NULL) {
        printf("Cannot open file.\n");
        exit(1);
    }

    /*
     * Read until the arrays are full or a record fails to parse as three
     * fields.  Testing only for EOF loops forever on a malformed record
     * (fscanf returns 0 without consuming it) and overruns the arrays when
     * the file has more than MAX_PATTERNS records.
     */
    patternCount = 0;
    while (patternCount < MAX_PATTERNS &&
           fscanf(fp, "%f %f %d", &x[patternCount], &y[patternCount],
                  &outputs[patternCount]) == 3) {
        if (outputs[patternCount] == 0) {
            outputs[patternCount] = -1;
        }
        patternCount++;
    }
    fclose(fp);

    /* Without samples the RMSE below would be 0/0. */
    if (patternCount == 0) {
        printf("No training data.\n");
        exit(1);
    }

    weights[0] = randomFloat();
    weights[1] = randomFloat();
    weights[2] = randomFloat();

    iteration = 0;
    do {
        iteration++;
        globalError = 0;
        for (p = 0; p < patternCount; p++) {
            output = calculateOutput(weights, x[p], y[p]);

            /* 0 when correct, +2 or -2 when misclassified. */
            localError = outputs[p] - output;
            weights[0] += LEARNING_RATE * localError * x[p];
            weights[1] += LEARNING_RATE * localError * y[p];
            weights[2] += LEARNING_RATE * localError;

            globalError += (localError*localError);
        }

        /* Root Mean Squared Error */
        printf("Iteration %d : RMSE = %.4f\n",
            iteration, sqrt(globalError/patternCount));

        /* "<" rather than "<=": iteration is already counted for this pass,
           so this allows exactly MAX_ITERATION passes. */
    } while (globalError > 0 && iteration < MAX_ITERATION);

    printf("\nDecision boundary (line) equation: %.2f*x + %.2f*y + %.2f = 0\n",
        weights[0], weights[1], weights[2]);

    return 0;
}

... 输出如下:

Iteration 1 : RMSE = 0.7206
Iteration 2 : RMSE = 0.5189
Iteration 3 : RMSE = 0.4804
Iteration 4 : RMSE = 0.4804
Iteration 5 : RMSE = 0.3101
Iteration 6 : RMSE = 0.4160
Iteration 7 : RMSE = 0.4599
Iteration 8 : RMSE = 0.3922
Iteration 9 : RMSE = 0.0000

Decision boundary (line) equation: -2.37*x + -2.51*y + -7.55 = 0

下面是用 MATLAB 对上述代码制作的简短动画，显示了每次迭代中的决策边界(decision boundary):

关于c - 感知器学习算法不收敛到 0，我们在Stack Overflow上找到一个类似的问题： https://stackoverflow.com/questions/1697243/

文章推荐： android - 从 fragmentActivity 刷新 fragment UI

文章推荐： android - 是否可以从 Android Wear SDK 获取 GPS 位置？

文章推荐： android - 打开卡上的文件夹

文章推荐： android - 抽屉导航中的背景图像和 ImageView

JavaFX DPI 感知
晚安，我正在与一些合作伙伴使用 javaFx 制作一个应用程序；我们的想法是它将在 Windows 和 Linux 中使用。我们进行了一些测试，发现应用程序在两种操作系统中的显示有所不同。我们正在使
winapi - 意外处理 DPI 感知
我有一项服务，可通过 CreateProcessAsUser 将可执行文件启动到用户 session 中，并在 STARTUPINFO 参数中指定桌面。它运行良好。我的可执行文件没有显示出来，也没有
hadoop 管道写入和 Rack 感知
当每个文件写入集群时，HDFS 会创建一个复制管道。假设有两个 Rack 1 和 5。根据 Rack 感知，第一个 block 将被保存到 Rack 1，其他两个复制 block 将被插入 Rack
python - 如何在不更改值的情况下使时间对象 TZ 感知？
我正在做一个 Django 项目，我对时区感到困惑。我有一个事件对象，它有 publish_start 和 publish_end 日期。控制台输出示例； campaingObject.publi
windows - 安装字体并让 Windows 感知
我在下面有一个函数，它通过将字体 (.ttf) 复制到 Windows 字体文件夹然后触发 WM_FONTCHANGE 消息将其安装到 Windows 中。但是，该字体不会立即在 Windows 资源
java - Stacktrace 感知 grep
是否有类似 grep 的 Unix/Linux 命令行工具可以理解由 log4j 或 logback 打印的日志文件中的 Java 堆栈跟踪？该工具应该理解堆栈跟踪由多行组成。典型的用例是在查看存储
Java 感知 merge 命令
每次我在我的 SCM 中看到诸如导入或方法签名更改(例如变量的重命名)之类的冲突时，我想知道是否有类似语言感知的 diff/merge 方法可以处理更烦人的小更改发生在共享项目上。有什么东西可以在 U
cassandra - token 感知 Astyanax 连接池在节点上连接而不在节点上分配连接
我使用 astyanax 连接池定义如下: ipSeeds = "LOAD_BALANCER_HOST:9160"; conPool.setSeeds(ipSeeds) .setDiscoveryTy
utf-8 - UTF8 感知 printf？
据我所知，OCaml 中的字符串只是简单的字节序列。他们没有编码的概念。这对于大多数用途来说都很好。但是，标准库的某些部分对以单字节字符集编码的字符串做出了假设，例如 printf 的对齐功能: #
utf-8 - UTF8 感知 printf？
据我所知，OCaml 中的字符串只是简单的字节序列。他们没有编码的概念。这对于大多数用途来说都很好。但是，标准库的某些部分对以单字节字符集编码的字符串做出了假设，例如 printf 的对齐功能: #
c# - 使用 Cookie 感知 WebClient
我正在使用 this enhanced version of WebClient登录网站: public class CookieAwareWebClient : WebClient {
android - ACL_ACCESS_DENIED 感知 API - Android
我正在尝试将 Awareness API 集成到一个新项目中，但我遇到了一条错误消息:ACL_ACCESS_DENIED 状态代码:7503。我也在其他项目中集成了 Awareness API，但上
java - session 感知 spring bean
有什么方法可以定义一个 spring bean，当 session 中的数据发生变化时，它会得到通知？如果可能的话，我还想知道纯 Java 解决方案。我想要的只是当我在 httpsession 中添
c++ - NUMA 感知 Cpp 容器
有没有方便有效的方式以 NUMA 感知方式使用 cpp 标准容器 API？我想在 cpp 环境中执行 OpenMP 并行稀疏矩阵 vector 乘法。要分配和初始化与 NUMA 域有关的 vecto
c++ - SetWindowPos() 跨进程 DPI 感知
我正在创建一个程序，它使用 SetWindowPos() 从另一个进程移动/调整窗口大小。我自己的程序是 PROCESS_PER_MONITOR_DPI_AWARE。其他程序可以是 PROCESS_D
java - JTA 感知 JDBC 连接池
我一直在研究许多 JDBC 连接池，但我有一个特定的要求，即池需要是 JTA 感知的，这给我留下了 Apache DBCP 和 OW2 XAPool 的简短列表。我查看的其他池(c3p0、Proxoo
php - 如何使 file_get_contents session 感知？
我有一个 php 脚本，可以在服务器上发出一系列请求。第一个请求将是登录请求。问题是 file_get_contents 似乎每次都创建一个新 session ，那么我怎样才能让它感知 sessio
numpy - 从整数创建 tz 感知 pandas 时间戳对象
我有一个整数，表示 unix 纪元之后的微秒数。 (格林威治标准时间) 如何使用 astype 将 1349863207154117 转换为 pandas.Timestamp("2012-10-10T
web-services - 如何使@WebService Spring 感知
我有一个 Web 服务，我正在尝试将变量 Autowiring 到其中。这是类(class): package com.xetius.isales.pr7.service; import java.u
wpf - 禁用 WPF 应用程序的 DPI 感知
再会! 我已经在 WPF 应用程序上工作了一段时间(作为一种学习体验，哦，天哪，这是一种学习体验)，它终于可以发布了。发布意味着将其安装在我的 HTPC 上，用于浏览我的电影收藏。我在运行 1920

太空狗

个人简介

我是一名优秀的程序员,十分优秀！

作者热门文章

滴滴打车优惠券免费领取

全站热门文章

首页

博学

6Ren·AI

商城

c - 感知器学习算法不收敛到 0