- html - 出于某种原因,IE8 对我的 Sass 文件中继承的 html5 CSS 不友好?
- JMeter 在响应断言中使用 span 标签的问题
- html - 在 :hover and :active? 上具有不同效果的 CSS 动画
- html - 相对于居中的 html 内容固定的 CSS 重复背景?
我正在尝试用 C 实现一个循环神经网络,但它不起作用。我在互联网上阅读了一些文档,但我不懂复杂的数学。所以我调整了多层感知器的计算。
在学习的几个步骤中,我的网络的输出是一个数字,但很快输出就变成了“不是数字”(-1,#IND00)。
1. 计算。
我的第一个问题是数值、误差和权重变化的计算。
对于两个神经元之间的前向链接 N1->N2,我通过以下方式计算:
(value of N2) += (value of N1) * (weight of link N1->N2)
(error of N1) += (error of N2) * (weight of link N1->N2)
对于输出神经元:(error) = (value of neuron) - (target output)
(new weight) = (old weight) - derivative(value of N2) * (error of N2) * (value of N1) * learning_rate
对于循环链接 N2->N1,我通过以下方式计算:
(value of N1) += (previous value of N2) * (weight of link N2->N1)
然后将来自所有前向链接和循环链接的 N1 的最终值传递给一个 sigmoid 函数 (tanh),输出神经元除外。
(error of N2) += (previous error of N1) * (weight of link N2->N1)
(new weight) = (old weight) - derivative(value of N1) * (error of N1) * (previous value of N2) * learning_rate
前向传递和反向传递请参见函数 rnnset()、rnnsetstart() 和 rnnlearn();在这 3 个函数中,循环链接已被禁用(见被注释掉的行/代码块)。
rnnsetstart() 必须在 rnnset() 之前调用,以便将上一次前向传递的值存储到神经元变量 value_prev 中。
#include <stdio.h>
#include <time.h>
#include <math.h>
#include <malloc.h>
#include <stdlib.h>
#include "mlp.h"
/*
 * One neuron of the recurrent network.
 * Incoming links are stored on the receiving neuron: synapsesin[j] is the
 * source neuron of link j and weight[j] is the weight of that link.
 */
typedef struct _neuron {
    int layer;                    /* 0-based index of the layer this neuron belongs to */
    double *weight;               /* weights of the incoming synapses */
    int nbsynapsesin;             /* number of incoming synapses */
    struct _neuron **synapsesin;  /* source neuron of each incoming synapse */
    double bias;
    double value;                 /* value from the latest forward pass (rnnset) */
    double value_prev;            /* snapshot taken by rnnsetstart() */
    double error;                 /* error from the latest rnnlearn() call */
    double error_prev;            /* copy of error made at the end of rnnlearn() */
} NEURON;
/* A whole network: every neuron lives in one array, ordered layer by layer. */
typedef struct _rnn {
    int *layersize;  /* [0] = number of layers, [1..] = neurons in each layer */
    int nbneurons;   /* number of entries in n */
    NEURON *n;       /* neuron table */
} RNN;
/* Topology description consumed by creaternn(). */
typedef struct _config {
    int nbneurons;   /* total neuron count over all layers */
    int *layersize;  /* [0] = number of layers, [1..] = neurons in each layer */
    int nbsynapses;  /* number of links, forward and recurrent together */
    int *synapses;   /* 2*nbsynapses ints: (source index, target index) pairs */
} CONFIG;
/*
 * Build the topology of a layered network in which every pair of neurons in
 * adjacent layers is joined by one forward link and one recurrent (backward)
 * link.
 *
 * layersize: layersize[0] is the number of layers, layersize[1..] the number
 *            of neurons in each layer. The table is copied.
 * Returns a CONFIG to release with freeconfig(), or NULL if layersize is NULL
 * or an allocation fails.
 */
CONFIG * createconfig(int * layersize) {
    int i, j, l;

    if (layersize == NULL) return NULL;
    const int nblayers = layersize[0];

    CONFIG *conf = malloc(sizeof *conf);
    if (conf == NULL) return NULL;

    conf->nbneurons = 0;
    for (i = 1; i <= nblayers; i++) conf->nbneurons += layersize[i];

    /* One forward and one recurrent link per pair of adjacent-layer neurons. */
    conf->nbsynapses = 0;
    for (i = 1; i < nblayers; i++) conf->nbsynapses += layersize[i] * layersize[i+1];
    conf->nbsynapses *= 2;

    conf->layersize = malloc((size_t)(nblayers + 1) * sizeof *conf->layersize);
    conf->synapses = malloc(2 * (size_t)conf->nbsynapses * sizeof *conf->synapses);
    /* malloc(0) may legitimately return NULL when there are no links at all. */
    if (conf->layersize == NULL || (conf->synapses == NULL && conf->nbsynapses > 0)) {
        free(conf->synapses);
        free(conf->layersize);
        free(conf);
        return NULL;
    }
    for (i = 0; i <= nblayers; i++) conf->layersize[i] = layersize[i];

    /* Emit (source, target) pairs; neurons are numbered layer after layer. */
    int k = 0;      /* write position in conf->synapses */
    int lower = 0;  /* index of the first neuron of layer i */
    int upper = 0;  /* index of the first neuron of layer i+1 */
    for (i = 1; i < nblayers; i++) {
        upper += layersize[i];
        for (j = 0; j < layersize[i]; j++) {
            for (l = 0; l < layersize[i+1]; l++) {
                /* forward link */
                conf->synapses[k++] = lower + j;
                conf->synapses[k++] = upper + l;
                /* recurrent link */
                conf->synapses[k++] = upper + l;
                conf->synapses[k++] = lower + j;
            }
        }
        lower += layersize[i];
    }
    return conf;
}
/*
 * Release a CONFIG returned by createconfig() together with its tables.
 * Passing NULL is a no-op, mirroring free().
 */
void freeconfig(CONFIG* conf) {
    if (conf == NULL) return;
    free(conf->synapses);
    free(conf->layersize);
    free(conf);
}
/*
 * Instantiate a network from a topology description.
 *
 * Everything needed is copied out of conf, so conf may be freed afterwards.
 * Weights and biases are drawn with rand() from about [-0.5, 0.5]; values and
 * errors start at 0.
 *
 * Returns a network to release with freernn(), or NULL if conf is NULL or an
 * allocation fails (nothing is leaked in that case).
 */
RNN * creaternn(CONFIG * conf) {
    int i, j, s;

    if (conf == NULL) return NULL;
    RNN *net = malloc(sizeof *net);
    if (net == NULL) return NULL;

    const int nblayers = conf->layersize[0];
    net->nbneurons = conf->nbneurons;
    net->layersize = malloc((size_t)(nblayers + 1) * sizeof *net->layersize);
    net->n = malloc((size_t)conf->nbneurons * sizeof *net->n);
    if (net->layersize == NULL || (net->n == NULL && conf->nbneurons > 0)) {
        free(net->n);
        free(net->layersize);
        free(net);
        return NULL;
    }
    for (i = 0; i <= nblayers; i++) net->layersize[i] = conf->layersize[i];

    /* Assign each neuron to its layer; neurons are numbered layer after layer. */
    int layer = 0, remaining = 0;
    for (i = 0; i < net->nbneurons; i++) {
        NEURON *ni = &net->n[i];
        if (remaining == 0) { remaining = conf->layersize[layer + 1]; layer++; }
        remaining--;
        ni->layer = layer - 1;
        ni->nbsynapsesin = 0;
        /* NULL until allocated so that the failure path can free blindly. */
        ni->weight = NULL;
        ni->synapsesin = NULL;
    }

    /* Count the incoming synapses of each neuron (second int of each pair). */
    for (s = 0; s < conf->nbsynapses; s++) net->n[conf->synapses[2*s + 1]].nbsynapsesin++;

    /* Allocate the per-neuron tables, then reset the counter: it is reused
     * below as the fill position while linking. */
    int failed = 0;
    for (i = 0; i < net->nbneurons && !failed; i++) {
        NEURON *ni = &net->n[i];
        const size_t count = (size_t)ni->nbsynapsesin;
        ni->weight = malloc(count * sizeof *ni->weight);
        ni->synapsesin = malloc(count * sizeof *ni->synapsesin);
        failed = count > 0 && (ni->weight == NULL || ni->synapsesin == NULL);
        ni->nbsynapsesin = 0;
    }
    if (failed) {
        for (i = 0; i < net->nbneurons; i++) {
            free(net->n[i].weight);
            free(net->n[i].synapsesin);
        }
        free(net->n);
        free(net->layersize);
        free(net);
        return NULL;
    }

    /* Link the incoming synapses with the neurons. */
    for (s = 0; s < conf->nbsynapses; s++) {
        NEURON *src = &net->n[conf->synapses[2*s]];
        NEURON *dst = &net->n[conf->synapses[2*s + 1]];
        dst->synapsesin[dst->nbsynapsesin++] = src;
    }

    /* Initialization of the values, errors, and weights. */
    for (i = 0; i < net->nbneurons; i++) {
        NEURON *ni = &net->n[i];
        for (j = 0; j < ni->nbsynapsesin; j++) {
            ni->weight[j] = 1.0 * (double)rand() / RAND_MAX - 1.0/2;
        }
        ni->bias = 1.0 * (double)rand() / RAND_MAX - 1.0/2;
        ni->value = 0.0;
        ni->value_prev = 0.0;
        ni->error_prev = 0.0;
        ni->error = 0.0;
    }
    return net;
}
/*
 * Release a network returned by creaternn(), including the per-neuron tables.
 * Passing NULL is a no-op, mirroring free().
 */
void freernn(RNN * net) {
    int i;
    if (net == NULL) return;
    if (net->n != NULL) {
        for (i = 0; i < net->nbneurons; i++) {
            free(net->n[i].weight);
            free(net->n[i].synapsesin);
        }
    }
    free(net->n);
    free(net->layersize);
    free(net);
}
/*
 * Copy the values of the output layer into out.
 * The outputs are written in reverse neuron order: out[0] receives the value
 * of the last neuron of the network.
 */
void rnnget(RNN * net, double * out) {
    const int nboutputs = net->layersize[net->layersize[0]];
    int pos;
    for (pos = 0; pos < nboutputs; pos++) {
        out[pos] = net->n[net->nbneurons - 1 - pos].value;
    }
}
/*
 * Forward pass: load the inputs and compute the value of every other neuron.
 *
 * in: one value per neuron of the first layer.
 *
 * Neurons are visited in index order, so the sources of all forward links are
 * already up to date when a neuron is computed. Hidden neurons are squashed
 * with tanh; output neurons stay linear. Input neurons keep the caller's value
 * unchanged - they used to be passed through tanh as well, which distorted the
 * data fed to the network.
 */
void rnnset(RNN * net, double * in) {
    int i, j;
    const int lastlayer = net->layersize[0] - 1;
    const int nbinputs = net->layersize[1];

    // For each neuron:
    for (i = 0; i < net->nbneurons; i++) {
        NEURON *ni = &(net->n[i]);
        if (i < nbinputs) {
            ni->value = in[i];
            continue;
        }
        double sum = ni->bias;
        // For each incoming synapse:
        for (j = 0; j < ni->nbsynapsesin; j++) {
            NEURON *nj = ni->synapsesin[j];
            // If it is a forward link/synapse:
            if (ni->layer > nj->layer) sum += nj->value * ni->weight[j];
            // Uncomment the following line to activate recurrent links computation:
            //else sum += nj->value_prev * ni->weight[j];
        }
        // If NOT the output layer, then tanh the value:
        ni->value = (ni->layer != lastlayer) ? tanh(sum) : sum;
    }
}
/*
 * Snapshot the current value of every neuron into value_prev.
 * Output neurons are not squashed by the forward pass, so their snapshot is
 * tanh(value); every other neuron is copied as is.
 */
void rnnsetstart(RNN * net) {
    int idx = 0;
    while (idx < net->nbneurons) {
        NEURON *cur = &(net->n[idx]);
        const int is_output = (cur->layer == net->layersize[0]-1);
        cur->value_prev = is_output ? tanh(cur->value) : cur->value;
        idx++;
    }
}
/*
 * One gradient step towards the target values, using the state left by the
 * latest forward pass.
 *
 * out:          target values, in the same reverse neuron order as rnnget()
 *               produces (out[0] belongs to the last neuron).
 * learningrate: factor applied to every weight and bias change.
 *
 * Steps: compute the output errors, push errors back through the forward
 * links, update all weights and biases, then copy error into error_prev.
 * Only output-layer weights and biases are clamped to [-5, 5].
 */
void rnnlearn(RNN * net, double * out, double learningrate) {
int i,j,k;
k=0;
NEURON *ni,*nj;
// Initialize error to zero for the output layer:
for(i=net->nbneurons-1; i>=net->nbneurons-net->layersize[net->layersize[0]]; i--) net->n[i].error = 0.0;
// Compute the error for output neurons (value - target) and reset the error
// of every other neuron. Walking backwards means k counts targets in reverse
// neuron order:
for(i=net->nbneurons-1; i>=0; i--) {
ni = &(net->n[i]);
// If ni is an output neuron, update the error:
if(ni->layer == net->layersize[0]-1) {
ni->error += ni->value - out[k];
k++;
} else {
ni->error = 0.0;
}
// Uncomment the following block to activate recurrent links computation:
/*
// For each incoming synapse from output layer:
for(j=0; j<ni->nbsynapsesin; j++) {
nj = ni->synapsesin[j];
// If neuron nj is in output layer, then update the error:
if(nj->layer == net->layersize[0]-1) nj->error += ni->error_prev * ni->weight[j];
}
*/
}
// Compute error for all other neurons. Neurons are visited from the last one
// to the first, so a layer's errors are complete before they are pushed to
// the layer below:
for(i=net->nbneurons-1; i>=0; i--) {
ni = &(net->n[i]);
// For each input synapse NOT from output layer:
for(j=0; j<ni->nbsynapsesin; j++) {
nj = ni->synapsesin[j];
// If neuron nj is NOT in output layer, then update the error:
if(nj->layer != net->layersize[0]-1) {
// If it is a forward link/synapse:
// NOTE(review): ni->error is propagated without the tanh derivative of ni;
// textbook backpropagation would multiply by (1 - value^2) here - confirm intent.
if(ni->layer > nj->layer) nj->error += ni->error * ni->weight[j];
// Uncomment the following line to activate recurrent links computation:
//else nj->error += ni->error_prev * ni->weight[j];
}
}
}
// Update weights:
for(i=0; i<net->nbneurons; i++) {
ni = &(net->n[i]);
double wchange,derivative;
// For the output layer (linear activation, so no derivative factor):
if(ni->layer == net->layersize[0]-1) {
derivative = ni->error * learningrate;
// For each incoming synapse:
for(j=0; j<ni->nbsynapsesin; j++) {
nj = ni->synapsesin[j];
wchange = derivative;
// If it is a forward link/synapse:
if(ni->layer > nj->layer) wchange *= nj->value;
// Otherwise it is a recurrent link: use the source's previous value.
else wchange *= nj->value_prev;
ni->weight[j] -= wchange;
// Keep output-layer weights within [-5, 5]:
if(ni->weight[j] > 5) ni->weight[j] = 5;
if(ni->weight[j] < -5) ni->weight[j] = -5;
}
ni->bias -= derivative;
if(ni->bias > 5) ni->bias = 5;
if(ni->bias < -5) ni->bias = -5;
// For the other layers:
} else {
// tanh'(x) expressed through the neuron's value: 1 - value^2
derivative = 1.0 - ni->value * ni->value;
derivative *= ni->error * learningrate;
// For each incoming synapse:
for(j=0; j<ni->nbsynapsesin; j++) {
nj = ni->synapsesin[j];
wchange = derivative;
// If it is a forward link/synapse:
if(ni->layer > nj->layer) wchange *= nj->value;
// NOTE(review): recurrent weights are still trained here although the
// recurrent contribution is commented out in rnnset().
else wchange *= nj->value_prev;
ni->weight[j] -= wchange;
}
ni->bias -= derivative;
}
}
// Update error_prev:
for(i=0; i<net->nbneurons; i++) net->n[i].error_prev = net->n[i].error;
}
/*
 * Trains a plain MLP and the recurrent network on y = x*x for x in [0, 1),
 * then prints the RMS error of each network over 10000 random samples.
 * Training stops once the RMS error over 100 samples drops to 0.005 or after
 * 1000 cycles of 100 learning steps.
 */
int main() {
    srand((unsigned)time(NULL));
    int layersize[] = {1, 25, 12, 1};
    int layersize_netrnn[] = { 4, 1, 25, 12, 1 };
    mlp * netmlp = create_mlp (4, layersize);
    CONFIG * configrnn = createconfig(layersize_netrnn);
    RNN * netrnn = (configrnn != NULL) ? creaternn(configrnn) : NULL;
    if (netmlp == NULL || configrnn == NULL || netrnn == NULL) {
        /* The process exits right away, so partial allocations are not freed. */
        fprintf(stderr, "network allocation failed\n");
        return EXIT_FAILURE;
    }

    double inc, outc, desired_out;
    double global_error = 1;
    double global_error2 = 1;
    int iter, k, i1 = 0, i2 = 0;

    //////////////////////////////////////////////////////
    // Training of the Multi-Layer Perceptron:
    //////////////////////////////////////////////////////
    while (global_error > 0.005 && i1 < 1000) {
        for (iter = 0; iter < 100; iter++) {
            inc = 1.0*rand()/(RAND_MAX+1.0);
            outc = inc*inc;
            set_mlp(netmlp, &inc);
            learn_mlp(netmlp, &outc, 0.03);
        }
        global_error = 0;
        for (k = 0; k < 100; k++) {
            inc = 1.0*rand()/(RAND_MAX+1.0);
            desired_out = inc*inc;
            set_mlp(netmlp, &inc);
            get_mlp(netmlp, &outc);
            global_error += (desired_out - outc)*(desired_out - outc);
        }
        global_error /= 100;
        global_error = sqrt(global_error);
        i1++;
    }

    //////////////////////////////////////////////////////
    // Training of the Recurrent Neural Network:
    //////////////////////////////////////////////////////
    while (global_error2 > 0.005 && i2 < 1000) {
        for (iter = 0; iter < 100; iter++) {
            inc = 1.0*rand()/(RAND_MAX+1.0);
            outc = inc*inc;
            rnnsetstart(netrnn);
            rnnset(netrnn, &inc);
            rnnlearn(netrnn, &outc, 0.03);
        }
        global_error2 = 0;
        for (k = 0; k < 100; k++) {
            inc = 1.0*rand()/(RAND_MAX+1.0);
            desired_out = inc*inc;
            rnnsetstart(netrnn);
            rnnset(netrnn, &inc);
            rnnget(netrnn, &outc);
            global_error2 += (desired_out - outc)*(desired_out - outc);
        }
        global_error2 /= 100;
        global_error2 = sqrt(global_error2);
        /* Only NaN/inf mean the network diverged. isnormal() is also false for
         * 0 and subnormals, which would turn a perfect score into a failure. */
        if (!isfinite(global_error2)) global_error2 = 100;
        i2++;
    }

    //////////////////////////////////////////////////////
    // Test of performance for the both networks:
    //////////////////////////////////////////////////////
    global_error = 0;
    global_error2 = 0;
    for (k = 0; k < 10000; k++) {
        inc = 1.0*rand()/(RAND_MAX+1.0);
        desired_out = inc*inc;
        rnnsetstart(netrnn);
        rnnset(netrnn, &inc);
        rnnget(netrnn, &outc);
        global_error2 += (desired_out - outc)*(desired_out - outc);
        set_mlp(netmlp, &inc);
        get_mlp(netmlp, &outc);
        global_error += (desired_out - outc)*(desired_out - outc);
    }
    global_error /= 10000;
    global_error = sqrt(global_error);
    printf("\n MLP: i: %5d error: %f",i1,global_error);
    global_error2 /= 10000;
    global_error2 = sqrt(global_error2);
    printf("\n RNN: i: %5d error: %f",i2,global_error2);

    free_mlp(netmlp);
    freeconfig(configrnn);
    freernn(netrnn);
    return 0;
}
和文件 mlp.h:
// Scalar type used for every value, error and weight of the perceptron.
typedef double mlp_float;
// A fully connected multi-layer perceptron. Neurons of all layers share one
// array; weights of all layer transitions share another.
typedef struct {
// All weights (synapse_number entries). For each layer transition and each
// target neuron: one weight per source neuron, followed by one bias weight.
mlp_float *synaptic_weight;
// Value of every neuron (neuron_number entries), layers stored back to back.
mlp_float *neuron_value;
// Error of every neuron, indexed like neuron_value.
mlp_float *neuron_error_value;
// Alias of neuron_value: the first layer.
mlp_float *input_neuron;
// Points into neuron_value at the first neuron of the last layer.
mlp_float *output_neuron;
// Points into neuron_error_value at the first neuron of the last layer.
mlp_float *output_error_value;
// layer_index[i]: index in neuron_value of the first neuron of layer i.
int *layer_index;
// layer_size[i]: number of neurons in layer i.
int *layer_size;
// synapse_index[i]: index in synaptic_weight of the first weight between
// layer i and layer i+1 (layer_number-1 entries).
int *synapse_index;
int layer_number;
int neuron_number;
int synapse_number;
int input_layer_size;
int output_layer_size;
} mlp;
// Width of the range used for random initial weights: create_mlp() and
// reinit_mlp() draw from about [-MAGICAL_WEIGHT_NUMBER/2, +MAGICAL_WEIGHT_NUMBER/2].
static mlp_float MAGICAL_WEIGHT_NUMBER = 1.0f;
// NOTE(review): not referenced by any function shown in this header.
static mlp_float MAGICAL_LEARNING_NUMBER = 0.4f;
/*
 * Overwrite every weight of the network (bias weights included) with a fresh
 * random value drawn with rand(), centred on zero.
 */
void reinit_mlp(mlp * network) {
    int remaining = network->synapse_number;
    mlp_float *w = network->synaptic_weight;
    for (; remaining > 0; remaining--, w++) {
        *w = MAGICAL_WEIGHT_NUMBER * (mlp_float)rand() / RAND_MAX - MAGICAL_WEIGHT_NUMBER/2;
    }
}
mlp *create_mlp(int layer_number, int *layer_size) {
mlp *network = (mlp*)malloc(sizeof * network);
network->layer_number = layer_number;
network->layer_size = (int*)malloc(sizeof * network->layer_size * network->layer_number);
network->layer_index = (int*)malloc(sizeof * network->layer_index * network->layer_number);
int i;
network->neuron_number = 0;
for (i = 0; i < layer_number; i++) {
network->layer_size[i] = layer_size[i];
network->layer_index[i] = network->neuron_number;
network->neuron_number += layer_size[i];
}
network->neuron_value = (mlp_float*)malloc(sizeof * network->neuron_value * network->neuron_number);
network->neuron_error_value = (mlp_float*)malloc(sizeof * network->neuron_error_value * network->neuron_number);
network->input_layer_size = layer_size[0];
network->output_layer_size = layer_size[layer_number-1];
network->input_neuron = network->neuron_value;
network->output_neuron = &network->neuron_value[network->layer_index[layer_number-1]];
network->output_error_value = &network->neuron_error_value[network->layer_index[layer_number-1]];
network->synapse_index = (int*)malloc(sizeof * network->synapse_index * (network->layer_number-1));
network->synapse_number = 0;
for (i = 0; i < layer_number - 1; i++) {
network->synapse_index[i] = network->synapse_number;
network->synapse_number += (network->layer_size[i]+1) * network->layer_size[i+1];
}
network->synaptic_weight = (mlp_float*)malloc(sizeof * network->synaptic_weight * network->synapse_number);
for (i = 0; i < network->synapse_number; i++) {
network->synaptic_weight[i] = MAGICAL_WEIGHT_NUMBER * (mlp_float)rand() / RAND_MAX - MAGICAL_WEIGHT_NUMBER/2;
}
return network;
}
/*
 * Release a network returned by create_mlp() and all of its arrays.
 * input_neuron, output_neuron and output_error_value point into those arrays
 * and are not freed separately. Passing NULL is a no-op, mirroring free().
 */
void free_mlp (mlp *network) {
    if (network == NULL) return;
    free(network->layer_size);
    free(network->layer_index);
    free(network->neuron_value);
    free(network->neuron_error_value);
    free(network->synapse_index);
    free(network->synaptic_weight);
    free(network);
}
/*
 * Forward pass of the perceptron.
 *
 * vector: input_layer_size values copied into the input layer, or NULL to
 *         keep the values the input layer already holds.
 *
 * Hidden layers are squashed with tanh; the last layer stays linear.
 */
void set_mlp (mlp * network, mlp_float *vector) {
    int layer, src, dst;

    if (vector != NULL) {
        for (src = 0; src < network->input_layer_size; src++) {
            network->input_neuron[src] = vector[src];
        }
    }

    /* Weights are consumed strictly in storage order, so one cursor suffices. */
    const mlp_float *w = network->synaptic_weight;
    for (layer = 1; layer < network->layer_number; layer++) {
        const int src_begin = network->layer_index[layer-1];
        const int src_end = src_begin + network->layer_size[layer-1];
        const int dst_begin = network->layer_index[layer];
        const int dst_end = dst_begin + network->layer_size[layer];
        const int is_last = (layer == network->layer_number - 1);

        for (dst = dst_begin; dst < dst_end; dst++) {
            mlp_float sum = 0.0;
            for (src = src_begin; src < src_end; src++) {
                sum += network->neuron_value[src] * *w++;
            }
            sum += *w++;  /* bias weight closes each target neuron's run */
            network->neuron_value[dst] = is_last ? sum : tanh(sum);
        }
    }
}
/* Copy the output_layer_size values of the last layer into vector. */
void get_mlp (mlp *network, mlp_float *vector) {
    int pos = 0;
    while (pos < network->output_layer_size) {
        vector[pos] = network->output_neuron[pos];
        pos++;
    }
}
/*
 * One gradient step towards desired_out, using the neuron values left by the
 * latest set_mlp() call.
 *
 * desired_out:   output_layer_size target values.
 * learning_rate: factor applied to every weight change.
 *
 * The output layer is updated first, then the hidden layers from the last one
 * back to the first. Only output-layer weights are clamped to [-5, 5].
 */
void learn_mlp (mlp *network, mlp_float *desired_out, mlp_float learning_rate) {
int i;
// NOTE(review): global_error is never used in this function.
mlp_float global_error = 0;
// First weight of the links that feed the output layer:
int synapse_index = network->synapse_index[network->layer_number-2];
// Output layer: error = output - target (linear activation, no derivative factor).
for (i = 0; i < network->output_layer_size; i++) {
network->output_error_value[i] = network->output_neuron[i] - desired_out[i];
int j;
// One weight per neuron of the last hidden layer:
for (j = network->layer_index[network->layer_number-2]; j < network->layer_index[network->layer_number-2] + network->layer_size[network->layer_number-2]; j++) {
mlp_float weightChange;
weightChange = learning_rate * network->output_error_value[i] * network->neuron_value[j];
network->synaptic_weight[synapse_index] -= weightChange;
if (network->synaptic_weight[synapse_index] > 5) network->synaptic_weight[synapse_index] = 5;
if (network->synaptic_weight[synapse_index] < -5) network->synaptic_weight[synapse_index] = -5;
synapse_index++;
}
// Bias weight of output neuron i:
mlp_float weightChange;
weightChange = learning_rate * network->output_error_value[i];
network->synaptic_weight[synapse_index] -= weightChange;
if (network->synaptic_weight[synapse_index] > 5) network->synaptic_weight[synapse_index] = 5;
if (network->synaptic_weight[synapse_index] < -5) network->synaptic_weight[synapse_index] = -5;
synapse_index++;
}
// Hidden layers, from the last hidden layer down to layer 1:
for (i = network->layer_number - 2; i > 0; i--) {
int j;
// jj: position of neuron j inside layer i
int jj= 0;
// First weight of the links that feed layer i:
int synapse_index = network->synapse_index[i-1];
for (j = network->layer_index[i]; j < network->layer_index[i] + network->layer_size[i]; j++,jj++) {
int k;
// Weight of the link from neuron j to the first neuron of layer i+1; the
// same link towards the next target neuron lies layer_size[i]+1 further on.
int synapse_index2 = network->synapse_index[i] + jj;
network->neuron_error_value[j] = 0;
// Gather the error from layer i+1. The weights read here were already
// updated earlier in this call.
// NOTE(review): the error of k is used without the tanh derivative of k when
// layer i+1 is a hidden layer - confirm this is intended.
for (k = network->layer_index[i+1]; k < network->layer_index[i+1] + network->layer_size[i+1]; k++) {
network->neuron_error_value[j] += network->synaptic_weight[synapse_index2] * network->neuron_error_value[k];
synapse_index2+=network->layer_size[i]+1;
}
// Update the weights of the links from layer i-1 into neuron j:
for (k = network->layer_index[i-1]; k < network->layer_index[i-1] + network->layer_size[i-1]; k++) {
mlp_float weightChange;
// tanh'(x) expressed through the neuron's value: 1 - value^2
weightChange = 1.0 - network->neuron_value[j] * network->neuron_value[j];
weightChange *= network->neuron_error_value[j] * learning_rate;
weightChange *= network->neuron_value[k];
network->synaptic_weight[synapse_index] -= weightChange;
synapse_index++;
}
// Bias weight of neuron j:
mlp_float weightChange;
weightChange = 1.0 - network->neuron_value[j] * network->neuron_value[j];
weightChange *= network->neuron_error_value[j] * learning_rate;
network->synaptic_weight[synapse_index] -= weightChange;
synapse_index++;
}
}
}
/*
 * Copy the input_layer_size values currently held by the input layer into
 * vector. Does nothing when vector is NULL.
 */
void get_mlp_inputs (mlp *network, mlp_float *vector) {
    int pos;
    if (vector == NULL) return;
    for (pos = 0; pos < network->input_layer_size; pos++) {
        vector[pos] = network->input_neuron[pos];
    }
}
最佳答案
关于循环链接 (recurrent links) 的计算,我终于找到了一份文档。如果我理解正确,两个神经元之间的循环链接 N1<-N2 应按以下方式计算:
(value of N1) += (previous value of N2) * (weight of link N1<-N2)
No error backpropagation through recurrent links
(new weight) = (old weight) - derivative(value of N1) * (error of N1) * (previous value of N2) * learning_rate
另外,原代码对输入神经元的值也应用了 tanh,但输入神经元的值不应被改变。
#include <stdio.h>
#include <time.h>
#include <math.h>
#include <malloc.h>
#include <stdlib.h>
#include "mlp.h"
/*
 * One neuron of the recurrent network.
 * Incoming links are stored on the receiving neuron: synapsesin[j] is the
 * source neuron of link j and weight[j] is the weight of that link.
 */
typedef struct _neuron {
    int layer;                    /* 0-based index of the layer this neuron belongs to */
    double *weight;               /* table of weights for incoming synapses */
    int nbsynapsesin;             /* number of incoming synapses */
    struct _neuron **synapsesin;  /* table of pointers to the neurons the
                                     synapses are coming from */
    double bias;
    double value;                 /* value from the latest forward pass (rnnset) */
    double value_prev;            /* snapshot taken by rnnsetstart() */
    double error;                 /* error from the latest rnnlearn() call */
    double error_prev;            /* copy of error made at the end of rnnlearn() */
} NEURON;
/* A whole network: every neuron lives in one array, ordered layer by layer. */
typedef struct _rnn {
    int *layersize;  /* [0] = number of layers, [1..] = neurons in each layer */
    int nbneurons;   /* number of entries in n */
    NEURON *n;       /* neuron table */
} RNN;
/* Topology description consumed by creaternn(). */
typedef struct _config {
    int nbneurons;   /* total neuron count over all layers */
    int *layersize;  /* [0] = number of layers, [1..] = neurons in each layer */
    int nbsynapses;  /* number of links, forward and recurrent together */
    int *synapses;   /* 2*nbsynapses ints: (source index, target index) pairs */
} CONFIG;
/*
 * Build the topology of a layered network in which every pair of neurons in
 * adjacent layers is joined by one forward link and one recurrent (backward)
 * link.
 *
 * layersize: layersize[0] is the number of layers, layersize[1..] the number
 *            of neurons in each layer. The table is copied.
 * Returns a CONFIG to release with freeconfig(), or NULL if layersize is NULL
 * or an allocation fails.
 */
CONFIG * createconfig(int * layersize) {
    int i, j, l;

    if (layersize == NULL) return NULL;
    const int nblayers = layersize[0];

    CONFIG *conf = malloc(sizeof *conf);
    if (conf == NULL) return NULL;

    conf->nbneurons = 0;
    for (i = 1; i <= nblayers; i++) conf->nbneurons += layersize[i];

    // Compute the number of synapses: one forward and one recurrent link per
    // pair of adjacent-layer neurons.
    conf->nbsynapses = 0;
    for (i = 1; i < nblayers; i++) conf->nbsynapses += layersize[i] * layersize[i+1];
    conf->nbsynapses *= 2;

    // Allocate the layer table and the table of synapses:
    conf->layersize = malloc((size_t)(nblayers + 1) * sizeof *conf->layersize);
    conf->synapses = malloc(2 * (size_t)conf->nbsynapses * sizeof *conf->synapses);
    // malloc(0) may legitimately return NULL when there are no links at all.
    if (conf->layersize == NULL || (conf->synapses == NULL && conf->nbsynapses > 0)) {
        free(conf->synapses);
        free(conf->layersize);
        free(conf);
        return NULL;
    }
    for (i = 0; i <= nblayers; i++) conf->layersize[i] = layersize[i];

    // Creation of the synapses as (source, target) pairs; neurons are
    // numbered layer after layer.
    int k = 0;      // write position in conf->synapses
    int lower = 0;  // index of the first neuron of layer i
    int upper = 0;  // index of the first neuron of layer i+1
    for (i = 1; i < nblayers; i++) {
        upper += layersize[i];
        for (j = 0; j < layersize[i]; j++) {
            for (l = 0; l < layersize[i+1]; l++) {
                // forward link/synapse:
                conf->synapses[k++] = lower + j;
                conf->synapses[k++] = upper + l;
                // Recurrent link/synapse:
                conf->synapses[k++] = upper + l;
                conf->synapses[k++] = lower + j;
            }
        }
        lower += layersize[i];
    }
    return conf;
}
/*
 * Release a CONFIG returned by createconfig() together with its tables.
 * Passing NULL is a no-op, mirroring free().
 */
void freeconfig(CONFIG* conf) {
    if (conf == NULL) return;
    free(conf->synapses);
    free(conf->layersize);
    free(conf);
}
/*
 * Instantiate a network from a topology description.
 *
 * Everything needed is copied out of conf, so conf may be freed afterwards.
 * Weights and biases are drawn with rand() from about [-0.5, 0.5]; values and
 * errors start at 0.
 *
 * Returns a network to release with freernn(), or NULL if conf is NULL or an
 * allocation fails (nothing is leaked in that case).
 */
RNN * creaternn(CONFIG * conf) {
    int i, j, s;

    if (conf == NULL) return NULL;
    RNN *net = malloc(sizeof *net);
    if (net == NULL) return NULL;

    const int nblayers = conf->layersize[0];
    net->nbneurons = conf->nbneurons;
    // Allocate the layer table and the neuron table of the network:
    net->layersize = malloc((size_t)(nblayers + 1) * sizeof *net->layersize);
    net->n = malloc((size_t)conf->nbneurons * sizeof *net->n);
    if (net->layersize == NULL || (net->n == NULL && conf->nbneurons > 0)) {
        free(net->n);
        free(net->layersize);
        free(net);
        return NULL;
    }
    for (i = 0; i <= nblayers; i++) net->layersize[i] = conf->layersize[i];

    // Assign each neuron to its layer; neurons are numbered layer after layer.
    int layer = 0, remaining = 0;
    for (i = 0; i < net->nbneurons; i++) {
        NEURON *ni = &net->n[i];
        if (remaining == 0) { remaining = conf->layersize[layer + 1]; layer++; }
        remaining--;
        ni->layer = layer - 1;
        ni->nbsynapsesin = 0;
        // NULL until allocated so that the failure path can free blindly.
        ni->weight = NULL;
        ni->synapsesin = NULL;
    }

    // Count the incoming synapses for each neuron (second int of each pair):
    for (s = 0; s < conf->nbsynapses; s++) net->n[conf->synapses[2*s + 1]].nbsynapsesin++;

    // Allocate the weight table and the table of source-neuron pointers, then
    // reset the counter: it is reused below as the fill position while linking.
    int failed = 0;
    for (i = 0; i < net->nbneurons && !failed; i++) {
        NEURON *ni = &net->n[i];
        const size_t count = (size_t)ni->nbsynapsesin;
        ni->weight = malloc(count * sizeof *ni->weight);
        ni->synapsesin = malloc(count * sizeof *ni->synapsesin);
        failed = count > 0 && (ni->weight == NULL || ni->synapsesin == NULL);
        ni->nbsynapsesin = 0;
    }
    if (failed) {
        for (i = 0; i < net->nbneurons; i++) {
            free(net->n[i].weight);
            free(net->n[i].synapsesin);
        }
        free(net->n);
        free(net->layersize);
        free(net);
        return NULL;
    }

    // Link the incoming synapses with the neurons:
    for (s = 0; s < conf->nbsynapses; s++) {
        NEURON *src = &net->n[conf->synapses[2*s]];
        NEURON *dst = &net->n[conf->synapses[2*s + 1]];
        dst->synapsesin[dst->nbsynapsesin++] = src;
    }

    // Initialization of the values, errors, and weights:
    for (i = 0; i < net->nbneurons; i++) {
        NEURON *ni = &net->n[i];
        for (j = 0; j < ni->nbsynapsesin; j++) {
            ni->weight[j] = 1.0 * (double)rand() / RAND_MAX - 1.0/2;
        }
        ni->bias = 1.0 * (double)rand() / RAND_MAX - 1.0/2;
        ni->value = 0.0;
        ni->value_prev = 0.0;
        ni->error_prev = 0.0;
        ni->error = 0.0;
    }
    return net;
}
/*
 * Release a network returned by creaternn(), including the per-neuron tables.
 * Passing NULL is a no-op, mirroring free().
 */
void freernn(RNN * net) {
    int i;
    if (net == NULL) return;
    if (net->n != NULL) {
        for (i = 0; i < net->nbneurons; i++) {
            free(net->n[i].weight);
            free(net->n[i].synapsesin);
        }
    }
    free(net->n);
    free(net->layersize);
    free(net);
}
/*
 * Store the output of the network in the table "out".
 * The outputs are written in reverse neuron order: out[0] receives the value
 * of the last neuron of the network.
 */
void rnnget(RNN * net, double * out) {
    const int nboutputs = net->layersize[net->layersize[0]];
    int pos;
    for (pos = 0; pos < nboutputs; pos++) {
        out[pos] = net->n[net->nbneurons - 1 - pos].value;
    }
}
/*
 * Snapshot the current value of every neuron into value_prev.
 * Output neurons are not squashed by the forward pass, so their snapshot is
 * tanh(value); every other neuron is copied as is.
 */
void rnnsetstart(RNN * net) {
    int idx = 0;
    while (idx < net->nbneurons) {
        NEURON *cur = &(net->n[idx]);
        const int is_output = (cur->layer == net->layersize[0]-1);
        cur->value_prev = is_output ? tanh(cur->value) : cur->value;
        idx++;
    }
}
/*
 * Forward pass with recurrent links enabled.
 *
 * in: one value per neuron of the first layer.
 *
 * Input neurons take the caller's value unchanged. Every other neuron starts
 * from its bias and adds one contribution per incoming synapse: the source's
 * current value for a forward link, its value_prev for a recurrent link.
 * Hidden neurons are then squashed with tanh; output neurons stay linear.
 */
void rnnset(RNN * net, double * in) {
    int idx, s;
    for (idx = 0; idx < net->nbneurons; idx++) {
        NEURON *dst = &(net->n[idx]);
        const int lastlayer = net->layersize[0] - 1;
        const int is_input = (idx < net->layersize[1]);

        dst->value = is_input ? in[idx] : dst->bias;

        if (!is_input) {
            for (s = 0; s < dst->nbsynapsesin; s++) {
                const NEURON *src = dst->synapsesin[s];
                double contribution;
                if (src->layer == 0 && dst->layer == lastlayer) {
                    /* link from the input layer straight into the output layer */
                    contribution = tanh(src->value_prev);
                } else if (dst->layer > src->layer) {
                    /* forward link */
                    contribution = src->value;
                } else {
                    /* recurrent link */
                    contribution = src->value_prev;
                }
                dst->value += contribution * dst->weight[s];
            }
        }

        /* Neither the input layer nor the output layer is squashed. */
        if (dst->layer != 0 && dst->layer != lastlayer) dst->value = tanh(dst->value);
    }
}
/*
 * Clear the remembered state (error_prev and value_prev) of every neuron
 * before a new training cycle.
 */
void rnnlearnstart(RNN * net) {
    int idx = 0;
    while (idx < net->nbneurons) {
        NEURON *cur = &net->n[idx];
        cur->error_prev = 0.0;
        cur->value_prev = 0.0;
        idx++;
    }
}
/*
 * One gradient step towards the target values, using the state left by the
 * latest forward pass. No error is propagated through recurrent links, but
 * their weights are trained from the source's value_prev.
 *
 * out:          target values, in the same reverse neuron order as rnnget()
 *               produces (out[0] belongs to the last neuron).
 * learningrate: factor applied to every weight and bias change.
 */
void rnnlearn(RNN * net, double * out, double learningrate) {
    int i, j;
    int target = 0;
    const int lastlayer = net->layersize[0] - 1;
    const int nboutputs = net->layersize[net->layersize[0]];

    /* Clear the error of the trailing nboutputs neurons. */
    for (i = net->nbneurons - nboutputs; i < net->nbneurons; i++) net->n[i].error = 0.0;

    /* Output error = value - target; every other neuron restarts from 0.
     * Walking backwards makes `target` count in reverse neuron order. */
    for (i = net->nbneurons - 1; i >= 0; i--) {
        NEURON *cur = &(net->n[i]);
        if (cur->layer != lastlayer) {
            cur->error = 0.0;
            continue;
        }
        cur->error += cur->value - out[target];
        target++;
    }

    /* Push errors back along forward links only. Going from the last neuron
     * to the first, a layer is complete before it feeds the one below. */
    for (i = net->nbneurons - 1; i >= 0; i--) {
        NEURON *cur = &(net->n[i]);
        for (j = 0; j < cur->nbsynapsesin; j++) {
            NEURON *src = cur->synapsesin[j];
            if (src->layer < cur->layer) src->error += cur->error * cur->weight[j];
        }
    }

    /* Update weights and biases. */
    for (i = 0; i < net->nbneurons; i++) {
        NEURON *cur = &(net->n[i]);
        const int is_output = (cur->layer == lastlayer);
        double step;

        if (is_output) {
            /* linear output: no derivative factor */
            step = cur->error * learningrate;
        } else {
            /* tanh'(x) expressed through the neuron's value */
            step = 1.0 - cur->value * cur->value;
            step *= cur->error * learningrate;
        }

        for (j = 0; j < cur->nbsynapsesin; j++) {
            const NEURON *src = cur->synapsesin[j];
            double wchange = step;
            /* forward link: current value; recurrent link: previous value */
            wchange *= (cur->layer > src->layer) ? src->value : src->value_prev;
            cur->weight[j] -= wchange;
            if (is_output) {
                /* only output-layer weights are clamped */
                if (cur->weight[j] > 5) cur->weight[j] = 5;
                if (cur->weight[j] < -5) cur->weight[j] = -5;
            }
        }

        cur->bias -= step;
        if (is_output) {
            if (cur->bias > 5) cur->bias = 5;
            if (cur->bias < -5) cur->bias = -5;
        }
    }

    /* Remember this step's errors. */
    for (i = 0; i < net->nbneurons; i++) net->n[i].error_prev = net->n[i].error;
}
/*
 * Trains a plain MLP and the recurrent network on y = x*x for x in [0, 1),
 * then prints the RMS error of each network over 10000 random samples.
 * Training stops once the RMS error over 100 samples drops to 0.005 or after
 * 1000 cycles of 100 learning steps.
 */
int main() {
    /* Seed once: re-seeding with the same second after create_mlp() would
     * replay the random stream already used for the MLP weights. */
    srand((unsigned)time(NULL));
    int layersize[] = {1, 25, 12, 1};
    int layersize_netrnn[] = { 4, 1, 25, 12, 1 };
    mlp * netmlp = create_mlp (4, layersize);
    CONFIG * configrnn = createconfig(layersize_netrnn);
    RNN * netrnn = (configrnn != NULL) ? creaternn(configrnn) : NULL;
    if (netmlp == NULL || configrnn == NULL || netrnn == NULL) {
        /* The process exits right away, so partial allocations are not freed. */
        fprintf(stderr, "network allocation failed\n");
        return EXIT_FAILURE;
    }

    double inc, outc, desired_out;
    double global_error = 1;
    double global_error2 = 1;
    int iter, k, i1 = 0, i2 = 0;

    //////////////////////////////////////////////////////
    // Training of the Multi-Layer Perceptron:
    //////////////////////////////////////////////////////
    while (global_error > 0.005 && i1 < 1000) {
        for (iter = 0; iter < 100; iter++) {
            inc = 1.0*rand()/(RAND_MAX+1.0);
            outc = inc*inc;
            set_mlp(netmlp, &inc);
            learn_mlp(netmlp, &outc, 0.03);
        }
        global_error = 0;
        for (k = 0; k < 100; k++) {
            inc = 1.0*rand()/(RAND_MAX+1.0);
            desired_out = inc*inc;
            set_mlp(netmlp, &inc);
            get_mlp(netmlp, &outc);
            global_error += (desired_out - outc)*(desired_out - outc);
        }
        global_error /= 100;
        global_error = sqrt(global_error);
        i1++;
    }

    //////////////////////////////////////////////////////
    // Training of the Recurrent Neural Network:
    //////////////////////////////////////////////////////
    while (global_error2 > 0.005 && i2 < 1000) {
        rnnlearnstart(netrnn);
        for (iter = 0; iter < 100; iter++) {
            inc = 1.0*rand()/(RAND_MAX+1.0);
            outc = inc*inc;
            rnnsetstart(netrnn);
            rnnset(netrnn, &inc);
            rnnlearn(netrnn, &outc, 0.03);
        }
        global_error2 = 0;
        for (k = 0; k < 100; k++) {
            inc = 1.0*rand()/(RAND_MAX+1.0);
            desired_out = inc*inc;
            rnnsetstart(netrnn);
            rnnset(netrnn, &inc);
            rnnget(netrnn, &outc);
            global_error2 += (desired_out - outc)*(desired_out - outc);
        }
        global_error2 /= 100;
        global_error2 = sqrt(global_error2);
        /* Only NaN/inf mean the network diverged. isnormal() is also false for
         * 0 and subnormals, which would turn a perfect score into a failure. */
        if (!isfinite(global_error2)) global_error2 = 100;
        i2++;
    }

    //////////////////////////////////////////////////////
    // Test of performance for the both networks:
    //////////////////////////////////////////////////////
    global_error = 0;
    global_error2 = 0;
    for (k = 0; k < 10000; k++) {
        inc = 1.0*rand()/(RAND_MAX+1.0);
        desired_out = inc*inc;
        rnnsetstart(netrnn);
        rnnset(netrnn, &inc);
        rnnget(netrnn, &outc);
        global_error2 += (desired_out - outc)*(desired_out - outc);
        set_mlp(netmlp, &inc);
        get_mlp(netmlp, &outc);
        global_error += (desired_out - outc)*(desired_out - outc);
    }
    global_error /= 10000;
    global_error = sqrt(global_error);
    printf("\n MLP: Training cycles: %5d Error: %f",i1,global_error);
    global_error2 /= 10000;
    global_error2 = sqrt(global_error2);
    printf("\n RNN: Training cycles: %5d Error: %f",i2,global_error2);

    free_mlp(netmlp);
    freeconfig(configrnn);
    freernn(netrnn);
    return 0;
}
关于c - 循环神经网络实现,我们在Stack Overflow上找到一个类似的问题: https://stackoverflow.com/questions/39910695/
#include using namespace std; class C{ private: int value; public: C(){ value = 0;
这个问题已经有答案了: What is the difference between char a[] = ?string?; and char *p = ?string?;? (8 个回答) 已关闭
关闭。此题需要details or clarity 。目前不接受答案。 想要改进这个问题吗?通过 editing this post 添加详细信息并澄清问题. 已关闭 7 年前。 此帖子已于 8 个月
除了调试之外,是否有任何针对 c、c++ 或 c# 的测试工具,其工作原理类似于将独立函数复制粘贴到某个文本框,然后在其他文本框中输入参数? 最佳答案 也许您会考虑单元测试。我推荐你谷歌测试和谷歌模拟
我想在第二台显示器中移动一个窗口 (HWND)。问题是我尝试了很多方法,例如将分辨率加倍或输入负值,但它永远无法将窗口放在我的第二台显示器上。 关于如何在 C/C++/c# 中执行此操作的任何线索 最
我正在寻找 C/C++/C## 中不同类型 DES 的现有实现。我的运行平台是Windows XP/Vista/7。 我正在尝试编写一个 C# 程序,它将使用 DES 算法进行加密和解密。我需要一些实
很难说出这里要问什么。这个问题模棱两可、含糊不清、不完整、过于宽泛或夸夸其谈,无法以目前的形式得到合理的回答。如需帮助澄清此问题以便重新打开,visit the help center . 关闭 1
有没有办法强制将另一个 窗口置于顶部? 不是应用程序的窗口,而是另一个已经在系统上运行的窗口。 (Windows, C/C++/C#) 最佳答案 SetWindowPos(that_window_ha
假设您可以在 C/C++ 或 Csharp 之间做出选择,并且您打算在 Windows 和 Linux 服务器上运行同一服务器的多个实例,那么构建套接字服务器应用程序的最明智选择是什么? 最佳答案 如
你们能告诉我它们之间的区别吗? 顺便问一下,有什么叫C++库或C库的吗? 最佳答案 C++ 标准库 和 C 标准库 是 C++ 和 C 标准定义的库,提供给 C++ 和 C 程序使用。那是那些词的共同
下面的测试代码,我将输出信息放在注释中。我使用的是 gcc 4.8.5 和 Centos 7.2。 #include #include class C { public:
很难说出这里问的是什么。这个问题是含糊的、模糊的、不完整的、过于宽泛的或修辞性的,无法以目前的形式得到合理的回答。如需帮助澄清此问题以便重新打开它,visit the help center 。 已关
我的客户将使用名为 annoucement 的结构/类与客户通信。我想我会用 C++ 编写服务器。会有很多不同的类继承annoucement。我的问题是通过网络将这些类发送给客户端 我想也许我应该使用
我在 C# 中有以下函数: public Matrix ConcatDescriptors(IList> descriptors) { int cols = descriptors[0].Co
我有一个项目要编写一个函数来对某些数据执行某些操作。我可以用 C/C++ 编写代码,但我不想与雇主共享该函数的代码。相反,我只想让他有权在他自己的代码中调用该函数。是否可以?我想到了这两种方法 - 在
我使用的是编写糟糕的第 3 方 (C/C++) Api。我从托管代码(C++/CLI)中使用它。有时会出现“访问冲突错误”。这使整个应用程序崩溃。我知道我无法处理这些错误[如果指针访问非法内存位置等,
关闭。这个问题不符合Stack Overflow guidelines .它目前不接受答案。 我们不允许提问寻求书籍、工具、软件库等的推荐。您可以编辑问题,以便用事实和引用来回答。 关闭 7 年前。
已关闭。此问题不符合Stack Overflow guidelines 。目前不接受答案。 要求我们推荐或查找工具、库或最喜欢的场外资源的问题对于 Stack Overflow 来说是偏离主题的,因为
我有一些 C 代码,将使用 P/Invoke 从 C# 调用。我正在尝试为这个 C 函数定义一个 C# 等效项。 SomeData* DoSomething(); struct SomeData {
这个问题已经有答案了: Why are these constructs using pre and post-increment undefined behavior? (14 个回答) 已关闭 6
我是一名优秀的程序员,十分优秀!