[英]std::vector behavior, move and copy
我在空闲时间使用cpp做一个神经网络,以便获得更多有关C ++ 11的经验。 但是我遇到了一些我无法弄清楚自己的问题。
struct neuronsLayer
{
vector<real> ac;
neuronsLayer(int s)
{
std::cout<<"neuronLayer 1"<<std::endl;
ac = vector<real>(s,0.1f);
}
neuronsLayer(const neuronsLayer& nl)
{
std::cout<<"neuronLayer 2"<<std::endl;
ac = vector<real>(nl.ac);
}
neuronsLayer(neuronsLayer&& nl)
{
std::cout<<"neuronLayer 3"<<std::endl;
ac = std::move(nl.ac);
}
neuronsLayer operator=(const neuronsLayer& nl)
{
std::cout<<"neuronLayer 4"<<std::endl;
return neuronsLayer(nl);
}
neuronsLayer(){ std::cout<<"neuronLayer 5"<<std::endl;}
~neuronsLayer(){}
};
这是一个层实现,然后:
struct network
{
vector<neuronsLayer> hiddens;
vector<neuronsConnection> synaps;
real alpha;
//std::initializer_list
network(vector<int> layers)
{
alpha = 1.f;
hiddens = vector<neuronsLayer>();//+2
for(int& l : layers)
{
hiddens.push_back(neuronsLayer(l));
}
synaps = vector<neuronsConnection>();
for(int i = 0 ; i < layers.size() -1 ; i++)
{
synaps.push_back(std::move(neuronsConnection(layers[i],layers[i+1])));
}
}
void forward(vector<real> input)
{
hiddens[0].ac = input;
for (int layer = 0; layer < hiddens.size() -1; ++layer)
{
for(int i = 0 ; i < synaps[layer].x ; i++)
{
for(int j = 0 ; j < synaps[layer].y ; j++)
{
hiddens[layer+1].ac[i] += hiddens[layer].ac[j] * synaps[layer].w[i + synaps[layer].x * j]; //+ activation +biais
}
}
for(int i = 0 ; i < hiddens[layer].ac.size() ; i ++)
hiddens[layer+1].ac[i] = 1.f/(1+exp(-hiddens[layer+1].ac[i]));
}
}
void backward(vector<real> expected)
{
vector<real> error(expected);
for(int i = 0 ; i < error.size(); i ++)
{
error[i] = expected[i] - hiddens[hiddens.size() -1].ac[i];
}
for (int layer = 0; layer < hiddens.size() -1; ++layer)
{
for(int i = 0 ; i < synaps[layer].x ; i++)
{
for(int j = 0 ; j < synaps[layer].y ; j++)
{
real dw = error[i]*(1+2*exp(-hiddens[0].ac[i])/(1+exp(-hiddens[0].ac[i])));
synaps[layer].w[i + synaps[layer].x * j] += dw*alpha;
}
}
}
}
和主要:
int main(int argc, char** argv)
{
vector<int> net = {64,2};
network nn(net);
vector<float> o = {1,0};
vector<float> t = {0,1};
auto rOne = std::bind(std::normal_distribution<float>(6,1), std::default_random_engine{});
auto rTwo = std::bind(std::normal_distribution<float>(3,1), std::default_random_engine{});
auto gOne = [&](){
int x=rOne(),y=rOne();
//while(x=rOne > 8 or x < 0);
//while(y=rOne > 8 or y < 0);
std::vector<real> tbr (64,0);
tbr[x + y*8] = 1.0;
return tbr;
};
auto gTwo = [&](){
int x=rTwo(),y=rTwo();
//while(x=rTwo > 8 or x < 0);
//while(y=rTwo > 8 or y < 0);
std::vector<real> tbr (64,0);
tbr[x + y*8] = 1.0;
return tbr;
};
for(int i = 0 ; i < 5000 ; i++)
{
nn.forward(gOne());
nn.backward(o);
nn.forward(gTwo());
nn.backward(t);
}
我有一个主要问题和两个问题:
1)当执行向后调用时,我在执行过程中收到SEGFAULT,似乎hiddens [0]为空。 因此,我可能(有点轻描淡写)误解了举动的运作方式?
Program received signal SIGSEGV, Segmentation fault.
0x0000000000402159 in network::backward (this=0x7fffffffe190, expected=...) at dnn3.cpp:171
171 real dw = error[i]*(1+2*exp(-hiddens[0].ac[i])/(1+exp( hiddens[0].ac[i])));
(gdb) p i
$1 = 0
(gdb) p hiddens[0].ac[i]
$2 = (__gnu_cxx::__alloc_traits<std::allocator<float> >::value_type &) @0x3f0000003f000000: <error reading variable>
2)在此之前,程序的输出为:
neuronLayer 1
neuronLayer 3
neuronLayer 1
neuronLayer 3
neuronLayer 2
为什么复制构造函数被调用? 我仅创建2层,并且它们都是按照完全相同的过程生成的,并且只有其中之一正在使用此构造函数。 而且我不明白为什么需要它。
3)关于绑定对象rOne和rTwo,它们始终返回相同的值吗? 因为当我戳入gOne输出时,它似乎返回了相同值的两倍。 那正常吗?
在此先感谢Marc。
编辑:按要求:
(gdb) p hiddens
$1 = {<std::_Vector_base<neuronsLayer, std::allocator<neuronsLayer> >> = { _M_impl = {<std::allocator<neuronsLayer>> ={<__gnu_cxx::new_allocator<neuronsLayer>> = {<No data fields>}, <No data fields>},_M_start = 0x60c1a0, _M_finish = 0x60c1d0, _M_end_of_storage = 0x60c1d0}}, <No data fields>}
(gdb) p hiddens[0].ac
$2 = {<std::_Vector_base<float, std::allocator<float> >> = { _M_impl = {<std::allocator<float>> = {<__gnu_cxx::new_allocator<float>> = {<No data fields>}, <No data fields>}, _M_start = 0x3f0000003f000000, _M_finish = 0x3f0000003f000000, _M_end_of_storage = 0x60c2e0}}, <No data fields>}
编辑2:
Breakpoint 1, network::forward (this=0x7fffffffe190, input=...)
(gdb) p hiddens
$1 = {<std::_Vector_base<neuronsLayer, std::allocator<neuronsLayer> >> = {_M_impl = {<std::allocator<neuronsLayer>> = {<__gnu_cxx::new_allocator<neuronsLayer>> = {<No data fields>}, <No data fields>},_M_start = 0x60d1a0, _M_finish = 0x60d1d0, _M_end_of_storage = 0x60d1d0}}, <No data fields>}
(gdb) p hiddens[0]
$2 = (__gnu_cxx::__alloc_traits<std::allocator<neuronsLayer> >::value_type &) @0x60d1a0: { ac = {<std::_Vector_base<float, std::allocator<float> >> = { _M_impl = {<std::allocator<float>> = {<__gnu_cxx::new_allocator<float>> = {<No data fields>}, <No data fields>}, _M_start = 0x60d1e0, _M_finish = 0x60d2e0, _M_end_of_storage = 0x60d2e0}}, <No data fields>}}
(gdb) p hiddens[0].ac
$3 = {<std::_Vector_base<float, std::allocator<float> >> = { _M_impl = {<std::allocator<float>> = {<__gnu_cxx::new_allocator<float>> = {<No data fields>}, <No data fields>}, _M_start = 0x60d1e0, _M_finish = 0x60d2e0, _M_end_of_storage = 0x60d2e0}}, <No data fields>}
(gdb) p hiddens[1]
$4 = (__gnu_cxx::__alloc_traits<std::allocator<neuronsLayer> >::value_type &) @0x60d1b8: { ac = {<std::_Vector_base<float, std::allocator<float> >> = _M_impl = {<std::allocator<float>> = {<__gnu_cxx::new_allocator<float>> = {<No data fields>}, <No data fields>}, _M_start = 0x60d180, _M_finish = 0x60d188, _M_end_of_storage = 0x60d188}}, <No data fields>}}
(gdb) p hiddens[1].ac[0]
$5 = (__gnu_cxx::__alloc_traits<std::allocator<float> >::value_type &) @0x60d180: 0.100000001
(gdb) p hiddens[0].ac[0]
$6 = (__gnu_cxx::__alloc_traits<std::allocator<float> >::value_type &) @0x60d1e0: 0.100000001
neuronsLayer operator=(const neuronsLayer& nl)
{
std::cout<<"neuronLayer 4"<<std::endl;
return neuronsLayer(nl);
}
赋值运算符没有执行您想要的操作。 实际上,它确实根据传入的nl
复制了一个临时neuronsLayer
对象,而不修改其调用者的内容。
它应该是
neuronsLayer& operator=(const neuronsLayer& nl)
{
std::cout<<"neuronLayer 4"<<std::endl;
ac = nl.ac;
return *this;
}
编辑:按要求:
(gdb) p hiddens
$1 = {<std::_Vector_base<neuronsLayer, std::allocator<neuronsLayer> >> = { _M_impl = {<std::allocator<neuronsLayer>> ={<__gnu_cxx::new_allocator<neuronsLayer>> = {<No data fields>}, <No data fields>},_M_start = 0x60c1a0, _M_finish = 0x60c1d0, _M_end_of_storage = 0x60c1d0}}, <No data fields>}
(gdb) p hiddens[0].ac
$2 = {<std::_Vector_base<float, std::allocator<float> >> = { _M_impl = {<std::allocator<float>> = {<__gnu_cxx::new_allocator<float>> = {<No data fields>}, <No data fields>}, _M_start = 0x3f0000003f000000, _M_finish = 0x3f0000003f000000, _M_end_of_storage = 0x60c2e0}}, <No data fields>}
由于hiddens[0].ac
_M_start
等于_M_finish
,因此它为空,因此获取其第0个元素会导致分段错误。
声明:本站的技术帖子网页,遵循CC BY-SA 4.0协议,如果您需要转载,请注明本站网址或者原文地址。任何问题请咨询:yoyou2525@163.com.