Exception in main training loop: NaN is detected on forward computation of LinearFunction
Traceback (most recent call last):
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/trainer.py", line 299, in run
update()
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/updater.py", line 223, in update
self.update_core()
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/updater.py", line 234, in update_core
optimizer.update(loss_func, *in_arrays)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainermn/optimizers.py", line 20, in update
loss = lossfun(*args, **kwds)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/links/model/classifier.py", line 114, in __call__
self.y = self.predictor(*args, **kwargs)
File "examples/mnist/train_mnist.py", line 27, in __call__
h1 = F.relu(self.l1(x))
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/links/connection/linear.py", line 129, in __call__
return linear.linear(x, self.W, self.b)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/functions/connection/linear.py", line 175, in linear
y, = LinearFunction().apply(args)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/function_node.py", line 258, in apply
raise RuntimeError(msg)
Will finalize trainer extensions and updater before reraising the exception.
Exception in main training loop: NaN is detected on forward computation of LinearFunction
Traceback (most recent call last):
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/trainer.py", line 299, in run
update()
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/updater.py", line 223, in update
self.update_core()
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/updater.py", line 234, in update_core
optimizer.update(loss_func, *in_arrays)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainermn/optimizers.py", line 20, in update
loss = lossfun(*args, **kwds)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/links/model/classifier.py", line 114, in __call__
self.y = self.predictor(*args, **kwargs)
File "examples/mnist/train_mnist.py", line 27, in __call__
h1 = F.relu(self.l1(x))
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/links/connection/linear.py", line 129, in __call__
return linear.linear(x, self.W, self.b)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/functions/connection/linear.py", line 175, in linear
y, = LinearFunction().apply(args)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/function_node.py", line 258, in apply
raise RuntimeError(msg)
Will finalize trainer extensions and updater before reraising the exception.
Exception in main training loop: NaN is detected on forward computation of LinearFunction
Traceback (most recent call last):
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/trainer.py", line 299, in run
update()
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/updater.py", line 223, in update
self.update_core()
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/updater.py", line 234, in update_core
optimizer.update(loss_func, *in_arrays)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainermn/optimizers.py", line 20, in update
loss = lossfun(*args, **kwds)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/links/model/classifier.py", line 114, in __call__
self.y = self.predictor(*args, **kwargs)
File "examples/mnist/train_mnist.py", line 27, in __call__
h1 = F.relu(self.l1(x))
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/links/connection/linear.py", line 129, in __call__
return linear.linear(x, self.W, self.b)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/functions/connection/linear.py", line 175, in linear
y, = LinearFunction().apply(args)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/function_node.py", line 258, in apply
raise RuntimeError(msg)
Will finalize trainer extensions and updater before reraising the exception.
Traceback (most recent call last):
File "examples/mnist/train_mnist.py", line 124, in <module>
main()
File "examples/mnist/train_mnist.py", line 120, in main
trainer.run()
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/trainer.py", line 313, in run
six.reraise(*sys.exc_info())
File "/home/user/anaconda3/lib/python3.6/site-packages/six.py", line 693, in reraise
raise value
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/trainer.py", line 299, in run
update()
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/updater.py", line 223, in update
self.update_core()
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/updater.py", line 234, in update_core
optimizer.update(loss_func, *in_arrays)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainermn/optimizers.py", line 20, in update
loss = lossfun(*args, **kwds)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/links/model/classifier.py", line 114, in __call__
self.y = self.predictor(*args, **kwargs)
File "examples/mnist/train_mnist.py", line 27, in __call__
h1 = F.relu(self.l1(x))
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/links/connection/linear.py", line 129, in __call__
return linear.linear(x, self.W, self.b)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/functions/connection/linear.py", line 175, in linear
y, = LinearFunction().apply(args)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/function_node.py", line 258, in apply
raise RuntimeError(msg)
RuntimeError: NaN is detected on forward computation of LinearFunction
Exception in main training loop: NaN is detected on forward computation of LinearFunction
Traceback (most recent call last):
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/trainer.py", line 299, in run
update()
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/updater.py", line 223, in update
self.update_core()
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/updater.py", line 234, in update_core
optimizer.update(loss_func, *in_arrays)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainermn/optimizers.py", line 20, in update
loss = lossfun(*args, **kwds)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/links/model/classifier.py", line 114, in __call__
self.y = self.predictor(*args, **kwargs)
File "examples/mnist/train_mnist.py", line 27, in __call__
h1 = F.relu(self.l1(x))
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/links/connection/linear.py", line 129, in __call__
return linear.linear(x, self.W, self.b)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/functions/connection/linear.py", line 175, in linear
y, = LinearFunction().apply(args)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/function_node.py", line 258, in apply
raise RuntimeError(msg)
Will finalize trainer extensions and updater before reraising the exception.
Traceback (most recent call last):
File "examples/mnist/train_mnist.py", line 124, in <module>
main()
File "examples/mnist/train_mnist.py", line 120, in main
trainer.run()
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/trainer.py", line 313, in run
six.reraise(*sys.exc_info())
File "/home/user/anaconda3/lib/python3.6/site-packages/six.py", line 693, in reraise
raise value
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/trainer.py", line 299, in run
update()
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/updater.py", line 223, in update
self.update_core()
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/updater.py", line 234, in update_core
optimizer.update(loss_func, *in_arrays)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainermn/optimizers.py", line 20, in update
loss = lossfun(*args, **kwds)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/links/model/classifier.py", line 114, in __call__
self.y = self.predictor(*args, **kwargs)
File "examples/mnist/train_mnist.py", line 27, in __call__
h1 = F.relu(self.l1(x))
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/links/connection/linear.py", line 129, in __call__
return linear.linear(x, self.W, self.b)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/functions/connection/linear.py", line 175, in linear
y, = LinearFunction().apply(args)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/function_node.py", line 258, in apply
raise RuntimeError(msg)
RuntimeError: NaN is detected on forward computation of LinearFunction
Traceback (most recent call last):
File "examples/mnist/train_mnist.py", line 124, in <module>
main()
File "examples/mnist/train_mnist.py", line 120, in main
trainer.run()
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/trainer.py", line 313, in run
six.reraise(*sys.exc_info())
File "/home/user/anaconda3/lib/python3.6/site-packages/six.py", line 693, in reraise
raise value
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/trainer.py", line 299, in run
update()
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/updater.py", line 223, in update
self.update_core()
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/updater.py", line 234, in update_core
optimizer.update(loss_func, *in_arrays)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainermn/optimizers.py", line 20, in update
loss = lossfun(*args, **kwds)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/links/model/classifier.py", line 114, in __call__
self.y = self.predictor(*args, **kwargs)
File "examples/mnist/train_mnist.py", line 27, in __call__
h1 = F.relu(self.l1(x))
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/links/connection/linear.py", line 129, in __call__
return linear.linear(x, self.W, self.b)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/functions/connection/linear.py", line 175, in linear
y, = LinearFunction().apply(args)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/function_node.py", line 258, in apply
raise RuntimeError(msg)
RuntimeError: NaN is detected on forward computation of LinearFunction
Traceback (most recent call last):
File "examples/mnist/train_mnist.py", line 124, in <module>
main()
File "examples/mnist/train_mnist.py", line 120, in main
trainer.run()
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/trainer.py", line 313, in run
six.reraise(*sys.exc_info())
File "/home/user/anaconda3/lib/python3.6/site-packages/six.py", line 693, in reraise
raise value
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/trainer.py", line 299, in run
update()
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/updater.py", line 223, in update
self.update_core()
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/training/updater.py", line 234, in update_core
optimizer.update(loss_func, *in_arrays)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainermn/optimizers.py", line 20, in update
loss = lossfun(*args, **kwds)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/links/model/classifier.py", line 114, in __call__
self.y = self.predictor(*args, **kwargs)
File "examples/mnist/train_mnist.py", line 27, in __call__
h1 = F.relu(self.l1(x))
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/links/connection/linear.py", line 129, in __call__
return linear.linear(x, self.W, self.b)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/functions/connection/linear.py", line 175, in linear
y, = LinearFunction().apply(args)
File "/home/user/anaconda3/lib/python3.6/site-packages/chainer/function_node.py", line 258, in apply
raise RuntimeError(msg)
RuntimeError: NaN is detected on forward computation of LinearFunction
-------------------------------------------------------
Primary job terminated normally, but 1 process returned
a non-zero exit code.. Per user-direction, the job has been aborted.
-------------------------------------------------------
--------------------------------------------------------------------------
mpiexec detected that one or more processes exited with non-zero status, thus causing
the job to be terminated. The first process to do so was:
Process name: [[4540,1],1]
Exit code: 1
--------------------------------------------------------------------------