When I train a Transformer model with OpenNMT-py (PyTorch), the following error occurs.
Error:
Process SpawnProcess-9:
Traceback (most recent call last):
File “/usr/lib/python3.6/multiprocessing/process.py”, line 258, in _bootstrap
self.run()
File “/usr/lib/python3.6/multiprocessing/process.py”, line 93, in run
self._target(*self._args, **self._kwargs)
File “/data/home/chanjun_park/OpenNMT-py/train.py”, line 127, in batch_producer
q.put(b, False)
File “/usr/lib/python3.6/multiprocessing/queues.py”, line 83, in put
raise Full
queue.Full
Traceback (most recent call last):
File “…/…/train.py”, line 196, in <module>
main(opt)
File “…/…/train.py”, line 78, in main
p.join()
File “/usr/lib/python3.6/multiprocessing/process.py”, line 124, in join
res = self._popen.wait(timeout)
File “/usr/lib/python3.6/multiprocessing/popen_fork.py”, line 50, in wait
return self.poll(os.WNOHANG if timeout == 0.0 else 0)
File “/usr/lib/python3.6/multiprocessing/popen_fork.py”, line 28, in poll
pid, sts = os.waitpid(self.pid, flag)
File “…/…/train.py”, line 180, in signal_handler
raise Exception(msg)
Exception:

-- Tracebacks above this line can probably
be ignored --

Traceback (most recent call last):
File “/data/home/chanjun_park/OpenNMT-py/train.py”, line 138, in run
single_main(opt, device_id, batch_queue, semaphore)
File “/data/home/chanjun_park/OpenNMT-py/onmt/train_single.py”, line 139, in main
valid_steps=opt.valid_steps)
File “/data/home/chanjun_park/OpenNMT-py/onmt/trainer.py”, line 224, in train
self._accum_batches(train_iter)):
File “/data/home/chanjun_park/OpenNMT-py/onmt/trainer.py”, line 162, in _accum_batches
for batch in iterator:
File “/data/home/chanjun_park/OpenNMT-py/onmt/train_single.py”, line 116, in _train_iter
batch = batch_queue.get()
File “/usr/lib/python3.6/multiprocessing/queues.py”, line 113, in get
return _ForkingPickler.loads(res)
File “/data/home/chanjun_park/.local/lib/python3.6/site-packages/torch/multiprocessing/reductions.py”, line 109, in rebuild_cuda_tensor
event_sync_required)
RuntimeError: CUDA error: unknown error
Does anyone have a solution?