I still have this problem in MXNet 1.3.0:
```sh
/data1/zj/crnn.gluon/venv/bin/python /data1/zj/crnn.gluon/dataset.py
50761
Process Process-3:
Corrupt JPEG data: premature end of data segment
Traceback (most recent call last):
File "/usr/lib/python3.5/multiprocessing/process.py", line 249, in _bootstrap
self.run()
File "/usr/lib/python3.5/multiprocessing/process.py", line 93, in run
self._target(*self._args, **self._kwargs)
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/dataloader.py",
line 169, in worker_loop
batch = batchify_fn([dataset[i] for i in samples])
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/dataloader.py",
line 169, in <listcomp>
batch = batchify_fn([dataset[i] for i in samples])
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/dataset.py",
line 131, in __getitem__
item = self._data[idx]
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/vision/datasets.py",
line 257, in __getitem__
record = super(ImageRecordDataset, self).__getitem__(idx)
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/dataset.py",
line 189, in __getitem__
return self._record.read_idx(self._record.keys[idx])
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/recordio.py", line
265, in read_idx
return self.read()
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/recordio.py", line
163, in read
ctypes.byref(size)))
File "/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/base.py",
line 252, in check_call
raise MXNetError(py_str(_LIB.MXGetLastError()))
mxnet.base.MXNetError: [11:35:45] src/recordio.cc:65: Check failed: header[0]
== RecordIOWriter::kMagic Invalid RecordIO File
Stack trace returned 10 entries:
[bt] (0)
/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/libmxnet.so(+0x36bac2)
[0x7f1e38c81ac2]
[bt] (1)
/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/libmxnet.so(+0x36d5f83)
[0x7f1e3bfebf83]
[bt] (2)
/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/libmxnet.so(MXRecordIOReaderReadRecord+0x2a)
[0x7f1e3b7b3bba]
[bt] (3)
/usr/lib/python3.5/lib-dynload/_ctypes.cpython-35m-x86_64-linux-gnu.so(ffi_call_unix64+0x4c)
[0x7f1e59e09e20]
[bt] (4)
/usr/lib/python3.5/lib-dynload/_ctypes.cpython-35m-x86_64-linux-gnu.so(ffi_call+0x2eb)
[0x7f1e59e0988b]
[bt] (5)
/usr/lib/python3.5/lib-dynload/_ctypes.cpython-35m-x86_64-linux-gnu.so(_ctypes_callproc+0x49a)
[0x7f1e59e0401a]
[bt] (6)
/usr/lib/python3.5/lib-dynload/_ctypes.cpython-35m-x86_64-linux-gnu.so(+0x9fcb)
[0x7f1e59df7fcb]
[bt] (7) /data1/zj/crnn.gluon/venv/bin/python(PyObject_Call+0x47) [0x5c1797]
[bt] (8) /data1/zj/crnn.gluon/venv/bin/python(PyEval_EvalFrameEx+0x4ec6)
[0x53bba6]
[bt] (9) /data1/zj/crnn.gluon/venv/bin/python(PyEval_EvalFrameEx+0x4b04)
[0x53b7e4]
Process Process-6:
Process Process-4:
Process Process-5:
Traceback (most recent call last):
File "/usr/lib/python3.5/multiprocessing/process.py", line 249, in _bootstrap
self.run()
File "/usr/lib/python3.5/multiprocessing/process.py", line 93, in run
self._target(*self._args, **self._kwargs)
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/dataloader.py",
line 169, in worker_loop
batch = batchify_fn([dataset[i] for i in samples])
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/dataloader.py",
line 169, in <listcomp>
batch = batchify_fn([dataset[i] for i in samples])
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/dataset.py",
line 131, in __getitem__
item = self._data[idx]
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/vision/datasets.py",
line 257, in __getitem__
record = super(ImageRecordDataset, self).__getitem__(idx)
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/dataset.py",
line 189, in __getitem__
return self._record.read_idx(self._record.keys[idx])
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/recordio.py", line
265, in read_idx
return self.read()
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/recordio.py", line
163, in read
ctypes.byref(size)))
File "/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/base.py",
line 252, in check_call
raise MXNetError(py_str(_LIB.MXGetLastError()))
mxnet.base.MXNetError: [11:35:45] src/recordio.cc:65: Check failed: header[0]
== RecordIOWriter::kMagic Invalid RecordIO File
Stack trace returned 10 entries:
[bt] (0)
/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/libmxnet.so(+0x36bac2)
[0x7f1e38c81ac2]
[bt] (1)
/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/libmxnet.so(+0x36d5f83)
[0x7f1e3bfebf83]
[bt] (2)
/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/libmxnet.so(MXRecordIOReaderReadRecord+0x2a)
[0x7f1e3b7b3bba]
[bt] (3)
/usr/lib/python3.5/lib-dynload/_ctypes.cpython-35m-x86_64-linux-gnu.so(ffi_call_unix64+0x4c)
[0x7f1e59e09e20]
[bt] (4)
/usr/lib/python3.5/lib-dynload/_ctypes.cpython-35m-x86_64-linux-gnu.so(ffi_call+0x2eb)
[0x7f1e59e0988b]
[bt] (5)
/usr/lib/python3.5/lib-dynload/_ctypes.cpython-35m-x86_64-linux-gnu.so(_ctypes_callproc+0x49a)
[0x7f1e59e0401a]
[bt] (6)
/usr/lib/python3.5/lib-dynload/_ctypes.cpython-35m-x86_64-linux-gnu.so(+0x9fcb)
[0x7f1e59df7fcb]
[bt] (7) /data1/zj/crnn.gluon/venv/bin/python(PyObject_Call+0x47) [0x5c1797]
[bt] (8) /data1/zj/crnn.gluon/venv/bin/python(PyEval_EvalFrameEx+0x4ec6)
[0x53bba6]
[bt] (9) /data1/zj/crnn.gluon/venv/bin/python(PyEval_EvalFrameEx+0x4b04)
[0x53b7e4]
Traceback (most recent call last):
Traceback (most recent call last):
File "/usr/lib/python3.5/multiprocessing/process.py", line 249, in _bootstrap
self.run()
File "/usr/lib/python3.5/multiprocessing/process.py", line 249, in _bootstrap
self.run()
File "/usr/lib/python3.5/multiprocessing/process.py", line 93, in run
self._target(*self._args, **self._kwargs)
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/dataloader.py",
line 169, in worker_loop
batch = batchify_fn([dataset[i] for i in samples])
File "/usr/lib/python3.5/multiprocessing/process.py", line 93, in run
self._target(*self._args, **self._kwargs)
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/dataloader.py",
line 169, in <listcomp>
batch = batchify_fn([dataset[i] for i in samples])
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/dataloader.py",
line 169, in worker_loop
batch = batchify_fn([dataset[i] for i in samples])
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/dataset.py",
line 131, in __getitem__
item = self._data[idx]
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/dataloader.py",
line 169, in <listcomp>
batch = batchify_fn([dataset[i] for i in samples])
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/vision/datasets.py",
line 257, in __getitem__
record = super(ImageRecordDataset, self).__getitem__(idx)
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/dataset.py",
line 131, in __getitem__
item = self._data[idx]
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/dataset.py",
line 189, in __getitem__
return self._record.read_idx(self._record.keys[idx])
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/vision/datasets.py",
line 257, in __getitem__
record = super(ImageRecordDataset, self).__getitem__(idx)
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/recordio.py", line
265, in read_idx
return self.read()
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/dataset.py",
line 189, in __getitem__
return self._record.read_idx(self._record.keys[idx])
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/recordio.py", line
163, in read
ctypes.byref(size)))
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/recordio.py", line
265, in read_idx
return self.read()
File "/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/base.py",
line 252, in check_call
raise MXNetError(py_str(_LIB.MXGetLastError()))
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/recordio.py", line
163, in read
ctypes.byref(size)))
File "/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/base.py",
line 252, in check_call
raise MXNetError(py_str(_LIB.MXGetLastError()))
mxnet.base.MXNetError: [11:35:45] src/recordio.cc:65: Check failed: header[0]
== RecordIOWriter::kMagic Invalid RecordIO File
Stack trace returned 10 entries:
[bt] (0)
/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/libmxnet.so(+0x36bac2)
[0x7f1e38c81ac2]
[bt] (1)
/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/libmxnet.so(+0x36d5f83)
[0x7f1e3bfebf83]
[bt] (2)
/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/libmxnet.so(MXRecordIOReaderReadRecord+0x2a)
[0x7f1e3b7b3bba]
[bt] (3)
/usr/lib/python3.5/lib-dynload/_ctypes.cpython-35m-x86_64-linux-gnu.so(ffi_call_unix64+0x4c)
[0x7f1e59e09e20]
[bt] (4)
/usr/lib/python3.5/lib-dynload/_ctypes.cpython-35m-x86_64-linux-gnu.so(ffi_call+0x2eb)
[0x7f1e59e0988b]
[bt] (5)
/usr/lib/python3.5/lib-dynload/_ctypes.cpython-35m-x86_64-linux-gnu.so(_ctypes_callproc+0x49a)
[0x7f1e59e0401a]
[bt] (6)
/usr/lib/python3.5/lib-dynload/_ctypes.cpython-35m-x86_64-linux-gnu.so(+0x9fcb)
[0x7f1e59df7fcb]
[bt] (7) /data1/zj/crnn.gluon/venv/bin/python(PyObject_Call+0x47) [0x5c1797]
[bt] (8) /data1/zj/crnn.gluon/venv/bin/python(PyEval_EvalFrameEx+0x4ec6)
[0x53bba6]
[bt] (9) /data1/zj/crnn.gluon/venv/bin/python(PyEval_EvalFrameEx+0x4b04)
[0x53b7e4]
mxnet.base.MXNetError: [11:35:45] src/recordio.cc:65: Check failed: header[0]
== RecordIOWriter::kMagic Invalid RecordIO File
Stack trace returned 10 entries:
[bt] (0)
/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/libmxnet.so(+0x36bac2)
[0x7f1e38c81ac2]
[bt] (1)
/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/libmxnet.so(+0x36d5f83)
[0x7f1e3bfebf83]
[bt] (2)
/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/libmxnet.so(MXRecordIOReaderReadRecord+0x2a)
[0x7f1e3b7b3bba]
[bt] (3)
/usr/lib/python3.5/lib-dynload/_ctypes.cpython-35m-x86_64-linux-gnu.so(ffi_call_unix64+0x4c)
[0x7f1e59e09e20]
[bt] (4)
/usr/lib/python3.5/lib-dynload/_ctypes.cpython-35m-x86_64-linux-gnu.so(ffi_call+0x2eb)
[0x7f1e59e0988b]
[bt] (5)
/usr/lib/python3.5/lib-dynload/_ctypes.cpython-35m-x86_64-linux-gnu.so(_ctypes_callproc+0x49a)
[0x7f1e59e0401a]
[bt] (6)
/usr/lib/python3.5/lib-dynload/_ctypes.cpython-35m-x86_64-linux-gnu.so(+0x9fcb)
[0x7f1e59df7fcb]
[bt] (7) /data1/zj/crnn.gluon/venv/bin/python(PyObject_Call+0x47) [0x5c1797]
[bt] (8) /data1/zj/crnn.gluon/venv/bin/python(PyEval_EvalFrameEx+0x4ec6)
[0x53bba6]
[bt] (9) /data1/zj/crnn.gluon/venv/bin/python(PyEval_EvalFrameEx+0x4b04)
[0x53b7e4]
Corrupt JPEG data: premature end of data segment
Traceback (most recent call last):
File "/data1/zj/crnn.gluon/dataset.py", line 148, in <module>
Process Process-2:
for i, (img, label) in enumerate(data_loader):
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/dataloader.py",
line 242, in __next__
if self._rcvd_idx in self._data_buffer:
KeyboardInterrupt
Traceback (most recent call last):
File "/usr/lib/python3.5/multiprocessing/process.py", line 249, in _bootstrap
self.run()
File "/usr/lib/python3.5/multiprocessing/process.py", line 93, in run
self._target(*self._args, **self._kwargs)
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/dataloader.py",
line 166, in worker_loop
idx, samples = key_queue.get()
File "/usr/lib/python3.5/multiprocessing/queues.py", line 94, in get
res = self._recv_bytes()
File "/usr/lib/python3.5/multiprocessing/connection.py", line 216, in
recv_bytes
buf = self._recv_bytes(maxlength)
File "/usr/lib/python3.5/multiprocessing/connection.py", line 407, in
_recv_bytes
buf = self._recv(4)
File "/usr/lib/python3.5/multiprocessing/connection.py", line 379, in _recv
chunk = read(handle, remaining)
KeyboardInterrupt
Exception in thread Thread-1:
Traceback (most recent call last):
File "/usr/lib/python3.5/threading.py", line 914, in _bootstrap_inner
self.run()
File "/usr/lib/python3.5/threading.py", line 862, in run
self._target(*self._args, **self._kwargs)
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/dataloader.py",
line 175, in fetcher_loop
idx, batch = data_queue.get()
File "/usr/lib/python3.5/multiprocessing/queues.py", line 345, in get
return ForkingPickler.loads(res)
File
"/data1/zj/crnn.gluon/venv/lib/python3.5/site-packages/mxnet/gluon/data/dataloader.py",
line 56, in rebuild_ndarray
fd = fd.detach()
File "/usr/lib/python3.5/multiprocessing/resource_sharer.py", line 57, in
detach
with _resource_sharer.get_connection(self._id) as conn:
File "/usr/lib/python3.5/multiprocessing/resource_sharer.py", line 87, in
get_connection
c = Client(address, authkey=process.current_process().authkey)
File "/usr/lib/python3.5/multiprocessing/connection.py", line 487, in Client
c = SocketClient(address)
File "/usr/lib/python3.5/multiprocessing/connection.py", line 614, in
SocketClient
s.connect(address)
FileNotFoundError: [Errno 2] No such file or directory
Process finished with exit code 1
```
The code is:
```python
import time

from mxnet.gluon.data import DataLoader
from mxnet.gluon.data.vision.datasets import ImageRecordDataset
from mxnet.gluon.data.vision.transforms import ToTensor

# Minimal reproduction: iterate a RecordIO-backed image dataset through a
# DataLoader configured with batch size 1, shuffling, and 6 workers.
dataset = ImageRecordDataset('/data1/zj/data/crnn/txt/val.rec')
data_loader = DataLoader(dataset.transform_first(ToTensor()), 1, shuffle=True,
                         num_workers=6)
print(len(dataset))

start = time.time()
for i, (img, label) in enumerate(data_loader):
    # Every 10th batch, print the elapsed time and restart the timer.
    if (i + 1) % 10 == 0:
        print(time.time() - start)
        start = time.time()
```
[ Full content available at:
https://github.com/apache/incubator-mxnet/issues/9974 ]
This message was relayed via gitbox.apache.org for [email protected]