Hi -

I'm trying to use the DGL (Deep Graph Library) DGLDataset API together with the
RAPIDS cuDF (CUDA DataFrame) API, and I am getting this error on `import cudf`:

module 'pyarrow.lib' has no attribute '_CRecordBatchReader'


I wonder whether you see anything obvious in the stack trace that might help me debug this?



Here's the full stack trace:


<ipython-input-5-81f2b1833437> in __init__(self)
     10   """
     11   def __init__(self):
---> 12     super(UserSimsSingleFileDataset, self).__init__(name='UserSimsDataset', verbose=False)
     13
     14   # One quirk of DGLDataset is that process() and __len__ (load, save) are called immediately after super(),

/opt/conda/lib/python3.7/site-packages/dgl/data/dgl_dataset.py in __init__(self, name, url, raw_dir, save_dir, hash_key, force_reload, verbose)
     91             self._save_dir = save_dir
     92
---> 93         self._load()
     94
     95     def download(self):

/opt/conda/lib/python3.7/site-packages/dgl/data/dgl_dataset.py in _load(self)
    176         if not load_flag:
    177             self._download()
--> 178             self.process()
    179             self.save()
    180             if self.verbose:

<ipython-input-5-81f2b1833437> in process(self)
     20
     21     import gcsfs
---> 22     import cudf
     23     self.rows_per_batch = 10000
     24     gs = gcsfs.GCSFileSystem()

/opt/conda/lib/python3.7/site-packages/cudf/__init__.py in <module>
      9 import rmm
     10
---> 11 from cudf import core, datasets, testing
     12 from cudf._version import get_versions
     13 from cudf.api.extensions import (

/opt/conda/lib/python3.7/site-packages/cudf/core/__init__.py in <module>
      1 # Copyright (c) 2018-2020, NVIDIA CORPORATION.
      2
----> 3 from cudf.core import buffer, column, column_accessor, common
      4 from cudf.core.buffer import Buffer
      5 from cudf.core.dataframe import DataFrame, from_pandas, merge

/opt/conda/lib/python3.7/site-packages/cudf/core/column/__init__.py in <module>
      1 # Copyright (c) 2020-2021, NVIDIA CORPORATION.
      2
----> 3 from cudf.core.column.categorical import CategoricalColumn
      4 from cudf.core.column.column import (
      5     ColumnBase,

/opt/conda/lib/python3.7/site-packages/cudf/core/column/categorical.py in <module>
     20
     21 import cudf
---> 22 from cudf import _lib as libcudf
     23 from cudf._lib.scalar import as_device_scalar
     24 from cudf._lib.transform import bools_to_mask

/opt/conda/lib/python3.7/site-packages/cudf/_lib/__init__.py in <module>
      2 import numpy as np
      3
----> 4 from . import (
      5     avro,
      6     binaryop,

cudf/_lib/gpuarrow.pyx in init cudf._lib.gpuarrow()
AttributeError: module 'pyarrow.lib' has no attribute '_CRecordBatchReader'

Reply via email to