raulcd opened a new issue, #47051: URL: https://github.com/apache/arrow/issues/47051
### Describe the bug, including details regarding any error messages, version, and platform. There are several Python tests failing on [the verify-rc-source-windows job](https://github.com/ursacomputing/crossbow/actions/runs/16185190432/job/45689333538). This is a follow-up to the issue: - https://github.com/apache/arrow/issues/47033 It is opened as a separate issue because it is unrelated to the original issue, which has been fixed. As seen on the original issue, these failures started when the following changes were merged: https://github.com/apache/arrow/compare/6822857775bafc765b9e75a09e0b7470ce1a957b...3dd8b66f0cd78182c3effeab2c140e6418c3e754 See a trimmed log of the failures: <details> ``` ================================== FAILURES =================================== __________________________ test_set_write_batch_size __________________________ .... C:\tmp\arrow-verify-release\conda-env\lib\site-packages\pandas\_testing\asserters.py:690: AssertionError _____________________ test_parquet_incremental_file_build _____________________ tempdir = WindowsPath('C:/Users/runneradmin/AppData/Local/Temp/pytest-of-runneradmin/pytest-0/test_parquet_incremental_file_0') @pytest.mark.pandas def test_parquet_incremental_file_build(tempdir): df = _test_dataframe(100) df['unique_id'] = 0 arrow_table = pa.Table.from_pandas(df, preserve_index=False) out = pa.BufferOutputStream() writer = pq.ParquetWriter(out, arrow_table.schema, version='2.6') frames = [] for i in range(10): df['unique_id'] = i arrow_table = pa.Table.from_pandas(df, preserve_index=False) writer.write_table(arrow_table) frames.append(df.copy()) writer.close() buf = out.getvalue() result = _read_table(pa.BufferReader(buf)) expected = pd.concat(frames, ignore_index=True) > tm.assert_frame_equal(result.to_pandas(), expected) pyarrow\tests\parquet\test_parquet_writer.py:68: _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ left = array([ 88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251,...5, 174, 202, 39, 74, 234, 
207, 87, 168, 101, 135, 174, 200, 223, 122, 223, 129, 44, 118], dtype=uint8) right = array([172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251,...5, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145], dtype=uint8) err_msg = None def _raise(left, right, err_msg) -> NoReturn: if err_msg is None: if left.shape != right.shape: raise_assert_detail( obj, f"{obj} shapes are different", left.shape, right.shape ) diff = 0 for left_arr, right_arr in zip(left, right): # count up differences if not array_equivalent(left_arr, right_arr, strict_nan=strict_nan): diff += 1 diff = diff * 100.0 / left.size msg = f"{obj} values are different ({np.round(diff, 5)} %)" > raise_assert_detail(obj, msg, left, right, index_values=index_values) E AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different E E DataFrame.iloc[:, 0] (column name="uint8") values are different (8.0 %) E [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] E [left]: [88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 0, 0, 0, 0, ...] 
E [right]: [172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145, ...] C:\tmp\arrow-verify-release\conda-env\lib\site-packages\pandas\_testing\asserters.py:690: AssertionError _______________________ test_parquet_writer_context_obj _______________________ tempdir = WindowsPath('C:/Users/runneradmin/AppData/Local/Temp/pytest-of-runneradmin/pytest-0/test_parquet_writer_context_ob0') @pytest.mark.pandas def test_parquet_writer_context_obj(tempdir): df = _test_dataframe(100) df['unique_id'] = 0 arrow_table = pa.Table.from_pandas(df, preserve_index=False) out = pa.BufferOutputStream() with pq.ParquetWriter(out, arrow_table.schema, version='2.6') as writer: frames = [] for i in range(10): df['unique_id'] = i arrow_table = pa.Table.from_pandas(df, preserve_index=False) writer.write_table(arrow_table) frames.append(df.copy()) buf = out.getvalue() result = _read_table(pa.BufferReader(buf)) expected = pd.concat(frames, ignore_index=True) > tm.assert_frame_equal(result.to_pandas(), expected) pyarrow\tests\parquet\test_parquet_writer.py:125: _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ left = array([ 88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251,...5, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 223, 129, 44, 118], dtype=uint8) right = array([172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251,...5, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145], dtype=uint8) err_msg = None def 
_raise(left, right, err_msg) -> NoReturn: if err_msg is None: if left.shape != right.shape: raise_assert_detail( obj, f"{obj} shapes are different", left.shape, right.shape ) diff = 0 for left_arr, right_arr in zip(left, right): # count up differences if not array_equivalent(left_arr, right_arr, strict_nan=strict_nan): diff += 1 diff = diff * 100.0 / left.size msg = f"{obj} values are different ({np.round(diff, 5)} %)" > raise_assert_detail(obj, msg, left, right, index_values=index_values) E AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different E E DataFrame.iloc[:, 0] (column name="uint8") values are different (8.0 %) E [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] E [left]: [88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 85, 144, 50, 30, ...] 
E [right]: [172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145, ...] C:\tmp\arrow-verify-release\conda-env\lib\site-packages\pandas\_testing\asserters.py:690: AssertionError _______________ test_parquet_writer_context_obj_with_exception ________________ tempdir = WindowsPath('C:/Users/runneradmin/AppData/Local/Temp/pytest-of-runneradmin/pytest-0/test_parquet_writer_context_ob1') @pytest.mark.pandas def test_parquet_writer_context_obj_with_exception(tempdir): df = _test_dataframe(100) df['unique_id'] = 0 arrow_table = pa.Table.from_pandas(df, preserve_index=False) out = pa.BufferOutputStream() error_text = 'Artificial Error' try: with pq.ParquetWriter(out, arrow_table.schema, version='2.6') as writer: frames = [] for i in range(10): df['unique_id'] = i arrow_table = pa.Table.from_pandas(df, preserve_index=False) writer.write_table(arrow_table) frames.append(df.copy()) if i == 5: raise ValueError(error_text) except Exception as e: assert str(e) == error_text buf = out.getvalue() result = _read_table(pa.BufferReader(buf)) expected = pd.concat(frames, ignore_index=True) > tm.assert_frame_equal(result.to_pandas(), expected) pyarrow\tests\parquet\test_parquet_writer.py:157: _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ left = array([ 88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251,..., 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 223, 129, 44, 118], dtype=uint8) right = array([172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 
154, 251,..., 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145], dtype=uint8) err_msg = None def _raise(left, right, err_msg) -> NoReturn: if err_msg is None: if left.shape != right.shape: raise_assert_detail( obj, f"{obj} shapes are different", left.shape, right.shape ) diff = 0 for left_arr, right_arr in zip(left, right): # count up differences if not array_equivalent(left_arr, right_arr, strict_nan=strict_nan): diff += 1 diff = diff * 100.0 / left.size msg = f"{obj} values are different ({np.round(diff, 5)} %)" > raise_assert_detail(obj, msg, left, right, index_values=index_values) E AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different E E DataFrame.iloc[:, 0] (column name="uint8") values are different (8.0 %) E [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] E [left]: [88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 192, 202, 212, 222, ...] 
E [right]: [172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145, ...] C:\tmp\arrow-verify-release\conda-env\lib\site-packages\pandas\_testing\asserters.py:690: AssertionError __________________ test_parquet_writer_write_wrappers[None] ___________________ tempdir = WindowsPath('C:/Users/runneradmin/AppData/Local/Temp/pytest-of-runneradmin/pytest-0/test_parquet_writer_write_wrap0') filesystem = None @pytest.mark.pandas @pytest.mark.parametrize("filesystem", [ None, fs.LocalFileSystem(), ]) def test_parquet_writer_write_wrappers(tempdir, filesystem): df = _test_dataframe(100) table = pa.Table.from_pandas(df, preserve_index=False) batch = pa.RecordBatch.from_pandas(df, preserve_index=False) path_table = str(tempdir / 'data_table.parquet') path_batch = str(tempdir / 'data_batch.parquet') with pq.ParquetWriter( path_table, table.schema, filesystem=filesystem, version='2.6' ) as writer: writer.write_table(table) result = _read_table(path_table).to_pandas() > tm.assert_frame_equal(result, df) pyarrow\tests\parquet\test_parquet_writer.py:178: _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ left = array([ 88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251,...30, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 223, 129, 44, 118], dtype=uint8) right = array([172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251,...30, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145], dtype=uint8) err_msg = 
None def _raise(left, right, err_msg) -> NoReturn: if err_msg is None: if left.shape != right.shape: raise_assert_detail( obj, f"{obj} shapes are different", left.shape, right.shape ) diff = 0 for left_arr, right_arr in zip(left, right): # count up differences if not array_equivalent(left_arr, right_arr, strict_nan=strict_nan): diff += 1 diff = diff * 100.0 / left.size msg = f"{obj} values are different ({np.round(diff, 5)} %)" > raise_assert_detail(obj, msg, left, right, index_values=index_values) E AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different E E DataFrame.iloc[:, 0] (column name="uint8") values are different (8.0 %) E [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99] E [left]: [88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 223, 129, 44, 118] E [right]: [172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 
107, 145] C:\tmp\arrow-verify-release\conda-env\lib\site-packages\pandas\_testing\asserters.py:690: AssertionError _______________ test_parquet_writer_write_wrappers[filesystem1] _______________ tempdir = WindowsPath('C:/Users/runneradmin/AppData/Local/Temp/pytest-of-runneradmin/pytest-0/test_parquet_writer_write_wrap1') filesystem = <pyarrow._fs.LocalFileSystem object at 0x00000204EB1BBCB0> @pytest.mark.pandas @pytest.mark.parametrize("filesystem", [ None, fs.LocalFileSystem(), ]) def test_parquet_writer_write_wrappers(tempdir, filesystem): df = _test_dataframe(100) table = pa.Table.from_pandas(df, preserve_index=False) batch = pa.RecordBatch.from_pandas(df, preserve_index=False) path_table = str(tempdir / 'data_table.parquet') path_batch = str(tempdir / 'data_batch.parquet') with pq.ParquetWriter( path_table, table.schema, filesystem=filesystem, version='2.6' ) as writer: writer.write_table(table) result = _read_table(path_table).to_pandas() > tm.assert_frame_equal(result, df) pyarrow\tests\parquet\test_parquet_writer.py:178: _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ left = array([ 88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251,...30, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 85, 144, 50, 30], dtype=uint8) right = array([172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251,...30, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145], dtype=uint8) err_msg = None def _raise(left, right, err_msg) -> NoReturn: if err_msg is None: if left.shape != right.shape: raise_assert_detail( obj, f"{obj} shapes are different", left.shape, right.shape ) diff = 0 for left_arr, right_arr in zip(left, right): # count up differences if not array_equivalent(left_arr, right_arr, strict_nan=strict_nan): diff += 1 diff = diff * 100.0 / left.size msg = f"{obj} values are different 
({np.round(diff, 5)} %)" > raise_assert_detail(obj, msg, left, right, index_values=index_values) E AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different E E DataFrame.iloc[:, 0] (column name="uint8") values are different (8.0 %) E [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99] E [left]: [88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 85, 144, 50, 30] E [right]: [172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145] C:\tmp\arrow-verify-release\conda-env\lib\site-packages\pandas\_testing\asserters.py:690: AssertionError _________________ test_parquet_writer_filesystem_local[None] __________________ tempdir = WindowsPath('C:/Users/runneradmin/AppData/Local/Temp/pytest-of-runneradmin/pytest-0/test_parquet_writer_filesystem0') filesystem = None @pytest.mark.pandas @pytest.mark.parametrize("filesystem", [ None, 
fs.LocalFileSystem(), ]) def test_parquet_writer_filesystem_local(tempdir, filesystem): df = _test_dataframe(100) table = pa.Table.from_pandas(df, preserve_index=False) path = str(tempdir / 'data.parquet') with pq.ParquetWriter( path, table.schema, filesystem=filesystem, version='2.6' ) as writer: writer.write_table(table) result = _read_table(path).to_pandas() > tm.assert_frame_equal(result, df) pyarrow\tests\parquet\test_parquet_writer.py:264: _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ left = array([ 88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251,...30, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 223, 129, 44, 118], dtype=uint8) right = array([172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251,...30, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145], dtype=uint8) err_msg = None def _raise(left, right, err_msg) -> NoReturn: if err_msg is None: if left.shape != right.shape: raise_assert_detail( obj, f"{obj} shapes are different", left.shape, right.shape ) diff = 0 for left_arr, right_arr in zip(left, right): # count up differences if not array_equivalent(left_arr, right_arr, strict_nan=strict_nan): diff += 1 diff = diff * 100.0 / left.size msg = f"{obj} values are different ({np.round(diff, 5)} %)" > raise_assert_detail(obj, msg, left, right, index_values=index_values) E AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different E E DataFrame.iloc[:, 0] (column name="uint8") values are different (8.0 %) E [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 
88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99] E [left]: [88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 223, 129, 44, 118] E [right]: [172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145] C:\tmp\arrow-verify-release\conda-env\lib\site-packages\pandas\_testing\asserters.py:690: AssertionError ______________ test_parquet_writer_filesystem_local[filesystem1] ______________ tempdir = WindowsPath('C:/Users/runneradmin/AppData/Local/Temp/pytest-of-runneradmin/pytest-0/test_parquet_writer_filesystem1') filesystem = <pyarrow._fs.LocalFileSystem object at 0x00000204EB1BBD30> @pytest.mark.pandas @pytest.mark.parametrize("filesystem", [ None, fs.LocalFileSystem(), ]) def test_parquet_writer_filesystem_local(tempdir, filesystem): df = _test_dataframe(100) table = pa.Table.from_pandas(df, preserve_index=False) path = str(tempdir / 'data.parquet') with pq.ParquetWriter( path, table.schema, filesystem=filesystem, version='2.6' ) as writer: writer.write_table(table) result = _read_table(path).to_pandas() > tm.assert_frame_equal(result, df) pyarrow\tests\parquet\test_parquet_writer.py:264: _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ left = array([ 88, 
94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251,...30, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 0, 0, 0, 0], dtype=uint8) right = array([172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251,...30, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145], dtype=uint8) err_msg = None def _raise(left, right, err_msg) -> NoReturn: if err_msg is None: if left.shape != right.shape: raise_assert_detail( obj, f"{obj} shapes are different", left.shape, right.shape ) diff = 0 for left_arr, right_arr in zip(left, right): # count up differences if not array_equivalent(left_arr, right_arr, strict_nan=strict_nan): diff += 1 diff = diff * 100.0 / left.size msg = f"{obj} values are different ({np.round(diff, 5)} %)" > raise_assert_detail(obj, msg, left, right, index_values=index_values) E AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different E E DataFrame.iloc[:, 0] (column name="uint8") values are different (8.0 %) E [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99] E [left]: [88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 0, 0, 0, 0] E [right]: [172, 10, 127, 140, 47, 170, 
196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145] C:\tmp\arrow-verify-release\conda-env\lib\site-packages\pandas\_testing\asserters.py:690: AssertionError _________________________ test_write_dataset_parquet __________________________ tempdir = WindowsPath('C:/Users/runneradmin/AppData/Local/Temp/pytest-of-runneradmin/pytest-0/test_write_dataset_parquet0') @pytest.mark.numpy @pytest.mark.parquet def test_write_dataset_parquet(tempdir): table = pa.table([ pa.array(range(20), type="uint32"), pa.array(np.arange("2012-01-01", 20, dtype="datetime64[D]").astype( "datetime64[ns]")), pa.array(np.repeat(['a', 'b'], 10)) ], names=["f1", "f2", "part"]) # using default "parquet" format string base_dir = tempdir / 'parquet_dataset' ds.write_dataset(table, base_dir, format="parquet") # check that all files are present file_paths = list(base_dir.rglob("*")) expected_paths = [base_dir / "part-0.parquet"] assert set(file_paths) == set(expected_paths) # check Table roundtrip with default version result = ds.dataset(base_dir, format="parquet").to_table() assert result.equals(table) # using custom options for version in ["1.0", "2.4", "2.6"]: format = ds.ParquetFileFormat() opts = format.make_write_options(version=version) assert "<pyarrow.dataset.ParquetFileWriteOptions" in repr(opts) base_dir = tempdir / f'parquet_dataset_version{version}' ds.write_dataset(table, base_dir, format=format, file_options=opts) meta = pq.read_metadata(base_dir / "part-0.parquet") expected_version = "1.0" if version == "1.0" else "2.6" assert meta.format_version == expected_version # ensure version is actually honored based on 
supported datatypes result = ds.dataset(base_dir, format="parquet").to_table() schema = table.schema if version == "1.0": # uint32 is written as int64 schema = schema.set(0, schema.field(0).with_type(pa.int64())) if version in ("1.0", "2.4"): schema = schema.set(1, schema.field(1).with_type(pa.timestamp("us"))) expected = table.cast(schema) > assert result.equals(expected) E assert False E + where False = equals(pyarrow.Table\nf1: int64\nf2: timestamp[us]\npart: string\n----\nf1: [[0,1,2,3,4,...,15,16,17,18,19]]\nf2: [[2012-01-01 00:00:00.000000,2012-01-02 00:00:00.000000,2012-01-03 00:00:00.000000,2012-01-04 00:00:00.000000,2012-01-05 00:00:00.000000,...,2012-01-16 00:00:00.000000,2012-01-17 00:00:00.000000,2012-01-18 00:00:00.000000,2012-01-19 00:00:00.000000,2012-01-20 00:00:00.000000]]\npart: [["a","a","a","a","a",...,"b","b","b","b","b"]]) E + where equals = pyarrow.Table\nf1: int64\nf2: timestamp[us]\npart: string\n----\nf1: [[16,17,18,19,4,...,15,141733920800,150323855394,158913789988,167503724582]]\nf2: [[2012-01-01 00:00:00.000000,2012-01-02 00:00:00.000000,2012-01-03 00:00:00.000000,2012-01-04 00:00:00.000000,2012-01-05 00:00:00.000000,...,2012-01-16 00:00:00.000000,2012-01-17 00:00:00.000000,2012-01-18 00:00:00.000000,2012-01-19 00:00:00.000000,2012-01-20 00:00:00.000000]]\npart: [["a","a","a","a","a",...,"b","b","b","b","b"]].equals pyarrow\tests\test_dataset.py:4842: AssertionError ============================== warnings summary =============================== pyarrow/tests/parquet/test_data_types.py: 3 warnings pyarrow/tests/parquet/test_pandas.py: 2 warnings pyarrow/tests/parquet/test_parquet_file.py: 1 warning pyarrow/tests/test_pandas.py: 4 warnings C:\tmp\arrow-verify-release\conda-env\lib\site-packages\pandas\core\dtypes\missing.py:577: DeprecationWarning: The truth value of an empty array is ambiguous. Returning False, but in future this will result in an error. Use `array.size > 0` to check that an array is not empty. 
if not lib.array_equivalent_object(left[~mask], right[~mask]): pyarrow/tests/test_pandas.py::TestConvertMetadata::test_empty_list_metadata pyarrow/tests/test_pandas.py::TestConvertListTypes::test_empty_list_roundtrip C:\tmp\arrow-verify-release\conda-env\lib\site-packages\pandas\core\dtypes\missing.py:576: DeprecationWarning: The truth value of an empty array is ambiguous. Returning False, but in future this will result in an error. Use `array.size > 0` to check that an array is not empty. return lib.array_equivalent_object(left, right) -- Docs: https://docs.pytest.org/en/stable/how-to/capture-warnings.html =========================== short test summary info =========================== FAILED pyarrow/tests/parquet/test_basic.py::test_set_write_batch_size - AssertionError FAILED pyarrow/tests/parquet/test_basic.py::test_set_dictionary_pagesize_limit - AssertionError FAILED pyarrow/tests/parquet/test_basic.py::test_chunked_table_write - AssertionError FAILED pyarrow/tests/parquet/test_data_types.py::test_parquet_2_6_roundtrip[1000] - AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different DataFrame.iloc[:, 0] (column name="uint8") values are different (1.6 %) [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] 
[left]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] [right]: [224, 225, 226, 227, 228, 229, 230, 231, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] FAILED pyarrow/tests/parquet/test_pandas.py::test_spark_flavor_preserves_pandas_metadata - AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different DataFrame.iloc[:, 0] (column name="uint8") values are different (8.0 %) [index]: [0, 10, 20, 30, 40, 50, 60, 70, 80, 90, 100, 110, 120, 130, 140, 150, 160, 170, 180, 190, 200, 210, 220, 230, 240, 250, 260, 270, 280, 290, 300, 310, 320, 330, 340, 350, 360, 370, 380, 390, 400, 410, 420, 430, 440, 450, 460, 470, 480, 490, 500, 510, 520, 530, 540, 550, 560, 570, 580, 590, 600, 610, 620, 630, 640, 650, 660, 670, 680, 690, 700, 710, 720, 730, 740, 750, 760, 770, 780, 790, 800, 810, 820, 830, 840, 850, 860, 870, 880, 890, 900, 910, 920, 930, 940, 950, 960, 970, 980, 990] [left]: [88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 
200, 223, 122, 1, 0, 0, 0] [right]: [172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145] FAILED pyarrow/tests/parquet/test_parquet_file.py::test_read_single_row_group - AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different DataFrame.iloc[:, 0] (column name="uint8") values are different (0.32 %) [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] [left]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] [right]: [192, 193, 194, 195, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] 
FAILED pyarrow/tests/parquet/test_parquet_file.py::test_read_single_row_group_with_column_subset - AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different DataFrame.iloc[:, 0] (column name="uint8") values are different (0.3 %) [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] [left]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] [right]: [192, 193, 194, 195, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] 
FAILED pyarrow/tests/parquet/test_parquet_file.py::test_read_multiple_row_groups - AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different DataFrame.iloc[:, 0] (column name="uint8") values are different (0.32 %) [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] [left]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] [right]: [192, 193, 194, 195, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] 
FAILED pyarrow/tests/parquet/test_parquet_file.py::test_read_multiple_row_groups_with_column_subset - AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different DataFrame.iloc[:, 0] (column name="uint8") values are different (0.32 %) [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] [left]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] [right]: [192, 193, 194, 195, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] 
FAILED pyarrow/tests/parquet/test_parquet_file.py::test_iter_batches_columns_reader[300] - AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different DataFrame.iloc[:, 0] (column name="uint8") values are different (2.66667 %) [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] [left]: [224, 225, 226, 227, 228, 229, 230, 231, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] [right]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] 
FAILED pyarrow/tests/parquet/test_parquet_file.py::test_iter_batches_columns_reader[1000] - AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different DataFrame.iloc[:, 0] (column name="uint8") values are different (1.6 %) [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] [left]: [224, 225, 226, 227, 228, 229, 230, 231, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] [right]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] 
FAILED pyarrow/tests/parquet/test_parquet_file.py::test_iter_batches_columns_reader[1300] - AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different DataFrame.iloc[:, 0] (column name="uint8") values are different (1.84615 %) [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] [left]: [224, 225, 226, 227, 228, 229, 230, 231, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] [right]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] 
FAILED pyarrow/tests/parquet/test_parquet_writer.py::test_parquet_incremental_file_build - AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different DataFrame.iloc[:, 0] (column name="uint8") values are different (8.0 %) [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] [left]: [88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 0, 0, 0, 0, ...] [right]: [172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145, ...] 
FAILED pyarrow/tests/parquet/test_parquet_writer.py::test_parquet_writer_context_obj - AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different DataFrame.iloc[:, 0] (column name="uint8") values are different (8.0 %) [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] [left]: [88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 85, 144, 50, 30, ...] [right]: [172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145, ...] 
FAILED pyarrow/tests/parquet/test_parquet_writer.py::test_parquet_writer_context_obj_with_exception - AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different DataFrame.iloc[:, 0] (column name="uint8") values are different (8.0 %) [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, ...] [left]: [88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 192, 202, 212, 222, ...] [right]: [172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145, ...] 
FAILED pyarrow/tests/parquet/test_parquet_writer.py::test_parquet_writer_write_wrappers[None] - AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different DataFrame.iloc[:, 0] (column name="uint8") values are different (8.0 %) [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99] [left]: [88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 223, 129, 44, 118] [right]: [172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145] FAILED pyarrow/tests/parquet/test_parquet_writer.py::test_parquet_writer_write_wrappers[filesystem1] - AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different DataFrame.iloc[:, 0] (column name="uint8") values are different (8.0 %) [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 
41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99] [left]: [88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 85, 144, 50, 30] [right]: [172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145] FAILED pyarrow/tests/parquet/test_parquet_writer.py::test_parquet_writer_filesystem_local[None] - AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different DataFrame.iloc[:, 0] (column name="uint8") values are different (8.0 %) [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99] [left]: [88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 
108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 223, 129, 44, 118] [right]: [172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145] FAILED pyarrow/tests/parquet/test_parquet_writer.py::test_parquet_writer_filesystem_local[filesystem1] - AssertionError: DataFrame.iloc[:, 0] (column name="uint8") are different DataFrame.iloc[:, 0] (column name="uint8") values are different (8.0 %) [index]: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99] [left]: [88, 94, 107, 145, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 0, 0, 0, 0] [right]: [172, 10, 127, 140, 47, 170, 196, 151, 117, 166, 22, 183, 192, 204, 33, 216, 67, 179, 78, 154, 251, 82, 
162, 219, 195, 118, 125, 139, 103, 125, 229, 216, 9, 164, 116, 108, 211, 222, 161, 159, 21, 81, 89, 165, 242, 214, 102, 98, 36, 183, 5, 112, 87, 58, 43, 76, 70, 60, 75, 228, 216, 189, 132, 14, 88, 154, 178, 246, 140, 205, 204, 69, 58, 57, 41, 98, 193, 66, 72, 122, 230, 125, 174, 202, 39, 74, 234, 207, 87, 168, 101, 135, 174, 200, 223, 122, 88, 94, 107, 145] FAILED pyarrow/tests/test_dataset.py::test_write_dataset_parquet - assert False + where False = equals(pyarrow.Table\nf1: int64\nf2: timestamp[us]\npart: string\n----\nf1: [[0,1,2,3,4,...,15,16,17,18,19]]\nf2: [[2012-01-01 00:00:00.000000,2012-01-02 00:00:00.000000,2012-01-03 00:00:00.000000,2012-01-04 00:00:00.000000,2012-01-05 00:00:00.000000,...,2012-01-16 00:00:00.000000,2012-01-17 00:00:00.000000,2012-01-18 00:00:00.000000,2012-01-19 00:00:00.000000,2012-01-20 00:00:00.000000]]\npart: [["a","a","a","a","a",...,"b","b","b","b","b"]]) + where equals = pyarrow.Table\nf1: int64\nf2: timestamp[us]\npart: string\n----\nf1: [[16,17,18,19,4,...,15,141733920800,150323855394,158913789988,167503724582]]\nf2: [[2012-01-01 00:00:00.000000,2012-01-02 00:00:00.000000,2012-01-03 00:00:00.000000,2012-01-04 00:00:00.000000,2012-01-05 00:00:00.000000,...,2012-01-16 00:00:00.000000,2012-01-17 00:00:00.000000,2012-01-18 00:00:00.000000,2012-01-19 00:00:00.000000,2012-01-20 00:00:00.000000]]\npart: [["a","a","a","a","a",...,"b","b","b","b","b"]].equals = 20 failed, 7489 passed, 478 skipped, 16 xfailed, 2 xpassed, 12 warnings in 161.27s (0:02:41) = ``` </details> ### Component(s) Release, Python -- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. To unsubscribe, e-mail: issues-unsubscribe@arrow.apache.org For queries about this service, please contact Infrastructure at: users@infra.apache.org