pitrou commented on pull request #8770: URL: https://github.com/apache/arrow/pull/8770#issuecomment-733919445
Parquet benchmarks: ``` 199 BM_PlainDecodingSpacedFloat/32768/100 5.506 GiB/sec 18.466 GiB/sec 235.349 {'run_name': 'BM_PlainDecodingSpacedFloat/32768/100', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 31377, 'null_percent': 1.0} 177 BM_PlainEncodingSpacedBoolean/32768/10000 11.377 GiB/sec 33.462 GiB/sec 194.106 {'run_name': 'BM_PlainEncodingSpacedBoolean/32768/10000', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 259382, 'null_percent': 100.0} 179 BM_PlainDecodingSpacedBoolean/32768/100 1.358 GiB/sec 3.572 GiB/sec 163.120 {'run_name': 'BM_PlainDecodingSpacedBoolean/32768/100', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 31133, 'null_percent': 1.0} 282 BM_PlainEncodingSpacedFloat/32768/100 6.276 GiB/sec 15.605 GiB/sec 148.621 {'run_name': 'BM_PlainEncodingSpacedFloat/32768/100', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 35719, 'null_percent': 1.0} 152 BM_ArrowBinaryDict/EncodeLowLevel/262144 82.896 MiB/sec 203.718 MiB/sec 145.751 {'run_name': 'BM_ArrowBinaryDict/EncodeLowLevel/262144', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 38} 298 BM_PlainEncodingSpacedDouble/32768/10000 115.446 GiB/sec 262.819 GiB/sec 127.654 {'run_name': 'BM_PlainEncodingSpacedDouble/32768/10000', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 330346, 'null_percent': 100.0} 247 BM_PlainDecodingSpacedDouble/32768/100 9.953 GiB/sec 22.653 GiB/sec 127.594 {'run_name': 'BM_PlainDecodingSpacedDouble/32768/100', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 28669, 'null_percent': 1.0} 207 BM_PlainEncodingSpacedFloat/32768/10000 57.732 GiB/sec 130.097 GiB/sec 125.348 {'run_name': 'BM_PlainEncodingSpacedFloat/32768/10000', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 330727, 'null_percent': 100.0} 203 BM_PlainDecodingSpacedFloat/32768/1 21.382 GiB/sec 36.628 GiB/sec 71.298 {'run_name': 'BM_PlainDecodingSpacedFloat/32768/1', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 122797, 'null_percent': 0.01} 231 BM_PlainEncodingSpacedDouble/32768/100 10.467 GiB/sec 17.029 GiB/sec 62.697 {'run_name': 'BM_PlainEncodingSpacedDouble/32768/100', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 30042, 'null_percent': 1.0} 256 BM_PlainEncodingSpacedFloat/32768/5000 1008.863 MiB/sec 1.592 GiB/sec 61.538 {'run_name': 'BM_PlainEncodingSpacedFloat/32768/5000', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 5619, 'null_percent': 50.0} 273 BM_PlainEncodingSpacedDouble/32768/5000 2.022 GiB/sec 3.201 GiB/sec 58.281 {'run_name': 'BM_PlainEncodingSpacedDouble/32768/5000', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 5712, 'null_percent': 50.0} 162 BM_PlainDecodingSpacedFloat/32768/5000 981.563 MiB/sec 1.516 GiB/sec 58.168 {'run_name': 'BM_PlainDecodingSpacedFloat/32768/5000', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 5473, 'null_percent': 50.0} 173 BM_PlainDecodingSpacedDouble/32768/5000 1.891 GiB/sec 2.991 GiB/sec 58.157 {'run_name': 'BM_PlainDecodingSpacedDouble/32768/5000', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 5401, 'null_percent': 50.0} 238 BM_PlainDecodingSpacedBoolean/32768/5000 250.841 MiB/sec 384.756 MiB/sec 53.386 {'run_name': 'BM_PlainDecodingSpacedBoolean/32768/5000', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 5585, 'null_percent': 50.0} 264 BM_PlainEncodingSpacedBoolean/32768/5000 234.661 MiB/sec 353.009 MiB/sec 50.433 {'run_name': 'BM_PlainEncodingSpacedBoolean/32768/5000', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 5211, 'null_percent': 50.0} 286 BM_PlainDecodingSpacedFloat/32768/1000 2.531 GiB/sec 3.739 GiB/sec 47.699 {'run_name': 'BM_PlainDecodingSpacedFloat/32768/1000', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 14280, 'null_percent': 10.0} 229 BM_PlainEncodingSpacedFloat/32768/1000 2.680 GiB/sec 3.783 GiB/sec 41.159 {'run_name': 'BM_PlainEncodingSpacedFloat/32768/1000', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 15210, 'null_percent': 10.0} 251 BM_PlainDecodingSpacedDouble/32768/1 25.016 GiB/sec 34.929 GiB/sec 39.627 {'run_name': 'BM_PlainDecodingSpacedDouble/32768/1', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 71628, 'null_percent': 0.01} 201 BM_PlainDecodingSpacedDouble/32768/1000 4.987 GiB/sec 6.893 GiB/sec 38.224 {'run_name': 'BM_PlainDecodingSpacedDouble/32768/1000', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 14031, 'null_percent': 10.0} 244 BM_PlainEncodingSpacedBoolean/32768/100 664.198 MiB/sec 913.312 MiB/sec 37.506 {'run_name': 'BM_PlainEncodingSpacedBoolean/32768/100', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 14952, 'null_percent': 1.0} 239 BM_PlainEncodingSpacedDouble/32768/1000 5.174 GiB/sec 7.071 GiB/sec 36.652 {'run_name': 'BM_PlainEncodingSpacedDouble/32768/1000', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 14708, 'null_percent': 10.0} 230 BM_PlainDecodingSpacedBoolean/32768/1000 678.559 MiB/sec 857.465 MiB/sec 26.366 {'run_name': 'BM_PlainDecodingSpacedBoolean/32768/1000', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 15333, 'null_percent': 10.0} 102 BM_WriteInt64Column<Repetition::OPTIONAL, Compression::LZ4>/1048576 332.343 MiB/sec 409.541 MiB/sec 23.228 {'run_name': 'BM_WriteInt64Column<Repetition::OPTIONAL, Compression::LZ4>/1048576', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 109} 185 BM_PlainEncodingSpacedFloat/32768/1 17.571 GiB/sec 21.578 GiB/sec 22.805 {'run_name': 'BM_PlainEncodingSpacedFloat/32768/1', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 100736, 'null_percent': 0.01} 176 BM_PlainEncodingSpacedBoolean/32768/1000 450.133 MiB/sec 545.271 MiB/sec 21.136 {'run_name': 'BM_PlainEncodingSpacedBoolean/32768/1000', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 9948, 'null_percent': 10.0} 187 BM_PlainDecodingSpacedBoolean/32768/1 4.496 GiB/sec 5.314 GiB/sec 18.200 {'run_name': 'BM_PlainDecodingSpacedBoolean/32768/1', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 103077, 'null_percent': 0.01} 25 BM_WriteColumn<false,Int64Type> 1.057 GiB/sec 1.220 GiB/sec 15.454 {'run_name': 'BM_WriteColumn<false,Int64Type>', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 10} 39 BM_ReadColumn<true,BooleanType>/5/10 250.138 MiB/sec 283.639 MiB/sec 13.393 {'run_name': 'BM_ReadColumn<true,BooleanType>/5/10', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 18} 75 BM_WriteInt64Column<Repetition::REQUIRED, Compression::LZ4>/1048576 1.084 GiB/sec 1.216 GiB/sec 12.132 {'run_name': 'BM_WriteInt64Column<Repetition::REQUIRED, Compression::LZ4>/1048576', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 443} 115 BM_RleEncoding/32768/1 724.153 MiB/sec 810.490 MiB/sec 11.923 {'run_name': 'BM_RleEncoding/32768/1', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 8141} 92 BM_RleEncoding/1024/1 706.002 MiB/sec 788.645 MiB/sec 11.706 {'run_name': 'BM_RleEncoding/1024/1', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 232581} 106 BM_WriteInt64Column<Repetition::REPEATED>/1048576 218.593 MiB/sec 243.729 MiB/sec 11.499 {'run_name': 'BM_WriteInt64Column<Repetition::REPEATED>/1048576', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 77} 109 BM_RleEncoding/65536/1 729.356 MiB/sec 811.227 MiB/sec 11.225 {'run_name': 'BM_RleEncoding/65536/1', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 4076} 89 BM_RleEncoding/4096/1 725.079 MiB/sec 804.486 MiB/sec 10.952 {'run_name': 'BM_RleEncoding/4096/1', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 64655} 7 BM_ReadColumn<false,Int32Type>/-1/10 1.811 GiB/sec 2.008 GiB/sec 10.851 {'run_name': 'BM_ReadColumn<false,Int32Type>/-1/10', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 32} 58 BM_ReadColumn<false,Int32Type>/-1/1 5.426 GiB/sec 5.999 GiB/sec 10.568 {'run_name': 'BM_ReadColumn<false,Int32Type>/-1/1', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 89} 87 BM_ReadInt64Column<Repetition::REQUIRED, Compression::ZSTD>/65536/1024 12.156 GiB/sec 11.951 GiB/sec -1.682 {'run_name': 'BM_ReadInt64Column<Repetition::REQUIRED, Compression::ZSTD>/65536/1024', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 69528} [...] 204 BM_PlainEncodingBoolean/65536 802.645 MiB/sec 707.974 MiB/sec -11.795 {'run_name': 'BM_PlainEncodingBoolean/65536', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 8937} 132 BM_RleEncoding/65536/8 482.792 MiB/sec 424.143 MiB/sec -12.148 {'run_name': 'BM_RleEncoding/65536/8', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 2684} 15 BM_WriteColumn<true,DoubleType> 622.954 MiB/sec 498.484 MiB/sec -19.981 {'run_name': 'BM_WriteColumn<true,DoubleType>', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 6} 16 BM_WriteColumn<true,Int64Type> 668.120 MiB/sec 526.837 MiB/sec -21.146 {'run_name': 'BM_WriteColumn<true,Int64Type>', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 6} 34 BM_WriteColumn<true,Int32Type> 362.327 MiB/sec 256.361 MiB/sec -29.246 {'run_name': 'BM_WriteColumn<true,Int32Type>', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 6} 27 BM_WriteColumn<true,BooleanType> 101.732 MiB/sec 69.602 MiB/sec -31.583 {'run_name': 'BM_WriteColumn<true,BooleanType>', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 7} 60 BM_ReadColumn<true,BooleanType>/-1/1 480.372 MiB/sec 219.376 MiB/sec -54.332 {'run_name': 'BM_ReadColumn<true,BooleanType>/-1/1', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 32} 289 BM_ArrowBinaryDict/EncodeLowLevel/1048576 316.208 MiB/sec 131.127 MiB/sec -58.531 {'run_name': 'BM_ArrowBinaryDict/EncodeLowLevel/1048576', 'run_type': 'iteration', 'repetitions': 0, 'repetition_index': 0, 'threads': 1, 'iterations': 37} ``` ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: us...@infra.apache.org