This is an automated email from the ASF dual-hosted git repository.
kszucs pushed a change to branch release-4.0.0
in repository https://gitbox.apache.org/repos/asf/arrow.git.
from 5489bbf ARROW-10255: [JS] Reorganize exports for ESM tree-shaking
add 7679260 ARROW-12200: [R] Export and document list_compute_functions
add 9ea2890 ARROW-10421: [R] Use gc_memory_pool in more places
add ac38410 ARROW-12238: [JS] Remove trailing spaces and consistently add
space after //
add c2f665b ARROW-12279: [Rust][DataFusion] Add test for null handling in
hash join (ARROW-12266)
add 2fd4f80 ARROW-11982: [Rust] Donate Ballista Distributed Compute
Platform
add 5b5c058 ARROW-12300: [C++] Remove linking of cuda runtime library
add df12dee ARROW-12209: [JS] Copy all src files into the TypeScript
package
add 493b205 MINOR: [JS] correct comment in build file (#9955)
add 113a515 ARROW-12239: [JS] Switch to yarn
add dc182fd ARROW-12305: [JS] Update generate.py to python3 and new
versions of pyarrow
add 60d1678 MINOR: [JS] remove superfluous space (#9953)
add 24da9fa MINOR: [JS] Correct build commands (#9960)
add 6bace6e ARROW-12170: [Rust][DataFusion] Introduce repartition
optimization
add 6ddaaa8 ARROW-12254: [Rust][DataFusion] Stop polling limit input once
limit is reached
add 53b462b ARROW-12278: [Rust][DataFusion] Use Timestamp(Nanosecond,
None) for SQL TIMESTAMP Type
add 75c8cd6 ARROW-11328: [R] Collecting zero columns from a dataset
returns entire dataset
add c0ce2b1 ARROW-12098: [R] Catch cpp build failures on linux
add 3dc01c5 ARROW-11795: [MATLAB] Migrate MATLAB Interface for Apache
Arrow design doc to Markdown
add 868b543 ARROW-12208: [C++] Add the ability to run async tasks without
using the CPU thread pool
add a077d67 ARROW-11589: [R] Add methods for modifying Schemas
add aa27b4c ARROW-11766: [R] Better handling for missing compression
codecs on Linux
add f3d2d2d ARROW-12263: [Dev][Packaging] Move Crossbow to Archery
add 4822483 ARROW-12197: [R] dplyr bindings for cast, dictionary_encode
add c5bc1a2 ARROW-12320: [CI] REPO arg missing from conda-cpp-valgrind
add e20a8b2 ARROW-12327: [Dev] Use pull request's head remote when
submitting crossbow jobs via the comment bot
add 604379e ARROW-12328: [Rust] [Ballista] Fix formatting
add 19891d0 ARROW-12329: [Rust] [Ballista] Add Ballista README
add 552969f ARROW-12267: [Rust] Implement support for timestamps in JSON
writer
add 13c334e ARROW-12251: [Rust] Add Ballista to CI
add c2dc1d9 ARROW-12281: [JS] Remove shx, trash, and rimraf and update
lerna for yarn
add 4d7150a ARROW-12274: [JS] Document how to run tests without building
bundles
add fdb055f MINOR: Fix link to definition of minor (#9989)
add f1f4f2b Tag Ballista PRs (#9986)
add 5b08205 ARROW-12313: [Rust] [Ballista] Update benchmark docs for
Ballista
add 077fe64 ARROW-12299: [Python] Recognize new filesystems in
pq.write_to_dataset
add af4c8fc ARROW-12140: [C++][CI] Fix Valgrind failures in Grouper tests
add 6e61023 ARROW-11984: [C++][Gandiva] Implement SHA1 and SHA256
functions
add 632b2c1 ARROW-12069: [C++][Gandiva] Implement IN expressions for
Decimal type
add b43a689 ARROW-12146: [C++][Gandiva] Implement
CONVERT_FROM(expression, replacement char) function
add 91a658a ARROW-12323: [C++][Gandiva] Implement castTIME(timestamp)
function
add 66e1d2b ARROW-11972: [C++][R][Python][Dataset] Extract IPC/Parquet
fragment scan options
add 745cdb6 ARROW-12314: [Python] Accept columns as set in parquet
read_pandas
add 4c6e1b9 ARROW-11761: [C++] Increase public API testing
add 4801e43 ARROW-6248: [Python][C++] Raise better exception on HDFS file
open error
add b385fcd ARROW-12333: [JS] Remove jest-environment-node-debug and do
not emit from typescript by default
add f0bdcdb ARROW-12303: [JS] Use iterator instead of yield
add bc5a63b ARROW-12236: [R][CI] Add check that all docs pages are listed
in _pkgdown.yml
add c51c19e ARROW-12342: [Packaging] Fix tabulation in crossbow templates
for submitting nightly builds
add 62f8c20 ARROW-12326: [C++] Avoid needless c-ares detection
add 2c77f3b ARROW-12352: [CI][R][Windows] Remove needless workaround for
MSYS2
add 7224920 ARROW-11752: [R] Replace usage of testthat::expect_is()
add 1ed6819 ARROW-12277: [Rust][DataFusion] Implement Sum/Count/Min/Max
aggregates for Timestamp(_,_)
add a102ba2 ARROW-12288: [C++] Create Scanner interface
add 57d430e ARROW-12332: [Rust] [Ballista] Add simple api server in
scheduler
add a49d6e2 ARROW-12248: [C++] Avoid looking up ARROW_DEFAULT_MEMORY_POOL
environment variable too late
add d7558bf ARROW-11839: [C++] Use xsimd for generation of accelerated
bit-unpacking
add 00a4436 ARROW-12357: [Archery] Bump Jinja2 version requirement
add a5f3b35 ARROW-11070: [C++][Compute] Implement power kernel
add 5db4092 ARROW-12316: [C++] Prefer mimalloc on Apple
add ab3a08c ARROW-12304: [R] Update news and polish docs for 4.0
add 7cec72d ARROW-12309: [JS] Make es2015 bundles the default
add c0445d6 ARROW-12269: [JS] Move to eslint
add 9fc589f ARROW-12354: [Packaging][RPM] Use
apache.jfrog.io/artifactory/ instead of apache.bintray.com/
add 798a9b4 ARROW-12351: [CI][Ruby] Use ruby/setup-ruby instead of
actions/setup-ruby
add 2863fdd ARROW-11924: [C++] Add streaming version of
FileSystem::GetFileInfo
add fe83dca ARROW-12361: [Rust] [DataFusion] Allow users to override
physical optimization rules
add c3f55a4 ARROW-12294: [Rust] Fix boolean kleene kernels with no
remainder
add 635ae77 ARROW-12374: [CI][C++][cron] Use Ubuntu 20.04 instead of 16.04
add fb892c63 ARROW-12330: [Developer] Restore values at counters column of
Archery benchmark
add 9c85e54 ARROW-12287: [C++] Create enumerating generator
add 31c8c75 ARROW-12262: [Doc] Enable S3 and Flight in docs build
add 6f2e05d ARROW-11677: [C++][Docs] Add basic C++ datasets documentation
add e99e70d ARROW-12220: [C++][CI] Thread sanitizer failure
add cb7a624 ARROW-12379: [C++] Fix ThreadSanitizer failure in
SerialExecutor
add 8f35024 ARROW-12385: [R] [CI] fix cran picking in CI
add a5356c3 ARROW-12353: [Packaging][deb] Rename -archive-keyring to
-apt-source
add a865dc9 ARROW-12375: [Release] Remove rebase post-release scripts
add ccdbbe3 ARROW-12384: [JS] Use let/const and clean up eslint rules
add 568046a ARROW-11475: [C++] Revert "Upgrade mimalloc"
add 05ec438 ARROW-12161: [C++][Dataset] Revert async CSV reader in
datasets
add b5045ed ARROW-12382: [C++] Bundle xsimd if runtime SIMD level is set
add 894fab0 ARROW-11468: [R] Allow user to pass schema to
read_json_arrow()
add df20489 ARROW-12370: [R] Bindings for power kernel
add c7485b7 ARROW-11477: [R][Doc] Reorganize and improve README and
vignette content
add 5794290 ARROW-12273: [JS] [Rust] Remove coveralls
add 02cdeab ARROW-12376: [Dev] Log traceback for unexpected exceptions in
archery trigger-bot
add d575858 ARROW-11797: [C++][Dataset] Provide batch stream Scanner
methods
add 818c57c ARROW-12381: [Packaging][Python] macOS wheels are built with
wrong package kind
add 1c0641d ARROW-12017: [R] [Documentation] Make proper developing arrow
docs
add 1e6819c ARROW-12057: [Python] Remove direct usage of pandas' Block
subclasses (partly)
add 15137e2 ARROW-7215: [C++][Gandiva] Implement
castVARCHAR(numeric_type) functions
add 9178c13 ARROW-12337: [Rust] add DoubleEndedIterator and
ExactSizeIterator traits
add 61935aa ARROW-12250: [Rust] [Parquet] Fix failing arrow_writer test
add 645c3f9 ARROW-11472: [Python][CI] Remove temporary pin of numpy in
kartothek integration build
add 1251f53 ARROW-12317: [Rust] JSON writer support for time, duration
and date
add 95b8f99 ARROW-12397: [Rust] [DataFusion] Simplify readme example
add 26a5a04 ARROW-12390: [Rust] Inline from_trusted_len_iter,
try_from_trusted_len_iter, extend_from_slice
add c394a20 ARROW-12246: [CI] Sync conda recipes with upstream feedstock
add d4ca31f ARROW-12396: [Python][Docs] Clarify serialization/filesystem
docstrings about deprecated status
add 926452b ARROW-12188: [Docs] Switch to pydata-sphinx-theme for the
main sphinx docs
add 150224c ARROW-12151: [Docs] Add Jira component + summary conventions
to the docs
add 2da0a37 ARROW-9731: [C++][Python][R][Dataset] Implement Scanner::Head
add 22bebf8 ARROW-11568: [C++][Compute] Rewrite mode kernel
add d11aaf4 ARROW-12383: [JS] Upgrade dependencies
add fac30e7 ARROW-12408: [R] Delete Scan()
add cd4df5e ARROW-8900: [C++][Python] Expose Proxy Options as parameters
for S3FileSystem
add 1cabc80 ARROW-12401: [R] Fix guard around dataset___Scanner__TakeRows
add 28ed8f7 ARROW-12406: [R] Fix checkbashism violation in configure
add 04e5256 ARROW-12409: [R] Remove LazyData from DESCRIPTION
add 04b6de6 ARROW-12405: [Packaging] Fix apt artifact patterns and
artifact uploading from travis
add 45847e1 ARROW-12389: [R] [Docs] Add note about autocasting
add 49455ec ARROW-12367: [C++] Stop producing when PushGenerator was
destroyed
add ec6436e ARROW-12402: [Rust] [DataFusion] Implement SQL metrics example
add 958c19a ARROW-12335: [Rust] [Ballista] Use latest DataFusion
add 6888c41 ARROW-6103: [Release][Java] Remove mvn release plugin
add d7f90ca ARROW-12400: [Rust] Re-enable tests in arrow::array::transform
No new revisions were added by this update.
Summary of changes:
.env | 2 +-
.github/workflows/archery.yml | 5 +-
.github/workflows/cpp.yml | 2 +-
.github/workflows/cpp_cron.yml | 10 +-
.github/workflows/dev.yml | 2 +-
.github/workflows/dev_pr/labeler.yml | 3 +
.github/workflows/dev_pr/title_check.md | 2 +-
.github/workflows/js.yml | 2 +-
.github/workflows/r.yml | 2 +
.github/workflows/ruby.yml | 2 +-
.github/workflows/rust.yml | 18 +-
ci/conda_env_sphinx.yml | 2 +-
ci/docker/conda-integration.dockerfile | 1 +
ci/docker/conda-python-kartothek.dockerfile | 4 +-
ci/docker/linux-apt-docs.dockerfile | 19 +-
ci/docker/ubuntu-20.10-cpp.dockerfile | 137 +
ci/etc/rprofile | 90 +-
ci/scripts/cpp_build.sh | 4 +-
ci/scripts/docs_build.sh | 6 +-
ci/scripts/integration_kartothek.sh | 3 +-
ci/scripts/js_build.sh | 9 +-
ci/scripts/js_test.sh | 4 +-
ci/scripts/python_wheel_macos_build.sh | 2 +-
ci/scripts/python_wheel_manylinux_build.sh | 2 +-
ci/scripts/python_wheel_windows_build.bat | 2 +-
ci/scripts/r_pkgdown_check.sh | 41 +
ci/scripts/r_test.sh | 19 +-
ci/scripts/r_windows_build.sh | 5 -
cpp/apidoc/Doxyfile | 1 +
cpp/cmake_modules/Find-c-aresAlt.cmake | 71 +
cpp/cmake_modules/FindOpenSSLAlt.cmake | 54 +
cpp/cmake_modules/FindgRPCAlt.cmake | 247 +-
cpp/cmake_modules/SetupCxxFlags.cmake | 1 +
cpp/cmake_modules/ThirdpartyToolchain.cmake | 85 +-
cpp/examples/arrow/CMakeLists.txt | 5 +
.../arrow/dataset_documentation_example.cc | 355 +
cpp/src/arrow/CMakeLists.txt | 3 +
cpp/src/arrow/compute/api_scalar.cc | 1 +
cpp/src/arrow/compute/api_scalar.h | 14 +
.../arrow/compute/kernels/aggregate_benchmark.cc | 40 +-
cpp/src/arrow/compute/kernels/aggregate_mode.cc | 560 +-
.../arrow/compute/kernels/aggregate_quantile.cc | 67 +-
cpp/src/arrow/compute/kernels/aggregate_test.cc | 2 +-
cpp/src/arrow/compute/kernels/hash_aggregate.cc | 13 +-
cpp/src/arrow/compute/kernels/scalar_arithmetic.cc | 87 +
.../compute/kernels/scalar_arithmetic_test.cc | 110 +-
cpp/src/arrow/compute/kernels/util_internal.h | 90 +
cpp/src/arrow/compute/kernels/vector_sort.cc | 13 +-
cpp/src/arrow/csv/reader.cc | 234 +-
cpp/src/arrow/csv/reader.h | 11 +-
cpp/src/arrow/csv/reader_test.cc | 25 +-
cpp/src/arrow/dataset/dataset.h | 23 +-
cpp/src/arrow/dataset/dataset_internal.h | 2 +-
cpp/src/arrow/dataset/dataset_test.cc | 4 +-
cpp/src/arrow/dataset/discovery.h | 88 +-
cpp/src/arrow/dataset/file_base.cc | 101 +-
cpp/src/arrow/dataset/file_base.h | 20 +-
cpp/src/arrow/dataset/file_csv.cc | 74 +-
cpp/src/arrow/dataset/file_csv.h | 6 +
cpp/src/arrow/dataset/file_csv_test.cc | 16 +-
cpp/src/arrow/dataset/file_ipc.cc | 32 +-
cpp/src/arrow/dataset/file_ipc.h | 22 +-
cpp/src/arrow/dataset/file_ipc_test.cc | 31 +-
cpp/src/arrow/dataset/file_parquet.cc | 58 +-
cpp/src/arrow/dataset/file_parquet.h | 124 +-
cpp/src/arrow/dataset/file_parquet_test.cc | 5 +-
cpp/src/arrow/dataset/file_test.cc | 29 -
cpp/src/arrow/dataset/partition.h | 26 +-
cpp/src/arrow/dataset/scanner.cc | 387 +-
cpp/src/arrow/dataset/scanner.h | 291 +-
cpp/src/arrow/dataset/scanner_internal.h | 99 +-
cpp/src/arrow/dataset/scanner_test.cc | 226 +-
cpp/src/arrow/dataset/test_util.h | 216 +-
cpp/src/arrow/dataset/type_fwd.h | 2 +
cpp/src/arrow/filesystem/filesystem.cc | 66 +-
cpp/src/arrow/filesystem/filesystem.h | 46 +-
cpp/src/arrow/filesystem/filesystem_test.cc | 11 +-
cpp/src/arrow/filesystem/mockfs.cc | 20 +-
cpp/src/arrow/filesystem/mockfs.h | 11 +
cpp/src/arrow/filesystem/s3fs.cc | 288 +-
cpp/src/arrow/filesystem/s3fs.h | 23 +-
cpp/src/arrow/filesystem/s3fs_test.cc | 31 +
cpp/src/arrow/filesystem/test_util.cc | 23 +-
cpp/src/arrow/filesystem/test_util.h | 11 +-
cpp/src/arrow/flight/CMakeLists.txt | 15 +-
cpp/src/arrow/gpu/CMakeLists.txt | 4 +-
cpp/src/arrow/io/hdfs.cc | 20 +-
cpp/src/arrow/io/interfaces.cc | 5 +-
cpp/src/arrow/io/util_internal.h | 11 +
cpp/src/arrow/memory_pool.cc | 88 +-
cpp/src/arrow/public_api_test.cc | 32 +-
cpp/src/arrow/record_batch.h | 9 -
cpp/src/arrow/testing/future_util.h | 14 +-
cpp/src/arrow/type_fwd.h | 2 +
cpp/src/arrow/util/async_generator.h | 402 +-
cpp/src/arrow/util/async_generator_test.cc | 188 +-
cpp/src/arrow/util/bit_run_reader.h | 16 +-
cpp/src/arrow/util/bpacking.cc | 7 +
cpp/src/arrow/util/bpacking_avx2.cc | 114 +-
cpp/src/arrow/util/bpacking_avx2_codegen.py | 203 -
cpp/src/arrow/util/bpacking_avx512.cc | 114 +-
cpp/src/arrow/util/bpacking_avx512_codegen.py | 186 -
.../mod.rs => cpp/src/arrow/util/bpacking_neon.cc | 21 +-
.../src/arrow/util/bpacking_neon.h | 24 +-
cpp/src/arrow/util/bpacking_simd128_generated.h | 2138 +++
cpp/src/arrow/util/bpacking_simd256_generated.h | 1270 ++
cpp/src/arrow/util/bpacking_simd512_generated.h | 836 +
cpp/src/arrow/util/bpacking_simd_codegen.py | 209 +
cpp/src/arrow/util/bpacking_simd_internal.h | 138 +
cpp/src/arrow/util/config.h.cmake | 6 +
cpp/src/arrow/util/formatting.cc | 18 +
cpp/src/arrow/util/formatting.h | 16 +
cpp/src/arrow/util/future.h | 2 +-
cpp/src/arrow/util/future_test.cc | 33 +-
cpp/src/arrow/util/thread_pool.cc | 79 +
cpp/src/arrow/util/thread_pool.h | 87 +-
cpp/src/arrow/util/thread_pool_test.cc | 137 +
.../double-conversion/double-conversion.cc | 20 +-
.../vendored/double-conversion/double-conversion.h | 11 +
cpp/src/gandiva/CMakeLists.txt | 17 +-
cpp/src/gandiva/basic_decimal_scalar.h | 2 +
cpp/src/gandiva/decimal_scalar.h | 19 +
cpp/src/gandiva/dex.h | 43 +
cpp/src/gandiva/dex_visitor.h | 3 +
cpp/src/gandiva/expr_decomposer.cc | 12 +
cpp/src/gandiva/expr_decomposer.h | 1 +
cpp/src/gandiva/expr_validator.cc | 5 +
cpp/src/gandiva/expr_validator.h | 1 +
cpp/src/gandiva/formatting_utils.h | 69 +
cpp/src/gandiva/function_registry_common.h | 20 +
cpp/src/gandiva/function_registry_datetime.cc | 3 +
cpp/src/gandiva/function_registry_hash.cc | 12 +-
cpp/src/gandiva/function_registry_string.cc | 21 +
cpp/src/gandiva/gdv_function_stubs.cc | 664 +-
cpp/src/gandiva/gdv_function_stubs.h | 42 +
cpp/src/gandiva/gdv_function_stubs_test.cc | 130 +
cpp/src/gandiva/hash_utils.cc | 134 +
cpp/src/gandiva/{node_visitor.h => hash_utils.h} | 46 +-
cpp/src/gandiva/hash_utils_test.cc | 164 +
cpp/src/gandiva/in_holder.h | 19 +
cpp/src/gandiva/jni/jni_common.cc | 12 +
cpp/src/gandiva/llvm_generator.cc | 75 +-
cpp/src/gandiva/llvm_generator.h | 1 +
cpp/src/gandiva/node.h | 44 +
cpp/src/gandiva/node_visitor.h | 1 +
cpp/src/gandiva/precompiled/hash.cc | 2 +-
cpp/src/gandiva/precompiled/string_ops.cc | 64 +
cpp/src/gandiva/precompiled/string_ops_test.cc | 58 +
cpp/src/gandiva/precompiled/time.cc | 11 +
cpp/src/gandiva/precompiled/time_test.cc | 19 +
cpp/src/gandiva/precompiled/types.h | 7 +
cpp/src/gandiva/proto/Types.proto | 5 +
cpp/src/gandiva/tests/decimal_test.cc | 66 +
cpp/src/gandiva/tests/hash_test.cc | 287 +-
cpp/src/gandiva/tests/in_expr_test.cc | 61 +
cpp/src/gandiva/tests/utf8_test.cc | 50 +
cpp/src/gandiva/tree_expr_builder.cc | 12 +
cpp/src/gandiva/tree_expr_builder.h | 3 +
cpp/src/jni/dataset/jni_wrapper.cc | 47 +-
cpp/thirdparty/versions.txt | 7 +-
dev/archery/archery/benchmark/codec.py | 1 +
dev/archery/archery/benchmark/google.py | 5 +-
dev/archery/archery/bot.py | 231 +-
dev/archery/archery/cli.py | 18 +
.../archery/archery/crossbow/__init__.py | 14 +-
dev/archery/archery/crossbow/cli.py | 352 +
.../archery/crossbow/core.py} | 871 +-
dev/archery/archery/crossbow/reports.py | 302 +
.../tests/fixtures/crossbow-job.yaml | 0
.../tests/fixtures/crossbow-success-message.md | 0
.../archery/archery/crossbow/tests/test_core.py | 16 +-
.../archery/crossbow/tests/test_crossbow_cli.py | 66 +-
.../archery/crossbow/tests/test_reports.py} | 33 +-
dev/archery/archery/tests/test_benchmarks.py | 37 +
dev/archery/archery/tests/test_bot.py | 55 +-
dev/archery/conftest.py | 70 +
dev/archery/setup.py | 11 +-
.../{00-prepare-test.rb => 01-prepare-test.rb} | 8 +-
dev/release/{00-prepare.sh => 01-prepare.sh} | 72 +-
dev/release/{01-perform.sh => 03-binary-submit.sh} | 46 +-
.../release/04-binary-download.sh | 24 +-
dev/release/{03-binary.sh => 05-binary-upload.sh} | 17 +-
dev/release/binary-task.rb | 2 +-
dev/release/generate_force_push_script.py | 61 -
dev/release/post-09-docs.sh | 1 +
dev/release/post-11-java.sh | 69 +
dev/release/rat_exclude_files.txt | 15 +-
dev/release/verify-apt.sh | 39 +-
dev/release/verify-release-candidate.sh | 8 +-
dev/release/verify-yum.sh | 23 +-
...version10.2numpy1.17python3.6.____cpython.yaml} | 35 +-
...version10.2numpy1.17python3.7.____cpython.yaml} | 35 +-
...version10.2numpy1.17python3.8.____cpython.yaml} | 35 +-
...version10.2numpy1.19python3.9.____cpython.yaml} | 33 +-
...versionNonenumpy1.17python3.6.____cpython.yaml} | 33 +-
...versionNonenumpy1.17python3.7.____cpython.yaml} | 33 +-
...versionNonenumpy1.17python3.8.____cpython.yaml} | 33 +-
...versionNonenumpy1.19python3.9.____cpython.yaml} | 31 +-
... => osx_64_numpy1.17python3.6.____cpython.yaml} | 28 +-
... => osx_64_numpy1.17python3.7.____cpython.yaml} | 28 +-
... => osx_64_numpy1.17python3.8.____cpython.yaml} | 29 +-
... => osx_64_numpy1.19python3.9.____cpython.yaml} | 26 +-
...n.yaml => osx_arm64_python3.8.____cpython.yaml} | 36 +-
...n.yaml => osx_arm64_python3.9.____cpython.yaml} | 34 +-
...versionNonenumpy1.17python3.6.____cpython.yaml} | 20 +-
...versionNonenumpy1.17python3.7.____cpython.yaml} | 20 +-
...versionNonenumpy1.17python3.8.____cpython.yaml} | 20 +-
...versionNonenumpy1.19python3.9.____cpython.yaml} | 18 +-
dev/tasks/conda-recipes/.scripts/logging_utils.sh | 30 +
dev/tasks/conda-recipes/arrow-cpp/bld-arrow.bat | 14 +
dev/tasks/conda-recipes/arrow-cpp/bld-pyarrow.bat | 14 +-
dev/tasks/conda-recipes/arrow-cpp/build-arrow.sh | 39 +-
dev/tasks/conda-recipes/arrow-cpp/build-pyarrow.sh | 14 +-
dev/tasks/conda-recipes/arrow-cpp/meta.yaml | 97 +-
dev/tasks/conda-recipes/azure.linux.yml | 37 +-
dev/tasks/conda-recipes/azure.osx.yml | 49 +-
dev/tasks/conda-recipes/azure.win.yml | 42 +-
dev/tasks/conda-recipes/build_steps.sh | 4 +
dev/tasks/conda-recipes/drone-steps.sh | 6 +-
dev/tasks/conda-recipes/run_docker_build.sh | 4 +
dev/tasks/docker-tests/azure.linux.yml | 8 +-
dev/tasks/docker-tests/github.linux.yml | 34 +-
dev/tasks/gandiva-jars/build-cpp-linux.sh | 1 +
dev/tasks/gandiva-jars/build-cpp-osx.sh | 3 +-
dev/tasks/gandiva-jars/github.linux.yml | 31 +-
dev/tasks/gandiva-jars/github.osx.yml | 34 +-
dev/tasks/linux-packages/Rakefile | 2 +-
.../Rakefile | 6 +-
.../apt/debian-bullseye/Dockerfile | 0
.../apt/debian-buster/Dockerfile | 0
.../apt/ubuntu-bionic/Dockerfile | 0
.../apt/ubuntu-focal/Dockerfile | 0
.../apt/ubuntu-groovy/Dockerfile | 0
.../apt/ubuntu-xenial/Dockerfile | 0
.../debian/apache-arrow-apt-source.install} | 0
.../apache-arrow-apt-source/debian/changelog | 0
.../debian/compat | 0
.../debian/control | 6 +-
.../debian/copyright | 0
.../debian/rules | 8 +-
.../debian/source/format | 0
.../apache-arrow-archive-keyring/debian/changelog | 29 -
.../apache-arrow-release/yum/Apache-Arrow.repo | 6 +-
dev/tasks/linux-packages/github.linux.amd64.yml | 52 +-
dev/tasks/linux-packages/travis.linux.arm64.yml | 24 +-
dev/tasks/macros.jinja | 198 +
dev/tasks/nightlies.sample.yml | 27 +-
dev/tasks/nuget-packages/github.linux.yml | 60 +-
dev/tasks/python-sdist/github.yml | 56 +-
dev/tasks/python-wheels/github.linux.amd64.yml | 75 +-
dev/tasks/python-wheels/github.osx.yml | 44 +-
dev/tasks/python-wheels/github.windows.yml | 68 +-
dev/tasks/python-wheels/travis.linux.arm64.yml | 34 +-
dev/tasks/r/azure.linux.yml | 6 +-
dev/tasks/r/github.devdocs.yml | 92 +
dev/tasks/requirements-crossbow.txt | 7 -
dev/tasks/tasks.yml | 650 +-
dev/tasks/verify-rc/github.linux.yml | 29 +-
.../verify-rc/{github.osx.yml => github.macos.yml} | 29 +-
dev/tasks/verify-rc/github.win.yml | 29 +-
docker-compose.yml | 4 +-
docs/requirements.txt | 2 +-
docs/source/_static/arrow.png | Bin 0 -> 21636 bytes
docs/source/_static/favicon.ico | Bin 0 -> 15086 bytes
docs/source/_static/theme_overrides.css | 53 +
docs/source/_templates/docs-sidebar.html | 19 +
docs/source/_templates/layout.html | 14 +-
docs/source/conf.py | 14 +-
docs/source/cpp/api.rst | 1 +
docs/source/cpp/api/array.rst | 4 -
docs/source/cpp/api/compute.rst | 4 -
.../source/cpp/api/{filesystem.rst => dataset.rst} | 55 +-
docs/source/cpp/api/filesystem.rst | 4 -
docs/source/cpp/api/io.rst | 4 -
docs/source/cpp/api/ipc.rst | 4 -
docs/source/cpp/compute.rst | 8 +-
docs/source/cpp/dataset.rst | 403 +
.../dataset_documentation_example.rst} | 24 +-
docs/source/cpp/examples/index.rst | 1 +
.../cpp/examples/row_columnar_conversion.rst | 2 +-
docs/source/cpp/getting_started.rst | 1 +
docs/source/cpp/io.rst | 2 +
docs/source/cpp/memory.rst | 4 -
docs/source/cpp/parquet.rst | 4 -
docs/source/developers/contributing.rst | 8 +-
docs/source/developers/cpp/windows.rst | 2 +-
docs/source/developers/crossbow.rst | 42 +-
docs/source/format/Guidelines.rst | 2 +
docs/source/format/IPC.rst | 2 +
docs/source/format/Layout.rst | 2 +
docs/source/format/Metadata.rst | 2 +
docs/source/python/api/compute.rst | 2 +
docs/source/python/dataset.rst | 38 +-
docs/source/python/plasma.rst | 3 -
docs/source/status.rst | 2 +-
.../apache/arrow/gandiva/expression/InNode.java | 34 +-
.../arrow/gandiva/expression/TreeBuilder.java | 6 +
.../arrow/gandiva/evaluator/BaseEvaluatorTest.java | 13 +-
.../arrow/gandiva/evaluator/ProjectorTest.java | 279 +-
java/pom.xml | 12 +-
js/.eslintignore | 1 +
js/.eslintrc.js | 87 +
js/.gitignore | 2 +-
js/DEVELOP.md | 39 +-
js/README.md | 3 +-
js/bin/integration.js | 2 +-
js/bin/json-to-arrow.js | 2 +-
js/examples/read_file.html | 2 +-
js/gulp/argv.js | 4 -
js/gulp/arrow-task.js | 10 +-
js/gulp/closure-task.js | 8 +-
js/gulp/package-task.js | 8 +-
js/gulp/test-task.js | 18 +-
js/gulp/util.js | 4 +-
js/gulpfile.js | 8 +-
js/jest.coverage.config.js | 14 +-
js/lerna.json | 3 +-
js/npm-release.sh | 6 +-
js/package-lock.json | 17908 -------------------
js/package.json | 52 +-
js/perf/index.js | 32 +-
js/perf/table_config.js | 8 +-
js/src/bin/arrow2csv.ts | 32 +-
js/src/builder.ts | 25 +-
js/src/builder/buffer.ts | 6 +-
js/src/builder/dictionary.ts | 4 +-
js/src/builder/map.ts | 2 +-
js/src/builder/run.ts | 3 +-
js/src/builder/union.ts | 2 -
js/src/builder/valid.ts | 2 +-
js/src/column.ts | 2 +-
js/src/compute/dataframe.ts | 75 +-
js/src/compute/predicate.ts | 6 +-
js/src/data.ts | 17 +-
.../fb/.eslintrc.js} | 17 +-
js/src/fb/File.ts | 18 +-
js/src/fb/Message.ts | 42 +-
js/src/fb/Schema.ts | 136 +-
js/src/io/adapters.ts | 20 +-
js/src/io/file.ts | 11 +-
js/src/io/interfaces.ts | 13 +-
js/src/io/node/iterable.ts | 6 +-
js/src/io/node/reader.ts | 4 +-
js/src/io/node/writer.ts | 2 +-
js/src/io/stream.ts | 13 +-
js/src/io/whatwg/builder.ts | 4 +-
js/src/io/whatwg/writer.ts | 2 +-
js/src/ipc/metadata/file.ts | 8 +-
js/src/ipc/metadata/json.ts | 5 +-
js/src/ipc/metadata/message.ts | 14 +-
js/src/ipc/reader.ts | 20 +-
js/src/ipc/writer.ts | 9 +-
js/src/recordbatch.ts | 4 +-
js/src/schema.ts | 4 +-
js/src/table.ts | 10 +-
js/src/type.ts | 89 +-
js/src/util/args.ts | 20 +-
js/src/util/bit.ts | 52 +-
js/src/util/bn.ts | 19 +-
js/src/util/buffer.ts | 12 +-
js/src/util/compat.ts | 1 +
js/src/util/int.ts | 24 +-
js/src/util/math.ts | 8 +-
js/src/util/recordbatch.ts | 9 +-
js/src/util/vector.ts | 6 +-
js/src/vector/chunked.ts | 66 +-
js/src/vector/float.ts | 6 +-
js/src/vector/index.ts | 4 +-
js/src/vector/int.ts | 12 +-
js/src/vector/map.ts | 8 +-
js/src/vector/row.ts | 9 +-
js/src/vector/struct.ts | 3 +-
js/src/visitor.ts | 12 +-
js/src/visitor/indexof.ts | 4 +-
js/src/visitor/iterator.ts | 34 +-
js/src/visitor/jsontypeassembler.ts | 4 +-
js/src/visitor/jsonvectorassembler.ts | 22 +-
js/src/visitor/set.ts | 3 +-
js/src/visitor/vectorloader.ts | 4 +-
js/{jest.coverage.config.js => test/.eslintrc.js} | 23 +-
js/test/Arrow.ts | 4 +-
js/test/data/tables/generate.py | 15 +-
js/test/generate-test-data.ts | 13 +-
js/test/inference/column.ts | 2 +
js/test/inference/nested.ts | 4 +-
js/test/jest-extensions.ts | 4 +-
js/test/unit/bit-tests.ts | 41 +
js/test/unit/builders/date-tests.ts | 4 +-
js/test/unit/builders/utils.ts | 9 +-
js/test/unit/generated-data-validators.ts | 6 +-
js/test/unit/ipc/helpers.ts | 3 -
js/test/unit/ipc/reader/from-inference-tests.ts | 2 +-
js/test/unit/ipc/reader/json-reader-tests.ts | 1 -
js/test/unit/ipc/reader/streams-dom-tests.ts | 2 -
js/test/unit/ipc/reader/streams-node-tests.ts | 3 -
js/test/unit/ipc/writer/json-writer-tests.ts | 1 -
js/test/unit/ipc/writer/stream-writer-tests.ts | 2 +-
js/test/unit/ipc/writer/streams-dom-tests.ts | 9 +-
js/test/unit/ipc/writer/streams-node-tests.ts | 9 +-
js/test/unit/recordbatch/record-batch-tests.ts | 30 +-
js/test/unit/table-tests.ts | 57 +-
js/test/unit/table/assign-tests.ts | 4 +
js/test/unit/table/serialize-tests.ts | 20 +-
js/{jest.coverage.config.js => test/unit/utils.ts} | 17 +-
js/test/unit/vector/numeric-vector-tests.ts | 2 +
js/test/unit/visitor-tests.ts | 4 +-
js/tsconfig.json | 6 +-
js/tsconfig/tsconfig.base.json | 2 +-
js/tsconfig/tsconfig.bin.cjs.json | 2 +-
js/tsconfig/tsconfig.es2015.cjs.json | 2 +-
js/tsconfig/tsconfig.es2015.cls.json | 2 +-
js/tsconfig/tsconfig.es2015.esm.json | 2 +-
js/tsconfig/tsconfig.es5.cjs.json | 2 +-
js/tsconfig/tsconfig.es5.cls.json | 2 +-
js/tsconfig/tsconfig.es5.esm.json | 2 +-
js/tsconfig/tsconfig.esnext.cjs.json | 2 +-
js/tsconfig/tsconfig.esnext.cls.json | 2 +-
js/tsconfig/tsconfig.esnext.esm.json | 2 +-
js/tslint.json | 39 -
js/yarn.lock | 10958 ++++++++++++
.../matlab_interface_for_apache_arrow_design.md | 366 +
python/pyarrow/_dataset.pyx | 400 +-
python/pyarrow/_parquet.pxd | 3 +
python/pyarrow/_s3fs.pyx | 43 +-
python/pyarrow/dataset.py | 6 +-
python/pyarrow/hdfs.py | 16 +-
python/pyarrow/includes/libarrow_dataset.pxd | 20 +-
python/pyarrow/includes/libarrow_fs.pxd | 13 +
python/pyarrow/pandas_compat.py | 19 +-
python/pyarrow/parquet.py | 29 +-
python/pyarrow/serialization.pxi | 49 +-
python/pyarrow/tests/parquet/test_dataset.py | 17 +
python/pyarrow/tests/test_dataset.py | 127 +-
python/pyarrow/tests/test_fs.py | 141 +
python/pyarrow/tests/test_hdfs.py | 11 +-
r/DESCRIPTION | 5 +-
r/NAMESPACE | 6 +
r/NEWS.md | 42 +-
r/R/arrow-package.R | 54 +-
r/R/arrowExports.R | 44 +-
r/R/compute.R | 60 +-
r/R/dataset-format.R | 33 +-
r/R/dataset-scan.R | 19 +-
r/R/dataset.R | 33 +-
r/R/dplyr.R | 15 +
r/R/enums.R | 6 +
r/R/expression.R | 3 +-
r/R/feather.R | 11 +-
r/R/install-arrow.R | 92 +-
r/R/json.R | 16 +-
r/R/parquet.R | 10 +-
r/R/record-batch.R | 1 +
r/R/schema.R | 50 +
r/R/type.R | 7 +-
r/R/util.R | 18 +-
r/README.md | 405 +-
r/_pkgdown.yml | 26 +-
r/configure | 12 +-
r/data-raw/codegen.R | 11 +-
r/inst/build_arrow_static.sh | 2 +-
r/man/call_function.Rd | 46 +
r/man/data-type.Rd | 4 +-
r/man/enums.Rd | 5 +
r/man/list_compute_functions.Rd | 39 +
r/man/read_feather.Rd | 2 +-
r/man/read_json_arrow.Rd | 10 +-
r/pkgdown/extra.js | 65 +
r/src/arrowExports.cpp | 2488 ++-
r/src/compute.cpp | 13 +-
r/src/dataset.cpp | 75 +-
r/src/filesystem.cpp | 7 +-
r/src/json.cpp | 12 +-
r/src/recordbatchreader.cpp | 8 +-
r/src/recordbatchwriter.cpp | 2 +
r/src/schema.cpp | 20 +
r/tests/testthat/helper-expectation.R | 32 +-
r/tests/testthat/test-Array.R | 6 +-
r/tests/testthat/test-RecordBatch.R | 4 +-
r/tests/testthat/test-Table.R | 6 +-
r/tests/testthat/test-arrow-info.R | 2 +-
r/tests/testthat/test-buffer-reader.R | 8 +-
r/tests/testthat/test-buffer.R | 10 +-
r/tests/testthat/test-chunked-array.R | 6 +-
r/tests/testthat/test-compute-aggregate.R | 36 +-
r/tests/testthat/test-compute-arith.R | 27 +
r/tests/testthat/test-compute-vector.R | 2 +-
r/tests/testthat/test-data-type.R | 6 +-
r/tests/testthat/test-dataset.R | 83 +-
r/tests/testthat/test-dplyr-filter.R | 26 +-
r/tests/testthat/test-dplyr-mutate.R | 2 +-
r/tests/testthat/test-dplyr.R | 164 +-
r/tests/testthat/test-expression.R | 44 +-
r/tests/testthat/test-feather.R | 36 +-
r/tests/testthat/test-filesystem.R | 16 +-
r/tests/testthat/test-json.R | 94 +-
r/tests/testthat/test-memory-pool.R | 4 +-
r/tests/testthat/test-message-reader.R | 32 +-
r/tests/testthat/test-message.R | 12 +-
r/tests/testthat/test-metadata.R | 2 +-
r/tests/testthat/test-parquet.R | 18 +
r/tests/testthat/test-python.R | 16 +-
r/tests/testthat/test-read-record-batch.R | 2 +-
r/tests/testthat/test-read-write.R | 2 +-
r/tests/testthat/test-record-batch-reader.R | 26 +-
r/tests/testthat/test-s3-minio.R | 2 +-
r/tests/testthat/test-scalar.R | 2 +-
r/tests/testthat/test-schema.R | 64 +-
r/tests/testthat/test-type.R | 38 +
r/tools/nixlibs.R | 6 +-
r/vignettes/arrow.Rmd | 39 +
r/vignettes/dataset.Rmd | 159 +-
r/vignettes/developing.Rmd | 520 +
r/vignettes/install.Rmd | 67 +-
rust/Cargo.toml | 2 +-
rust/README.md | 1 +
rust/arrow/README.md | 2 -
rust/arrow/src/array/array_primitive.rs | 29 +-
rust/arrow/src/array/iterator.rs | 161 +-
rust/arrow/src/array/transform/mod.rs | 109 +-
rust/arrow/src/buffer/immutable.rs | 2 +
rust/arrow/src/buffer/mutable.rs | 4 +
rust/arrow/src/compute/kernels/boolean.rs | 143 +-
rust/arrow/src/datatypes/types.rs | 4 +
rust/arrow/src/json/writer.rs | 348 +-
rust/arrow/src/temporal_conversions.rs | 26 +-
.../js_test.sh => rust/ballista/.dockerignore | 13 +-
rust/ballista/README.md | 64 +
.../ballista/dev/build-rust-base.sh | 18 +-
.../crossbow.py => rust/ballista/dev/build-rust.sh | 9 +-
.../ballista/dev/integration-tests.sh | 19 +-
rust/ballista/docker/README.md | 29 +
rust/ballista/docker/rust-base.dockerfile | 99 +
rust/ballista/docker/rust.dockerfile | 71 +
rust/ballista/docs/README.md | 37 +
rust/ballista/docs/architecture.md | 75 +
rust/ballista/docs/dev-env-rust.md | 38 +
rust/ballista/docs/images/query-execution.png | Bin 0 -> 11378 bytes
rust/ballista/docs/integration-testing.md | 32 +
rust/ballista/docs/release-process.md | 68 +
rust/ballista/docs/rust-docker.md | 66 +
rust/ballista/docs/user-guide/.gitignore | 2 +
rust/ballista/docs/user-guide/README.md | 36 +
.../ballista/docs/user-guide/book.toml | 18 +-
rust/ballista/docs/user-guide/src/SUMMARY.md | 30 +
rust/ballista/docs/user-guide/src/client-rust.md | 22 +
rust/ballista/docs/user-guide/src/clients.md | 22 +
rust/ballista/docs/user-guide/src/configuration.md | 32 +
rust/ballista/docs/user-guide/src/deployment.md | 26 +
.../ballista/docs/user-guide/src/docker-compose.md | 55 +
rust/ballista/docs/user-guide/src/faq.md | 31 +
.../user-guide/src/img/ballista-architecture.png | Bin 0 -> 21225 bytes
rust/ballista/docs/user-guide/src/introduction.md | 52 +
rust/ballista/docs/user-guide/src/kubernetes.md | 216 +
rust/ballista/docs/user-guide/src/standalone.md | 92 +
.../js_test.sh => rust/ballista/rust/.dockerignore | 18 +-
rust/ballista/rust/.gitignore | 2 +
.../js_test.sh => rust/ballista/rust/Cargo.toml | 21 +-
.../ballista/rust/benchmarks/tpch/.dockerignore | 18 +-
rust/ballista/rust/benchmarks/tpch/.gitignore | 1 +
.../ballista/rust/benchmarks/tpch/Cargo.toml | 78 +-
rust/ballista/rust/benchmarks/tpch/README.md | 104 +
.../rust/benchmarks/tpch/docker-compose.yaml | 62 +
.../ballista/rust/benchmarks/tpch/entrypoint.sh | 17 +-
rust/ballista/rust/benchmarks/tpch/queries/q1.sql | 21 +
rust/ballista/rust/benchmarks/tpch/queries/q10.sql | 31 +
rust/ballista/rust/benchmarks/tpch/queries/q11.sql | 27 +
rust/ballista/rust/benchmarks/tpch/queries/q12.sql | 30 +
rust/ballista/rust/benchmarks/tpch/queries/q13.sql | 20 +
rust/ballista/rust/benchmarks/tpch/queries/q14.sql | 13 +
rust/ballista/rust/benchmarks/tpch/queries/q16.sql | 30 +
rust/ballista/rust/benchmarks/tpch/queries/q17.sql | 17 +
rust/ballista/rust/benchmarks/tpch/queries/q18.sql | 32 +
rust/ballista/rust/benchmarks/tpch/queries/q19.sql | 35 +
rust/ballista/rust/benchmarks/tpch/queries/q2.sql | 43 +
rust/ballista/rust/benchmarks/tpch/queries/q20.sql | 37 +
rust/ballista/rust/benchmarks/tpch/queries/q21.sql | 39 +
rust/ballista/rust/benchmarks/tpch/queries/q22.sql | 37 +
rust/ballista/rust/benchmarks/tpch/queries/q3.sql | 22 +
rust/ballista/rust/benchmarks/tpch/queries/q4.sql | 21 +
rust/ballista/rust/benchmarks/tpch/queries/q5.sql | 24 +
rust/ballista/rust/benchmarks/tpch/queries/q6.sql | 9 +
rust/ballista/rust/benchmarks/tpch/queries/q7.sql | 39 +
rust/ballista/rust/benchmarks/tpch/queries/q8.sql | 37 +
rust/ballista/rust/benchmarks/tpch/queries/q9.sql | 32 +
.../ballista/rust/benchmarks/tpch/run.sh | 13 +-
rust/ballista/rust/benchmarks/tpch/src/main.rs | 360 +
.../ballista/rust/benchmarks/tpch/tpch-gen.sh | 22 +-
.../rust/benchmarks/tpch/tpchgen.dockerfile | 25 +-
.../ballista/rust/client/Cargo.toml | 40 +-
rust/ballista/rust/client/README.md | 22 +
rust/ballista/rust/client/src/columnar_batch.rs | 167 +
rust/ballista/rust/client/src/context.rs | 400 +
.../ballista/rust/client/src/lib.rs | 16 +-
.../ballista/rust/client/src/prelude.rs | 19 +-
rust/ballista/rust/core/Cargo.toml | 54 +
rust/ballista/rust/core/README.md | 21 +
.../mod.rs => ballista/rust/core/build.rs} | 18 +-
rust/ballista/rust/core/proto/ballista.proto | 824 +
rust/ballista/rust/core/src/client.rs | 224 +
rust/ballista/rust/core/src/datasource.rs | 72 +
rust/ballista/rust/core/src/error.rs | 172 +
.../ballista/rust/core/src/execution_plans/mod.rs | 23 +-
.../rust/core/src/execution_plans/query_stage.rs | 92 +
.../core/src/execution_plans/shuffle_reader.rs | 106 +
.../core/src/execution_plans/unresolved_shuffle.rs | 101 +
.../mod.rs => ballista/rust/core/src/lib.rs} | 22 +-
rust/ballista/rust/core/src/memory_stream.rs | 93 +
.../rust/core/src/serde/logical_plan/from_proto.rs | 1200 ++
.../rust/core/src/serde/logical_plan/mod.rs | 929 +
.../rust/core/src/serde/logical_plan/to_proto.rs | 1233 ++
rust/ballista/rust/core/src/serde/mod.rs | 69 +
.../core/src/serde/physical_plan/from_proto.rs | 398 +
.../rust/core/src/serde/physical_plan/mod.rs | 178 +
.../rust/core/src/serde/physical_plan/to_proto.rs | 556 +
.../rust/core/src/serde/scheduler/from_proto.rs | 124 +
rust/ballista/rust/core/src/serde/scheduler/mod.rs | 262 +
.../rust/core/src/serde/scheduler/to_proto.rs | 90 +
rust/ballista/rust/core/src/utils.rs | 309 +
rust/ballista/rust/executor/Cargo.toml | 63 +
rust/ballista/rust/executor/README.md | 31 +
.../ballista/rust/executor/build.rs | 20 +-
.../executor/examples/example_executor_config.toml | 17 +-
.../rust/executor/executor_config_spec.toml | 79 +
rust/ballista/rust/executor/src/collect.rs | 127 +
rust/ballista/rust/executor/src/execution_loop.rs | 172 +
rust/ballista/rust/executor/src/flight_service.rs | 374 +
.../ballista/rust/executor/src/lib.rs | 45 +-
rust/ballista/rust/executor/src/main.rs | 176 +
rust/ballista/rust/scheduler/Cargo.toml | 69 +
rust/ballista/rust/scheduler/README.md | 43 +
.../ballista/rust/scheduler/build.rs | 20 +-
.../rust/scheduler/scheduler_config_spec.toml | 60 +
rust/ballista/rust/scheduler/src/api/handlers.rs | 40 +
rust/ballista/rust/scheduler/src/api/mod.rs | 87 +
rust/ballista/rust/scheduler/src/lib.rs | 505 +
rust/ballista/rust/scheduler/src/main.rs | 155 +
rust/ballista/rust/scheduler/src/planner.rs | 494 +
rust/ballista/rust/scheduler/src/state/etcd.rs | 121 +
rust/ballista/rust/scheduler/src/state/mod.rs | 835 +
.../rust/scheduler/src/state/standalone.rs | 161 +
rust/ballista/rust/scheduler/src/test_utils.rs | 148 +
.../rust/scheduler/testdata/customer/customer.tbl | 10 +
.../scheduler/testdata/lineitem/partition0.tbl | 10 +
.../scheduler/testdata/lineitem/partition1.tbl | 10 +
.../rust/scheduler/testdata/nation/nation.tbl | 10 +
.../rust/scheduler/testdata/orders/orders.tbl | 10 +
.../ballista/rust/scheduler/testdata/part/part.tbl | 10 +
.../rust/scheduler/testdata/partsupp/partsupp.tbl | 10 +
.../rust/scheduler/testdata/region/region.tbl | 5 +
.../rust/scheduler/testdata/supplier/supplier.tbl | 10 +
rust/datafusion/README.md | 5 +-
rust/datafusion/src/datasource/parquet.rs | 5 +-
rust/datafusion/src/execution/context.rs | 328 +-
rust/datafusion/src/lib.rs | 1 +
rust/datafusion/src/optimizer/mod.rs | 1 -
.../src/physical_optimizer/coalesce_batches.rs | 88 +
.../src/physical_optimizer/merge_exec.rs | 74 +
.../src/{optimizer => physical_optimizer}/mod.rs | 14 +-
.../datafusion/src/physical_optimizer/optimizer.rs | 36 +-
.../src/physical_optimizer/repartition.rs | 186 +
rust/datafusion/src/physical_plan/aggregates.rs | 19 +-
.../src/physical_plan/datetime_expressions.rs | 4 +-
.../src/physical_plan/expressions/min_max.rs | 49 +-
rust/datafusion/src/physical_plan/group_scalar.rs | 24 +-
.../datafusion/src/physical_plan/hash_aggregate.rs | 38 +-
rust/datafusion/src/physical_plan/limit.rs | 61 +-
rust/datafusion/src/physical_plan/mod.rs | 48 +-
rust/datafusion/src/physical_plan/parquet.rs | 4 +-
rust/datafusion/src/physical_plan/planner.rs | 90 +-
rust/datafusion/src/scalar.rs | 132 +-
rust/datafusion/src/sql/planner.rs | 2 +-
rust/datafusion/src/test/exec.rs | 102 +
rust/datafusion/src/test/mod.rs | 119 +
rust/datafusion/tests/sql.rs | 18 +-
rust/datafusion/tests/user_defined_plan.rs | 9 +-
rust/parquet/src/arrow/arrow_writer.rs | 2 +-
676 files changed, 47853 insertions(+), 25678 deletions(-)
create mode 100644 ci/docker/ubuntu-20.10-cpp.dockerfile
create mode 100755 ci/scripts/r_pkgdown_check.sh
create mode 100644 cpp/cmake_modules/Find-c-aresAlt.cmake
create mode 100644 cpp/cmake_modules/FindOpenSSLAlt.cmake
create mode 100644 cpp/examples/arrow/dataset_documentation_example.cc
delete mode 100644 cpp/src/arrow/util/bpacking_avx2_codegen.py
delete mode 100644 cpp/src/arrow/util/bpacking_avx512_codegen.py
copy rust/datafusion/src/optimizer/mod.rs =>
cpp/src/arrow/util/bpacking_neon.cc (62%)
copy js/jest.coverage.config.js => cpp/src/arrow/util/bpacking_neon.h (73%)
create mode 100644 cpp/src/arrow/util/bpacking_simd128_generated.h
create mode 100644 cpp/src/arrow/util/bpacking_simd256_generated.h
create mode 100644 cpp/src/arrow/util/bpacking_simd512_generated.h
create mode 100644 cpp/src/arrow/util/bpacking_simd_codegen.py
create mode 100644 cpp/src/arrow/util/bpacking_simd_internal.h
create mode 100644 cpp/src/gandiva/formatting_utils.h
create mode 100644 cpp/src/gandiva/hash_utils.cc
copy cpp/src/gandiva/{node_visitor.h => hash_utils.h} (51%)
create mode 100644 cpp/src/gandiva/hash_utils_test.cc
copy ci/scripts/js_test.sh => dev/archery/archery/crossbow/__init__.py (85%)
mode change 100755 => 100644
create mode 100644 dev/archery/archery/crossbow/cli.py
rename dev/{tasks/crossbow.py => archery/archery/crossbow/core.py} (57%)
mode change 100755 => 100644
create mode 100644 dev/archery/archery/crossbow/reports.py
rename dev/archery/archery/{ => crossbow}/tests/fixtures/crossbow-job.yaml
(100%)
rename dev/archery/archery/{ =>
crossbow}/tests/fixtures/crossbow-success-message.md (100%)
copy ci/scripts/js_test.sh => dev/archery/archery/crossbow/tests/test_core.py
(78%)
mode change 100755 => 100644
copy .github/workflows/dev_pr/labeler.yml =>
dev/archery/archery/crossbow/tests/test_crossbow_cli.py (50%)
copy
dev/{tasks/linux-packages/apache-arrow-archive-keyring/apt/debian-bullseye/Dockerfile
=> archery/archery/crossbow/tests/test_reports.py} (56%)
create mode 100644 dev/archery/conftest.py
rename dev/release/{00-prepare-test.rb => 01-prepare-test.rb} (99%)
rename dev/release/{00-prepare.sh => 01-prepare.sh} (83%)
rename dev/release/{01-perform.sh => 03-binary-submit.sh} (53%)
copy ci/scripts/integration_kartothek.sh => dev/release/04-binary-download.sh
(62%)
rename dev/release/{03-binary.sh => 05-binary-upload.sh} (91%)
delete mode 100755 dev/release/generate_force_push_script.py
create mode 100755 dev/release/post-11-java.sh
rename
dev/tasks/conda-recipes/.ci_support/{linux_cuda_compiler_version9.2python3.6.____cpython.yaml
=> linux_64_cuda_compiler_version10.2numpy1.17python3.6.____cpython.yaml} (76%)
rename
dev/tasks/conda-recipes/.ci_support/{linux_cuda_compiler_version9.2python3.7.____cpython.yaml
=> linux_64_cuda_compiler_version10.2numpy1.17python3.7.____cpython.yaml} (76%)
rename
dev/tasks/conda-recipes/.ci_support/{linux_cuda_compiler_version9.2python3.8.____cpython.yaml
=> linux_64_cuda_compiler_version10.2numpy1.17python3.8.____cpython.yaml} (76%)
rename
dev/tasks/conda-recipes/.ci_support/{linux_cuda_compiler_version9.2python3.9.____cpython.yaml
=> linux_64_cuda_compiler_version10.2numpy1.19python3.9.____cpython.yaml} (77%)
rename
dev/tasks/conda-recipes/.ci_support/{linux_cuda_compiler_versionNonepython3.6.____cpython.yaml
=> linux_64_cuda_compiler_versionNonenumpy1.17python3.6.____cpython.yaml} (77%)
rename
dev/tasks/conda-recipes/.ci_support/{linux_cuda_compiler_versionNonepython3.7.____cpython.yaml
=> linux_64_cuda_compiler_versionNonenumpy1.17python3.7.____cpython.yaml} (77%)
rename
dev/tasks/conda-recipes/.ci_support/{linux_cuda_compiler_versionNonepython3.8.____cpython.yaml
=> linux_64_cuda_compiler_versionNonenumpy1.17python3.8.____cpython.yaml} (77%)
rename
dev/tasks/conda-recipes/.ci_support/{linux_cuda_compiler_versionNonepython3.9.____cpython.yaml
=> linux_64_cuda_compiler_versionNonenumpy1.19python3.9.____cpython.yaml} (78%)
rename dev/tasks/conda-recipes/.ci_support/{osx_python3.6.____cpython.yaml =>
osx_64_numpy1.17python3.6.____cpython.yaml} (81%)
rename dev/tasks/conda-recipes/.ci_support/{osx_python3.7.____cpython.yaml =>
osx_64_numpy1.17python3.7.____cpython.yaml} (81%)
rename dev/tasks/conda-recipes/.ci_support/{osx_python3.8.____cpython.yaml =>
osx_64_numpy1.17python3.8.____cpython.yaml} (77%)
copy dev/tasks/conda-recipes/.ci_support/{osx_python3.9.____cpython.yaml =>
osx_64_numpy1.19python3.9.____cpython.yaml} (82%)
copy dev/tasks/conda-recipes/.ci_support/{osx_python3.9.____cpython.yaml =>
osx_arm64_python3.8.____cpython.yaml} (71%)
rename dev/tasks/conda-recipes/.ci_support/{osx_python3.9.____cpython.yaml =>
osx_arm64_python3.9.____cpython.yaml} (74%)
rename dev/tasks/conda-recipes/.ci_support/{win_python3.6.____cpython.yaml =>
win_64_cuda_compiler_versionNonenumpy1.17python3.6.____cpython.yaml} (82%)
rename dev/tasks/conda-recipes/.ci_support/{win_python3.7.____cpython.yaml =>
win_64_cuda_compiler_versionNonenumpy1.17python3.7.____cpython.yaml} (82%)
rename dev/tasks/conda-recipes/.ci_support/{win_python3.8.____cpython.yaml =>
win_64_cuda_compiler_versionNonenumpy1.17python3.8.____cpython.yaml} (82%)
rename dev/tasks/conda-recipes/.ci_support/{win_python3.9.____cpython.yaml =>
win_64_cuda_compiler_versionNonenumpy1.19python3.9.____cpython.yaml} (83%)
create mode 100644 dev/tasks/conda-recipes/.scripts/logging_utils.sh
mode change 100755 => 100644 dev/tasks/conda-recipes/arrow-cpp/build-arrow.sh
mode change 100755 => 100644 dev/tasks/conda-recipes/arrow-cpp/build-pyarrow.sh
rename dev/tasks/linux-packages/{apache-arrow-archive-keyring =>
apache-arrow-apt-source}/Rakefile (92%)
rename dev/tasks/linux-packages/{apache-arrow-archive-keyring =>
apache-arrow-apt-source}/apt/debian-bullseye/Dockerfile (100%)
rename dev/tasks/linux-packages/{apache-arrow-archive-keyring =>
apache-arrow-apt-source}/apt/debian-buster/Dockerfile (100%)
rename dev/tasks/linux-packages/{apache-arrow-archive-keyring =>
apache-arrow-apt-source}/apt/ubuntu-bionic/Dockerfile (100%)
rename dev/tasks/linux-packages/{apache-arrow-archive-keyring =>
apache-arrow-apt-source}/apt/ubuntu-focal/Dockerfile (100%)
rename dev/tasks/linux-packages/{apache-arrow-archive-keyring =>
apache-arrow-apt-source}/apt/ubuntu-groovy/Dockerfile (100%)
rename dev/tasks/linux-packages/{apache-arrow-archive-keyring =>
apache-arrow-apt-source}/apt/ubuntu-xenial/Dockerfile (100%)
rename
dev/tasks/linux-packages/{apache-arrow-archive-keyring/debian/apache-arrow-archive-keyring.install
=> apache-arrow-apt-source/debian/apache-arrow-apt-source.install} (100%)
copy python/pyarrow/tests/__init__.py =>
dev/tasks/linux-packages/apache-arrow-apt-source/debian/changelog (100%)
rename dev/tasks/linux-packages/{apache-arrow-archive-keyring =>
apache-arrow-apt-source}/debian/compat (100%)
rename dev/tasks/linux-packages/{apache-arrow-archive-keyring =>
apache-arrow-apt-source}/debian/control (77%)
rename dev/tasks/linux-packages/{apache-arrow-archive-keyring =>
apache-arrow-apt-source}/debian/copyright (100%)
rename dev/tasks/linux-packages/{apache-arrow-archive-keyring =>
apache-arrow-apt-source}/debian/rules (75%)
rename dev/tasks/linux-packages/{apache-arrow-archive-keyring =>
apache-arrow-apt-source}/debian/source/format (100%)
delete mode 100644
dev/tasks/linux-packages/apache-arrow-archive-keyring/debian/changelog
create mode 100644 dev/tasks/macros.jinja
create mode 100644 dev/tasks/r/github.devdocs.yml
delete mode 100644 dev/tasks/requirements-crossbow.txt
rename dev/tasks/verify-rc/{github.osx.yml => github.macos.yml} (68%)
create mode 100644 docs/source/_static/arrow.png
create mode 100644 docs/source/_static/favicon.ico
create mode 100644 docs/source/_templates/docs-sidebar.html
copy docs/source/cpp/api/{filesystem.rst => dataset.rst} (61%)
create mode 100644 docs/source/cpp/dataset.rst
copy docs/source/cpp/{getting_started.rst =>
examples/dataset_documentation_example.rst} (74%)
create mode 100644 js/.eslintignore
create mode 100644 js/.eslintrc.js
delete mode 100644 js/package-lock.json
copy js/{jest.coverage.config.js => src/fb/.eslintrc.js} (75%)
copy js/{jest.coverage.config.js => test/.eslintrc.js} (67%)
create mode 100644 js/test/unit/bit-tests.ts
copy js/{jest.coverage.config.js => test/unit/utils.ts} (73%)
delete mode 100644 js/tslint.json
create mode 100644 js/yarn.lock
create mode 100644 matlab/doc/matlab_interface_for_apache_arrow_design.md
create mode 100644 r/man/call_function.Rd
create mode 100644 r/man/list_compute_functions.Rd
create mode 100644 r/pkgdown/extra.js
create mode 100644 r/vignettes/developing.Rmd
copy ci/scripts/js_test.sh => rust/ballista/.dockerignore (88%)
mode change 100755 => 100644
create mode 100644 rust/ballista/README.md
copy ci/scripts/js_test.sh => rust/ballista/dev/build-rust-base.sh (84%)
rename dev/archery/archery/utils/crossbow.py =>
rust/ballista/dev/build-rust.sh (80%)
mode change 100644 => 100755
copy ci/scripts/js_test.sh => rust/ballista/dev/integration-tests.sh (82%)
create mode 100644 rust/ballista/docker/README.md
create mode 100644 rust/ballista/docker/rust-base.dockerfile
create mode 100644 rust/ballista/docker/rust.dockerfile
create mode 100644 rust/ballista/docs/README.md
create mode 100644 rust/ballista/docs/architecture.md
create mode 100644 rust/ballista/docs/dev-env-rust.md
create mode 100644 rust/ballista/docs/images/query-execution.png
create mode 100644 rust/ballista/docs/integration-testing.md
create mode 100644 rust/ballista/docs/release-process.md
create mode 100644 rust/ballista/docs/rust-docker.md
create mode 100644 rust/ballista/docs/user-guide/.gitignore
create mode 100644 rust/ballista/docs/user-guide/README.md
copy ci/scripts/js_test.sh => rust/ballista/docs/user-guide/book.toml (87%)
mode change 100755 => 100644
create mode 100644 rust/ballista/docs/user-guide/src/SUMMARY.md
create mode 100644 rust/ballista/docs/user-guide/src/client-rust.md
create mode 100644 rust/ballista/docs/user-guide/src/clients.md
create mode 100644 rust/ballista/docs/user-guide/src/configuration.md
create mode 100644 rust/ballista/docs/user-guide/src/deployment.md
create mode 100644 rust/ballista/docs/user-guide/src/docker-compose.md
create mode 100644 rust/ballista/docs/user-guide/src/faq.md
create mode 100644
rust/ballista/docs/user-guide/src/img/ballista-architecture.png
create mode 100644 rust/ballista/docs/user-guide/src/introduction.md
create mode 100644 rust/ballista/docs/user-guide/src/kubernetes.md
create mode 100644 rust/ballista/docs/user-guide/src/standalone.md
copy ci/scripts/js_test.sh => rust/ballista/rust/.dockerignore (70%)
mode change 100755 => 100644
create mode 100644 rust/ballista/rust/.gitignore
copy ci/scripts/js_test.sh => rust/ballista/rust/Cargo.toml (83%)
mode change 100755 => 100644
copy ci/scripts/js_test.sh => rust/ballista/rust/benchmarks/tpch/.dockerignore
(69%)
mode change 100755 => 100644
create mode 100644 rust/ballista/rust/benchmarks/tpch/.gitignore
copy .github/workflows/dev_pr/labeler.yml =>
rust/ballista/rust/benchmarks/tpch/Cargo.toml (53%)
create mode 100644 rust/ballista/rust/benchmarks/tpch/README.md
create mode 100644 rust/ballista/rust/benchmarks/tpch/docker-compose.yaml
copy ci/scripts/js_test.sh => rust/ballista/rust/benchmarks/tpch/entrypoint.sh
(88%)
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q1.sql
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q10.sql
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q11.sql
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q12.sql
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q13.sql
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q14.sql
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q16.sql
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q17.sql
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q18.sql
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q19.sql
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q2.sql
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q20.sql
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q21.sql
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q22.sql
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q3.sql
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q4.sql
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q5.sql
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q6.sql
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q7.sql
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q8.sql
create mode 100644 rust/ballista/rust/benchmarks/tpch/queries/q9.sql
copy js/npm-release.sh => rust/ballista/rust/benchmarks/tpch/run.sh (73%)
create mode 100644 rust/ballista/rust/benchmarks/tpch/src/main.rs
copy ci/scripts/js_test.sh => rust/ballista/rust/benchmarks/tpch/tpch-gen.sh
(64%)
copy ci/scripts/js_build.sh =>
rust/ballista/rust/benchmarks/tpch/tpchgen.dockerfile (73%)
mode change 100755 => 100644
rename dev/release/post-00-rebase.sh => rust/ballista/rust/client/Cargo.toml
(56%)
mode change 100755 => 100644
create mode 100644 rust/ballista/rust/client/README.md
create mode 100644 rust/ballista/rust/client/src/columnar_batch.rs
create mode 100644 rust/ballista/rust/client/src/context.rs
copy js/jest.coverage.config.js => rust/ballista/rust/client/src/lib.rs (73%)
copy js/jest.coverage.config.js => rust/ballista/rust/client/src/prelude.rs
(73%)
create mode 100644 rust/ballista/rust/core/Cargo.toml
create mode 100644 rust/ballista/rust/core/README.md
copy rust/{datafusion/src/optimizer/mod.rs => ballista/rust/core/build.rs}
(68%)
create mode 100644 rust/ballista/rust/core/proto/ballista.proto
create mode 100644 rust/ballista/rust/core/src/client.rs
create mode 100644 rust/ballista/rust/core/src/datasource.rs
create mode 100644 rust/ballista/rust/core/src/error.rs
copy js/jest.coverage.config.js =>
rust/ballista/rust/core/src/execution_plans/mod.rs (70%)
create mode 100644 rust/ballista/rust/core/src/execution_plans/query_stage.rs
create mode 100644
rust/ballista/rust/core/src/execution_plans/shuffle_reader.rs
create mode 100644
rust/ballista/rust/core/src/execution_plans/unresolved_shuffle.rs
copy rust/{datafusion/src/optimizer/mod.rs => ballista/rust/core/src/lib.rs}
(70%)
create mode 100644 rust/ballista/rust/core/src/memory_stream.rs
create mode 100644 rust/ballista/rust/core/src/serde/logical_plan/from_proto.rs
create mode 100644 rust/ballista/rust/core/src/serde/logical_plan/mod.rs
create mode 100644 rust/ballista/rust/core/src/serde/logical_plan/to_proto.rs
create mode 100644 rust/ballista/rust/core/src/serde/mod.rs
create mode 100644
rust/ballista/rust/core/src/serde/physical_plan/from_proto.rs
create mode 100644 rust/ballista/rust/core/src/serde/physical_plan/mod.rs
create mode 100644 rust/ballista/rust/core/src/serde/physical_plan/to_proto.rs
create mode 100644 rust/ballista/rust/core/src/serde/scheduler/from_proto.rs
create mode 100644 rust/ballista/rust/core/src/serde/scheduler/mod.rs
create mode 100644 rust/ballista/rust/core/src/serde/scheduler/to_proto.rs
create mode 100644 rust/ballista/rust/core/src/utils.rs
create mode 100644 rust/ballista/rust/executor/Cargo.toml
create mode 100644 rust/ballista/rust/executor/README.md
copy js/jest.coverage.config.js => rust/ballista/rust/executor/build.rs (73%)
copy ci/scripts/js_test.sh =>
rust/ballista/rust/executor/examples/example_executor_config.toml (73%)
mode change 100755 => 100644
create mode 100644 rust/ballista/rust/executor/executor_config_spec.toml
create mode 100644 rust/ballista/rust/executor/src/collect.rs
create mode 100644 rust/ballista/rust/executor/src/execution_loop.rs
create mode 100644 rust/ballista/rust/executor/src/flight_service.rs
copy js/src/builder/run.ts => rust/ballista/rust/executor/src/lib.rs (50%)
create mode 100644 rust/ballista/rust/executor/src/main.rs
create mode 100644 rust/ballista/rust/scheduler/Cargo.toml
create mode 100644 rust/ballista/rust/scheduler/README.md
copy js/jest.coverage.config.js => rust/ballista/rust/scheduler/build.rs (73%)
create mode 100644 rust/ballista/rust/scheduler/scheduler_config_spec.toml
create mode 100644 rust/ballista/rust/scheduler/src/api/handlers.rs
create mode 100644 rust/ballista/rust/scheduler/src/api/mod.rs
create mode 100644 rust/ballista/rust/scheduler/src/lib.rs
create mode 100644 rust/ballista/rust/scheduler/src/main.rs
create mode 100644 rust/ballista/rust/scheduler/src/planner.rs
create mode 100644 rust/ballista/rust/scheduler/src/state/etcd.rs
create mode 100644 rust/ballista/rust/scheduler/src/state/mod.rs
create mode 100644 rust/ballista/rust/scheduler/src/state/standalone.rs
create mode 100644 rust/ballista/rust/scheduler/src/test_utils.rs
create mode 100644 rust/ballista/rust/scheduler/testdata/customer/customer.tbl
create mode 100644
rust/ballista/rust/scheduler/testdata/lineitem/partition0.tbl
create mode 100644
rust/ballista/rust/scheduler/testdata/lineitem/partition1.tbl
create mode 100644 rust/ballista/rust/scheduler/testdata/nation/nation.tbl
create mode 100644 rust/ballista/rust/scheduler/testdata/orders/orders.tbl
create mode 100644 rust/ballista/rust/scheduler/testdata/part/part.tbl
create mode 100644 rust/ballista/rust/scheduler/testdata/partsupp/partsupp.tbl
create mode 100644 rust/ballista/rust/scheduler/testdata/region/region.tbl
create mode 100644 rust/ballista/rust/scheduler/testdata/supplier/supplier.tbl
create mode 100644 rust/datafusion/src/physical_optimizer/coalesce_batches.rs
create mode 100644 rust/datafusion/src/physical_optimizer/merge_exec.rs
copy rust/datafusion/src/{optimizer => physical_optimizer}/mod.rs (76%)
copy js/src/builder/run.ts =>
rust/datafusion/src/physical_optimizer/optimizer.rs (56%)
create mode 100644 rust/datafusion/src/physical_optimizer/repartition.rs
create mode 100644 rust/datafusion/src/test/exec.rs