This is an automated email from the ASF dual-hosted git repository.
github-bot pushed a commit to branch asf-site
in repository https://gitbox.apache.org/repos/asf/arrow-rs.git
The following commit(s) were added to refs/heads/asf-site by this push:
new 797d815706d deploy: ce8363af34c1c3f9a121aa0ed61e36dc99749d08
797d815706d is described below
commit 797d815706d67e6a97e57991d437c4fd0447afc0
Author: tustvold <[email protected]>
AuthorDate: Mon May 20 10:39:58 2024 +0000
deploy: ce8363af34c1c3f9a121aa0ed61e36dc99749d08
---
src/parquet/encodings/encoding/mod.rs.html | 4 ++--
src/parquet/util/bit_util.rs.html | 38 +++++++-----------------------
2 files changed, 10 insertions(+), 32 deletions(-)
diff --git a/src/parquet/encodings/encoding/mod.rs.html
b/src/parquet/encodings/encoding/mod.rs.html
index d99984ea6de..ed9abb16878 100644
--- a/src/parquet/encodings/encoding/mod.rs.html
+++ b/src/parquet/encodings/encoding/mod.rs.html
@@ -1393,7 +1393,7 @@
// DELTA_BINARY_PACKED encoding
</span><span class="kw">const </span>MAX_PAGE_HEADER_WRITER_SIZE: usize =
<span class="number">32</span>;
-<span class="kw">const </span>MAX_BIT_WRITER_SIZE: usize = <span
class="number">10 </span>* <span class="number">1024 </span>* <span
class="number">1024</span>;
+<span class="kw">const </span>DEFAULT_BIT_WRITER_SIZE: usize = <span
class="number">1024 </span>* <span class="number">1024</span>;
<span class="kw">const </span>DEFAULT_NUM_MINI_BLOCKS: usize = <span
class="number">4</span>;
<span class="doccomment">/// Delta bit packed encoder.
@@ -1457,7 +1457,7 @@
DeltaBitPackEncoder {
page_header_writer: BitWriter::new(MAX_PAGE_HEADER_WRITER_SIZE),
- bit_writer: BitWriter::new(MAX_BIT_WRITER_SIZE),
+ bit_writer: BitWriter::new(DEFAULT_BIT_WRITER_SIZE),
total_values: <span class="number">0</span>,
first_value: <span class="number">0</span>,
current_value: <span class="number">0</span>, <span
class="comment">// current value to keep adding deltas
diff --git a/src/parquet/util/bit_util.rs.html
b/src/parquet/util/bit_util.rs.html
index 2de5373fa6c..f6a4e7494df 100644
--- a/src/parquet/util/bit_util.rs.html
+++ b/src/parquet/util/bit_util.rs.html
@@ -1128,17 +1128,6 @@
<a href="#1128" id="1128">1128</a>
<a href="#1129" id="1129">1129</a>
<a href="#1130" id="1130">1130</a>
-<a href="#1131" id="1131">1131</a>
-<a href="#1132" id="1132">1132</a>
-<a href="#1133" id="1133">1133</a>
-<a href="#1134" id="1134">1134</a>
-<a href="#1135" id="1135">1135</a>
-<a href="#1136" id="1136">1136</a>
-<a href="#1137" id="1137">1137</a>
-<a href="#1138" id="1138">1138</a>
-<a href="#1139" id="1139">1139</a>
-<a href="#1140" id="1140">1140</a>
-<a href="#1141" id="1141">1141</a>
</pre></div><pre class="rust"><code><span class="comment">// Licensed to the
Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
@@ -1313,9 +1302,9 @@
}
<span class="kw">impl </span>BitWriter {
- <span class="kw">pub fn </span>new(max_bytes: usize) -> <span
class="self">Self </span>{
+ <span class="kw">pub fn </span>new(initial_capacity: usize) -> <span
class="self">Self </span>{
<span class="self">Self </span>{
- buffer: Vec::with_capacity(max_bytes),
+ buffer: Vec::with_capacity(initial_capacity),
buffered_values: <span class="number">0</span>,
bit_offset: <span class="number">0</span>,
}
@@ -1445,12 +1434,7 @@
/// `offset + num_bytes`. Also that if size of `T` is larger than
`num_bytes`, extra
/// higher ordered bytes will be ignored.
</span><span class="attr">#[inline]
- </span><span class="kw">pub fn </span>put_aligned_offset<T: AsBytes>(
- <span class="kw-2">&mut </span><span class="self">self</span>,
- val: T,
- num_bytes: usize,
- offset: usize,
- ) {
+ </span><span class="kw">pub fn </span>put_aligned_offset<T:
AsBytes>(<span class="kw-2">&mut </span><span class="self">self</span>,
val: T, num_bytes: usize, offset: usize) {
<span class="kw">let </span>slice = val.as_bytes();
<span class="kw">let </span>len = num_bytes.min(slice.len());
<span class="self">self</span>.buffer[offset..offset +
len].copy_from_slice(<span class="kw-2">&</span>slice[..len])
@@ -1546,8 +1530,8 @@
<span class="self">self</span>.load_buffered_values()
}
- <span class="kw">let </span><span class="kw-2">mut </span>v =
trailing_bits(<span class="self">self</span>.buffered_values, <span
class="self">self</span>.bit_offset + num_bits)
- >> <span class="self">self</span>.bit_offset;
+ <span class="kw">let </span><span class="kw-2">mut </span>v =
+ trailing_bits(<span class="self">self</span>.buffered_values,
<span class="self">self</span>.bit_offset + num_bits) >> <span
class="self">self</span>.bit_offset;
<span class="self">self</span>.bit_offset += num_bits;
<span class="kw">if </span><span class="self">self</span>.bit_offset
>= <span class="number">64 </span>{
@@ -1712,8 +1696,7 @@
<span class="bool-val">false </span>=> num_values,
};
- <span class="kw">let </span>end_bit_offset =
- <span class="self">self</span>.byte_offset * <span
class="number">8 </span>+ values_to_read * num_bits + <span
class="self">self</span>.bit_offset;
+ <span class="kw">let </span>end_bit_offset = <span
class="self">self</span>.byte_offset * <span class="number">8 </span>+
values_to_read * num_bits + <span class="self">self</span>.bit_offset;
<span class="self">self</span>.byte_offset = end_bit_offset / <span
class="number">8</span>;
<span class="self">self</span>.bit_offset = end_bit_offset % <span
class="number">8</span>;
@@ -1726,11 +1709,7 @@
}
<span class="doccomment">/// Reads up to `num_bytes` to `buf` returning
the number of bytes read
- </span><span class="kw">pub</span>(<span class="kw">crate</span>) <span
class="kw">fn </span>get_aligned_bytes(
- <span class="kw-2">&mut </span><span class="self">self</span>,
- buf: <span class="kw-2">&mut </span>Vec<u8>,
- num_bytes: usize,
- ) -> usize {
+ </span><span class="kw">pub</span>(<span class="kw">crate</span>) <span
class="kw">fn </span>get_aligned_bytes(<span class="kw-2">&mut </span><span
class="self">self</span>, buf: <span class="kw-2">&mut
</span>Vec<u8>, num_bytes: usize) -> usize {
<span class="comment">// Align to byte offset
</span><span class="self">self</span>.byte_offset = <span
class="self">self</span>.get_byte_offset();
<span class="self">self</span>.bit_offset = <span
class="number">0</span>;
@@ -2139,8 +2118,7 @@
.collect();
<span class="comment">// Generic values used to check against actual
values read from `get_batch`.
- </span><span class="kw">let </span>expected_values: Vec<T> =
- values.iter().map(|v| from_le_slice(v.as_bytes())).collect();
+ </span><span class="kw">let </span>expected_values: Vec<T> =
values.iter().map(|v| from_le_slice(v.as_bytes())).collect();
(<span class="number">0</span>..total).for_each(|i|
writer.put_value(values[i], num_bits));