This is an automated email from the ASF dual-hosted git repository.
github-bot pushed a commit to branch gh-pages
in repository https://gitbox.apache.org/repos/asf/iceberg-rust.git
The following commit(s) were added to refs/heads/gh-pages by this push:
new aeef732f deploy: fd089164bff19fdd4b0d297363fc7808b6f6ea18
aeef732f is described below
commit aeef732fc5789895e230cde822ff54c97ddb0ca4
Author: liurenjie1024 <[email protected]>
AuthorDate: Wed Nov 5 01:45:04 2025 +0000
deploy: fd089164bff19fdd4b0d297363fc7808b6f6ea18
---
.../arrow/caching_delete_file_loader.rs.html | 115 +++-
api/src/iceberg/arrow/delete_filter.rs.html | 602 +++++++++++----------
2 files changed, 416 insertions(+), 301 deletions(-)
diff --git a/api/src/iceberg/arrow/caching_delete_file_loader.rs.html
b/api/src/iceberg/arrow/caching_delete_file_loader.rs.html
index 2fea5f78..17b82561 100644
--- a/api/src/iceberg/arrow/caching_delete_file_loader.rs.html
+++ b/api/src/iceberg/arrow/caching_delete_file_loader.rs.html
@@ -788,4 +788,117 @@
<a href=#788 id=788 data-nosnippet>788</a> <span
class="macro">assert_eq!</span>(data_col.value(<span class="number">1</span>),
<span class="string">"d"</span>);
<a href=#789 id=789 data-nosnippet>789</a> <span
class="macro">assert_eq!</span>(data_col.value(<span class="number">2</span>),
<span class="string">"g"</span>);
<a href=#790 id=790 data-nosnippet>790</a> }
-<a href=#791 id=791
data-nosnippet>791</a>}</code></pre></div></section></main></body></html>
\ No newline at end of file
+<a href=#791 id=791 data-nosnippet>791</a>
+<a href=#792 id=792 data-nosnippet>792</a> <span class="doccomment">///
Test loading a FileScanTask with BOTH positional and equality deletes.
+<a href=#793 id=793 data-nosnippet>793</a> /// Verifies the fix for the
inverted condition that caused "Missing predicate for equality delete file"
errors.
+<a href=#794 id=794 data-nosnippet>794</a> </span><span
class="attr">#[tokio::test]
+<a href=#795 id=795 data-nosnippet>795</a> </span><span class="kw">async fn
</span>test_load_deletes_with_mixed_types() {
+<a href=#796 id=796 data-nosnippet>796</a> <span class="kw">use
</span><span class="kw">crate</span>::scan::FileScanTask;
+<a href=#797 id=797 data-nosnippet>797</a> <span class="kw">use
</span><span class="kw">crate</span>::spec::{DataFileFormat, Schema};
+<a href=#798 id=798 data-nosnippet>798</a>
+<a href=#799 id=799 data-nosnippet>799</a> <span class="kw">let
</span>tmp_dir = TempDir::new().unwrap();
+<a href=#800 id=800 data-nosnippet>800</a> <span class="kw">let
</span>table_location = tmp_dir.path();
+<a href=#801 id=801 data-nosnippet>801</a> <span class="kw">let
</span>file_io = FileIO::from_path(table_location.as_os_str().to_str().unwrap())
+<a href=#802 id=802 data-nosnippet>802</a> .unwrap()
+<a href=#803 id=803 data-nosnippet>803</a> .build()
+<a href=#804 id=804 data-nosnippet>804</a> .unwrap();
+<a href=#805 id=805 data-nosnippet>805</a>
+<a href=#806 id=806 data-nosnippet>806</a> <span class="comment">//
Create the data file schema
+<a href=#807 id=807 data-nosnippet>807</a> </span><span class="kw">let
</span>data_file_schema = Arc::new(
+<a href=#808 id=808 data-nosnippet>808</a> Schema::builder()
+<a href=#809 id=809 data-nosnippet>809</a> .with_fields(<span
class="macro">vec!</span>[
+<a href=#810 id=810 data-nosnippet>810</a> <span
class="kw">crate</span>::spec::NestedField::optional(
+<a href=#811 id=811 data-nosnippet>811</a> <span
class="number">2</span>,
+<a href=#812 id=812 data-nosnippet>812</a> <span
class="string">"y"</span>,
+<a href=#813 id=813 data-nosnippet>813</a> <span
class="kw">crate</span>::spec::Type::Primitive(<span
class="kw">crate</span>::spec::PrimitiveType::Long),
+<a href=#814 id=814 data-nosnippet>814</a> )
+<a href=#815 id=815 data-nosnippet>815</a> .into(),
+<a href=#816 id=816 data-nosnippet>816</a> <span
class="kw">crate</span>::spec::NestedField::optional(
+<a href=#817 id=817 data-nosnippet>817</a> <span
class="number">3</span>,
+<a href=#818 id=818 data-nosnippet>818</a> <span
class="string">"z"</span>,
+<a href=#819 id=819 data-nosnippet>819</a> <span
class="kw">crate</span>::spec::Type::Primitive(<span
class="kw">crate</span>::spec::PrimitiveType::Long),
+<a href=#820 id=820 data-nosnippet>820</a> )
+<a href=#821 id=821 data-nosnippet>821</a> .into(),
+<a href=#822 id=822 data-nosnippet>822</a> ])
+<a href=#823 id=823 data-nosnippet>823</a> .build()
+<a href=#824 id=824 data-nosnippet>824</a> .unwrap(),
+<a href=#825 id=825 data-nosnippet>825</a> );
+<a href=#826 id=826 data-nosnippet>826</a>
+<a href=#827 id=827 data-nosnippet>827</a> <span class="comment">//
Write positional delete file
+<a href=#828 id=828 data-nosnippet>828</a> </span><span class="kw">let
</span>positional_delete_schema = <span
class="kw">crate</span>::arrow::delete_filter::tests::create_pos_del_schema();
+<a href=#829 id=829 data-nosnippet>829</a> <span class="kw">let
</span>file_path_values =
+<a href=#830 id=830 data-nosnippet>830</a> <span
class="macro">vec!</span>[<span class="macro">format!</span>(<span
class="string">"{}/data-1.parquet"</span>, table_location.to_str().unwrap());
<span class="number">4</span>];
+<a href=#831 id=831 data-nosnippet>831</a> <span class="kw">let
</span>file_path_col = Arc::new(StringArray::from_iter_values(<span
class="kw-2">&</span>file_path_values));
+<a href=#832 id=832 data-nosnippet>832</a> <span class="kw">let
</span>pos_col = Arc::new(Int64Array::from_iter_values(<span
class="macro">vec!</span>[<span class="number">0i64</span>, <span
class="number">1</span>, <span class="number">2</span>, <span
class="number">3</span>]));
+<a href=#833 id=833 data-nosnippet>833</a>
+<a href=#834 id=834 data-nosnippet>834</a> <span class="kw">let
</span>positional_deletes_to_write =
+<a href=#835 id=835 data-nosnippet>835</a>
RecordBatch::try_new(positional_delete_schema.clone(), <span
class="macro">vec!</span>[
+<a href=#836 id=836 data-nosnippet>836</a> file_path_col,
+<a href=#837 id=837 data-nosnippet>837</a> pos_col,
+<a href=#838 id=838 data-nosnippet>838</a> ])
+<a href=#839 id=839 data-nosnippet>839</a> .unwrap();
+<a href=#840 id=840 data-nosnippet>840</a>
+<a href=#841 id=841 data-nosnippet>841</a> <span class="kw">let
</span>props = WriterProperties::builder()
+<a href=#842 id=842 data-nosnippet>842</a>
.set_compression(Compression::SNAPPY)
+<a href=#843 id=843 data-nosnippet>843</a> .build();
+<a href=#844 id=844 data-nosnippet>844</a>
+<a href=#845 id=845 data-nosnippet>845</a> <span class="kw">let
</span>pos_del_path = <span class="macro">format!</span>(<span
class="string">"{}/pos-del-mixed.parquet"</span>,
table_location.to_str().unwrap());
+<a href=#846 id=846 data-nosnippet>846</a> <span class="kw">let
</span>file = File::create(<span
class="kw-2">&</span>pos_del_path).unwrap();
+<a href=#847 id=847 data-nosnippet>847</a> <span class="kw">let
</span><span class="kw-2">mut </span>writer = ArrowWriter::try_new(
+<a href=#848 id=848 data-nosnippet>848</a> file,
+<a href=#849 id=849 data-nosnippet>849</a>
positional_deletes_to_write.schema(),
+<a href=#850 id=850 data-nosnippet>850</a> <span
class="prelude-val">Some</span>(props.clone()),
+<a href=#851 id=851 data-nosnippet>851</a> )
+<a href=#852 id=852 data-nosnippet>852</a> .unwrap();
+<a href=#853 id=853 data-nosnippet>853</a> writer.write(<span
class="kw-2">&</span>positional_deletes_to_write).unwrap();
+<a href=#854 id=854 data-nosnippet>854</a> writer.close().unwrap();
+<a href=#855 id=855 data-nosnippet>855</a>
+<a href=#856 id=856 data-nosnippet>856</a> <span class="comment">//
Write equality delete file
+<a href=#857 id=857 data-nosnippet>857</a> </span><span class="kw">let
</span>eq_delete_path =
setup_write_equality_delete_file_1(table_location.to_str().unwrap());
+<a href=#858 id=858 data-nosnippet>858</a>
+<a href=#859 id=859 data-nosnippet>859</a> <span class="comment">//
Create FileScanTask with BOTH positional and equality deletes
+<a href=#860 id=860 data-nosnippet>860</a> </span><span class="kw">let
</span>pos_del = FileScanTaskDeleteFile {
+<a href=#861 id=861 data-nosnippet>861</a> file_path: pos_del_path,
+<a href=#862 id=862 data-nosnippet>862</a> file_type:
DataContentType::PositionDeletes,
+<a href=#863 id=863 data-nosnippet>863</a> partition_spec_id: <span
class="number">0</span>,
+<a href=#864 id=864 data-nosnippet>864</a> equality_ids: <span
class="prelude-val">None</span>,
+<a href=#865 id=865 data-nosnippet>865</a> };
+<a href=#866 id=866 data-nosnippet>866</a>
+<a href=#867 id=867 data-nosnippet>867</a> <span class="kw">let
</span>eq_del = FileScanTaskDeleteFile {
+<a href=#868 id=868 data-nosnippet>868</a> file_path:
eq_delete_path.clone(),
+<a href=#869 id=869 data-nosnippet>869</a> file_type:
DataContentType::EqualityDeletes,
+<a href=#870 id=870 data-nosnippet>870</a> partition_spec_id: <span
class="number">0</span>,
+<a href=#871 id=871 data-nosnippet>871</a> equality_ids: <span
class="prelude-val">Some</span>(<span class="macro">vec!</span>[<span
class="number">2</span>, <span class="number">3</span>]), <span
class="comment">// Only use field IDs that exist in both schemas
+<a href=#872 id=872 data-nosnippet>872</a> </span>};
+<a href=#873 id=873 data-nosnippet>873</a>
+<a href=#874 id=874 data-nosnippet>874</a> <span class="kw">let
</span>file_scan_task = FileScanTask {
+<a href=#875 id=875 data-nosnippet>875</a> start: <span
class="number">0</span>,
+<a href=#876 id=876 data-nosnippet>876</a> length: <span
class="number">0</span>,
+<a href=#877 id=877 data-nosnippet>877</a> record_count: <span
class="prelude-val">None</span>,
+<a href=#878 id=878 data-nosnippet>878</a> data_file_path: <span
class="macro">format!</span>(<span class="string">"{}/data-1.parquet"</span>,
table_location.to_str().unwrap()),
+<a href=#879 id=879 data-nosnippet>879</a> data_file_format:
DataFileFormat::Parquet,
+<a href=#880 id=880 data-nosnippet>880</a> schema:
data_file_schema.clone(),
+<a href=#881 id=881 data-nosnippet>881</a> project_field_ids: <span
class="macro">vec!</span>[<span class="number">2</span>, <span
class="number">3</span>],
+<a href=#882 id=882 data-nosnippet>882</a> predicate: <span
class="prelude-val">None</span>,
+<a href=#883 id=883 data-nosnippet>883</a> deletes: <span
class="macro">vec!</span>[pos_del, eq_del],
+<a href=#884 id=884 data-nosnippet>884</a> };
+<a href=#885 id=885 data-nosnippet>885</a>
+<a href=#886 id=886 data-nosnippet>886</a> <span class="comment">//
Load the deletes - should handle both types without error
+<a href=#887 id=887 data-nosnippet>887</a> </span><span class="kw">let
</span>delete_file_loader = CachingDeleteFileLoader::new(file_io.clone(), <span
class="number">10</span>);
+<a href=#888 id=888 data-nosnippet>888</a> <span class="kw">let
</span>delete_filter = delete_file_loader
+<a href=#889 id=889 data-nosnippet>889</a> .load_deletes(<span
class="kw-2">&</span>file_scan_task.deletes, file_scan_task.schema_ref())
+<a href=#890 id=890 data-nosnippet>890</a> .<span class="kw">await
+<a href=#891 id=891 data-nosnippet>891</a> </span>.unwrap()
+<a href=#892 id=892 data-nosnippet>892</a> .unwrap();
+<a href=#893 id=893 data-nosnippet>893</a>
+<a href=#894 id=894 data-nosnippet>894</a> <span class="comment">//
Verify both delete types can be processed together
+<a href=#895 id=895 data-nosnippet>895</a> </span><span class="kw">let
</span>result = delete_filter
+<a href=#896 id=896 data-nosnippet>896</a>
.build_equality_delete_predicate(<span class="kw-2">&</span>file_scan_task)
+<a href=#897 id=897 data-nosnippet>897</a> .<span
class="kw">await</span>;
+<a href=#898 id=898 data-nosnippet>898</a> <span
class="macro">assert!</span>(
+<a href=#899 id=899 data-nosnippet>899</a> result.is_ok(),
+<a href=#900 id=900 data-nosnippet>900</a> <span
class="string">"Failed to build equality delete predicate: {:?}"</span>,
+<a href=#901 id=901 data-nosnippet>901</a> result.err()
+<a href=#902 id=902 data-nosnippet>902</a> );
+<a href=#903 id=903 data-nosnippet>903</a> }
+<a href=#904 id=904
data-nosnippet>904</a>}</code></pre></div></section></main></body></html>
\ No newline at end of file
diff --git a/api/src/iceberg/arrow/delete_filter.rs.html
b/api/src/iceberg/arrow/delete_filter.rs.html
index b1a98e70..52414c23 100644
--- a/api/src/iceberg/arrow/delete_filter.rs.html
+++ b/api/src/iceberg/arrow/delete_filter.rs.html
@@ -68,308 +68,310 @@
<a href=#68 id=68 data-nosnippet>68</a> <span class="kw">pub</span>(<span
class="kw">crate</span>) <span class="kw">fn </span>try_start_eq_del_load(<span
class="kw-2">&</span><span class="self">self</span>, file_path: <span
class="kw-2">&</span>str) -> <span
class="prelude-ty">Option</span><Arc<Notify>> {
<a href=#69 id=69 data-nosnippet>69</a> <span class="kw">let
</span><span class="kw-2">mut </span>state = <span
class="self">self</span>.state.write().unwrap();
<a href=#70 id=70 data-nosnippet>70</a>
-<a href=#71 id=71 data-nosnippet>71</a> <span class="kw">if
</span>!state.equality_deletes.contains_key(file_path) {
-<a href=#72 id=72 data-nosnippet>72</a> <span class="kw">return
</span><span class="prelude-val">None</span>;
-<a href=#73 id=73 data-nosnippet>73</a> }
-<a href=#74 id=74 data-nosnippet>74</a>
-<a href=#75 id=75 data-nosnippet>75</a> <span class="kw">let
</span>notifier = Arc::new(Notify::new());
-<a href=#76 id=76 data-nosnippet>76</a> state
-<a href=#77 id=77 data-nosnippet>77</a> .equality_deletes
-<a href=#78 id=78 data-nosnippet>78</a>
.insert(file_path.to_string(), EqDelState::Loading(notifier.clone()));
-<a href=#79 id=79 data-nosnippet>79</a>
-<a href=#80 id=80 data-nosnippet>80</a> <span
class="prelude-val">Some</span>(notifier)
-<a href=#81 id=81 data-nosnippet>81</a> }
-<a href=#82 id=82 data-nosnippet>82</a>
-<a href=#83 id=83 data-nosnippet>83</a> <span class="doccomment">///
Retrieve the equality delete predicate for a given eq delete file path
-<a href=#84 id=84 data-nosnippet>84</a> </span><span
class="kw">pub</span>(<span class="kw">crate</span>) <span class="kw">async fn
</span>get_equality_delete_predicate_for_delete_file_path(
-<a href=#85 id=85 data-nosnippet>85</a> <span
class="kw-2">&</span><span class="self">self</span>,
-<a href=#86 id=86 data-nosnippet>86</a> file_path: <span
class="kw-2">&</span>str,
-<a href=#87 id=87 data-nosnippet>87</a> ) -> <span
class="prelude-ty">Option</span><Predicate> {
-<a href=#88 id=88 data-nosnippet>88</a> <span class="kw">let
</span>notifier = {
-<a href=#89 id=89 data-nosnippet>89</a> <span class="kw">match
</span><span
class="self">self</span>.state.read().unwrap().equality_deletes.get(file_path) {
-<a href=#90 id=90 data-nosnippet>90</a> <span
class="prelude-val">None </span>=> <span class="kw">return </span><span
class="prelude-val">None</span>,
-<a href=#91 id=91 data-nosnippet>91</a> <span
class="prelude-val">Some</span>(EqDelState::Loading(notifier)) =>
notifier.clone(),
-<a href=#92 id=92 data-nosnippet>92</a> <span
class="prelude-val">Some</span>(EqDelState::Loaded(predicate)) => {
-<a href=#93 id=93 data-nosnippet>93</a> <span
class="kw">return </span><span
class="prelude-val">Some</span>(predicate.clone());
-<a href=#94 id=94 data-nosnippet>94</a> }
-<a href=#95 id=95 data-nosnippet>95</a> }
-<a href=#96 id=96 data-nosnippet>96</a> };
-<a href=#97 id=97 data-nosnippet>97</a>
-<a href=#98 id=98 data-nosnippet>98</a> notifier.notified().<span
class="kw">await</span>;
+<a href=#71 id=71 data-nosnippet>71</a> <span class="comment">// Skip
if already loaded/loading - another task owns it
+<a href=#72 id=72 data-nosnippet>72</a> </span><span class="kw">if
</span>state.equality_deletes.contains_key(file_path) {
+<a href=#73 id=73 data-nosnippet>73</a> <span class="kw">return
</span><span class="prelude-val">None</span>;
+<a href=#74 id=74 data-nosnippet>74</a> }
+<a href=#75 id=75 data-nosnippet>75</a>
+<a href=#76 id=76 data-nosnippet>76</a> <span class="comment">// Mark
as loading to prevent duplicate work
+<a href=#77 id=77 data-nosnippet>77</a> </span><span class="kw">let
</span>notifier = Arc::new(Notify::new());
+<a href=#78 id=78 data-nosnippet>78</a> state
+<a href=#79 id=79 data-nosnippet>79</a> .equality_deletes
+<a href=#80 id=80 data-nosnippet>80</a>
.insert(file_path.to_string(), EqDelState::Loading(notifier.clone()));
+<a href=#81 id=81 data-nosnippet>81</a>
+<a href=#82 id=82 data-nosnippet>82</a> <span
class="prelude-val">Some</span>(notifier)
+<a href=#83 id=83 data-nosnippet>83</a> }
+<a href=#84 id=84 data-nosnippet>84</a>
+<a href=#85 id=85 data-nosnippet>85</a> <span class="doccomment">///
Retrieve the equality delete predicate for a given eq delete file path
+<a href=#86 id=86 data-nosnippet>86</a> </span><span
class="kw">pub</span>(<span class="kw">crate</span>) <span class="kw">async fn
</span>get_equality_delete_predicate_for_delete_file_path(
+<a href=#87 id=87 data-nosnippet>87</a> <span
class="kw-2">&</span><span class="self">self</span>,
+<a href=#88 id=88 data-nosnippet>88</a> file_path: <span
class="kw-2">&</span>str,
+<a href=#89 id=89 data-nosnippet>89</a> ) -> <span
class="prelude-ty">Option</span><Predicate> {
+<a href=#90 id=90 data-nosnippet>90</a> <span class="kw">let
</span>notifier = {
+<a href=#91 id=91 data-nosnippet>91</a> <span class="kw">match
</span><span
class="self">self</span>.state.read().unwrap().equality_deletes.get(file_path) {
+<a href=#92 id=92 data-nosnippet>92</a> <span
class="prelude-val">None </span>=> <span class="kw">return </span><span
class="prelude-val">None</span>,
+<a href=#93 id=93 data-nosnippet>93</a> <span
class="prelude-val">Some</span>(EqDelState::Loading(notifier)) =>
notifier.clone(),
+<a href=#94 id=94 data-nosnippet>94</a> <span
class="prelude-val">Some</span>(EqDelState::Loaded(predicate)) => {
+<a href=#95 id=95 data-nosnippet>95</a> <span
class="kw">return </span><span
class="prelude-val">Some</span>(predicate.clone());
+<a href=#96 id=96 data-nosnippet>96</a> }
+<a href=#97 id=97 data-nosnippet>97</a> }
+<a href=#98 id=98 data-nosnippet>98</a> };
<a href=#99 id=99 data-nosnippet>99</a>
-<a href=#100 id=100 data-nosnippet>100</a> <span class="kw">match
</span><span
class="self">self</span>.state.read().unwrap().equality_deletes.get(file_path) {
-<a href=#101 id=101 data-nosnippet>101</a> <span
class="prelude-val">Some</span>(EqDelState::Loaded(predicate)) => <span
class="prelude-val">Some</span>(predicate.clone()),
-<a href=#102 id=102 data-nosnippet>102</a> <span class="kw">_
</span>=> <span class="macro">unreachable!</span>(<span
class="string">"Cannot be any other state than loaded"</span>),
-<a href=#103 id=103 data-nosnippet>103</a> }
-<a href=#104 id=104 data-nosnippet>104</a> }
-<a href=#105 id=105 data-nosnippet>105</a>
-<a href=#106 id=106 data-nosnippet>106</a> <span class="doccomment">///
Builds eq delete predicate for the provided task.
-<a href=#107 id=107 data-nosnippet>107</a> </span><span
class="kw">pub</span>(<span class="kw">crate</span>) <span class="kw">async fn
</span>build_equality_delete_predicate(
-<a href=#108 id=108 data-nosnippet>108</a> <span
class="kw-2">&</span><span class="self">self</span>,
-<a href=#109 id=109 data-nosnippet>109</a> file_scan_task: <span
class="kw-2">&</span>FileScanTask,
-<a href=#110 id=110 data-nosnippet>110</a> ) -> <span
class="prelude-ty">Result</span><<span
class="prelude-ty">Option</span><BoundPredicate>> {
-<a href=#111 id=111 data-nosnippet>111</a> <span class="comment">// *
Filter the task's deletes into just the Equality deletes
-<a href=#112 id=112 data-nosnippet>112</a> // * Retrieve the unbound
predicate for each from self.state.equality_deletes
-<a href=#113 id=113 data-nosnippet>113</a> // * Logical-AND them all
together to get a single combined `Predicate`
-<a href=#114 id=114 data-nosnippet>114</a> // * Bind the predicate to
the task's schema to get a `BoundPredicate`
-<a href=#115 id=115 data-nosnippet>115</a>
-<a href=#116 id=116 data-nosnippet>116</a> </span><span class="kw">let
</span><span class="kw-2">mut </span>combined_predicate = AlwaysTrue;
-<a href=#117 id=117 data-nosnippet>117</a> <span class="kw">for
</span>delete <span class="kw">in </span><span
class="kw-2">&</span>file_scan_task.deletes {
-<a href=#118 id=118 data-nosnippet>118</a> <span class="kw">if
</span>!is_equality_delete(delete) {
-<a href=#119 id=119 data-nosnippet>119</a> <span
class="kw">continue</span>;
-<a href=#120 id=120 data-nosnippet>120</a> }
-<a href=#121 id=121 data-nosnippet>121</a>
-<a href=#122 id=122 data-nosnippet>122</a> <span class="kw">let
</span><span class="prelude-val">Some</span>(predicate) = <span
class="self">self
-<a href=#123 id=123 data-nosnippet>123</a>
</span>.get_equality_delete_predicate_for_delete_file_path(<span
class="kw-2">&</span>delete.file_path)
-<a href=#124 id=124 data-nosnippet>124</a> .<span
class="kw">await
-<a href=#125 id=125 data-nosnippet>125</a> else </span>{
-<a href=#126 id=126 data-nosnippet>126</a> <span
class="kw">return </span><span class="prelude-val">Err</span>(Error::new(
-<a href=#127 id=127 data-nosnippet>127</a>
ErrorKind::Unexpected,
-<a href=#128 id=128 data-nosnippet>128</a> <span
class="macro">format!</span>(
-<a href=#129 id=129 data-nosnippet>129</a> <span
class="string">"Missing predicate for equality delete file '{}'"</span>,
-<a href=#130 id=130 data-nosnippet>130</a>
delete.file_path
-<a href=#131 id=131 data-nosnippet>131</a> ),
-<a href=#132 id=132 data-nosnippet>132</a> ));
-<a href=#133 id=133 data-nosnippet>133</a> };
-<a href=#134 id=134 data-nosnippet>134</a>
-<a href=#135 id=135 data-nosnippet>135</a> combined_predicate =
combined_predicate.and(predicate);
-<a href=#136 id=136 data-nosnippet>136</a> }
-<a href=#137 id=137 data-nosnippet>137</a>
-<a href=#138 id=138 data-nosnippet>138</a> <span class="kw">if
</span>combined_predicate == AlwaysTrue {
-<a href=#139 id=139 data-nosnippet>139</a> <span class="kw">return
</span><span class="prelude-val">Ok</span>(<span
class="prelude-val">None</span>);
-<a href=#140 id=140 data-nosnippet>140</a> }
-<a href=#141 id=141 data-nosnippet>141</a>
-<a href=#142 id=142 data-nosnippet>142</a> <span class="comment">//
TODO: handle case-insensitive case
-<a href=#143 id=143 data-nosnippet>143</a> </span><span class="kw">let
</span>bound_predicate = combined_predicate.bind(file_scan_task.schema.clone(),
<span class="bool-val">false</span>)<span class="question-mark">?</span>;
-<a href=#144 id=144 data-nosnippet>144</a> <span
class="prelude-val">Ok</span>(<span
class="prelude-val">Some</span>(bound_predicate))
-<a href=#145 id=145 data-nosnippet>145</a> }
-<a href=#146 id=146 data-nosnippet>146</a>
-<a href=#147 id=147 data-nosnippet>147</a> <span
class="kw">pub</span>(<span class="kw">crate</span>) <span class="kw">fn
</span>upsert_delete_vector(
-<a href=#148 id=148 data-nosnippet>148</a> <span class="kw-2">&mut
</span><span class="self">self</span>,
-<a href=#149 id=149 data-nosnippet>149</a> data_file_path: String,
-<a href=#150 id=150 data-nosnippet>150</a> delete_vector: DeleteVector,
-<a href=#151 id=151 data-nosnippet>151</a> ) {
-<a href=#152 id=152 data-nosnippet>152</a> <span class="kw">let
</span><span class="kw-2">mut </span>state = <span
class="self">self</span>.state.write().unwrap();
-<a href=#153 id=153 data-nosnippet>153</a>
-<a href=#154 id=154 data-nosnippet>154</a> <span class="kw">let
</span><span class="prelude-val">Some</span>(entry) =
state.delete_vectors.get_mut(<span class="kw-2">&</span>data_file_path)
<span class="kw">else </span>{
-<a href=#155 id=155 data-nosnippet>155</a> state
-<a href=#156 id=156 data-nosnippet>156</a> .delete_vectors
-<a href=#157 id=157 data-nosnippet>157</a>
.insert(data_file_path, Arc::new(Mutex::new(delete_vector)));
-<a href=#158 id=158 data-nosnippet>158</a> <span
class="kw">return</span>;
-<a href=#159 id=159 data-nosnippet>159</a> };
-<a href=#160 id=160 data-nosnippet>160</a>
-<a href=#161 id=161 data-nosnippet>161</a> <span
class="kw-2">*</span>entry.lock().unwrap() |= delete_vector;
-<a href=#162 id=162 data-nosnippet>162</a> }
-<a href=#163 id=163 data-nosnippet>163</a>
-<a href=#164 id=164 data-nosnippet>164</a> <span
class="kw">pub</span>(<span class="kw">crate</span>) <span class="kw">fn
</span>insert_equality_delete(
-<a href=#165 id=165 data-nosnippet>165</a> <span
class="kw-2">&</span><span class="self">self</span>,
-<a href=#166 id=166 data-nosnippet>166</a> delete_file_path: <span
class="kw-2">&</span>str,
-<a href=#167 id=167 data-nosnippet>167</a> eq_del:
Receiver<Predicate>,
-<a href=#168 id=168 data-nosnippet>168</a> ) {
-<a href=#169 id=169 data-nosnippet>169</a> <span class="kw">let
</span>notify = Arc::new(Notify::new());
-<a href=#170 id=170 data-nosnippet>170</a> {
-<a href=#171 id=171 data-nosnippet>171</a> <span class="kw">let
</span><span class="kw-2">mut </span>state = <span
class="self">self</span>.state.write().unwrap();
-<a href=#172 id=172 data-nosnippet>172</a>
state.equality_deletes.insert(
-<a href=#173 id=173 data-nosnippet>173</a>
delete_file_path.to_string(),
-<a href=#174 id=174 data-nosnippet>174</a>
EqDelState::Loading(notify.clone()),
-<a href=#175 id=175 data-nosnippet>175</a> );
-<a href=#176 id=176 data-nosnippet>176</a> }
-<a href=#177 id=177 data-nosnippet>177</a>
-<a href=#178 id=178 data-nosnippet>178</a> <span class="kw">let
</span>state = <span class="self">self</span>.state.clone();
-<a href=#179 id=179 data-nosnippet>179</a> <span class="kw">let
</span>delete_file_path = delete_file_path.to_string();
-<a href=#180 id=180 data-nosnippet>180</a> <span
class="kw">crate</span>::runtime::spawn(<span class="kw">async move </span>{
-<a href=#181 id=181 data-nosnippet>181</a> <span class="kw">let
</span>eq_del = eq_del.<span class="kw">await</span>.unwrap();
-<a href=#182 id=182 data-nosnippet>182</a> {
-<a href=#183 id=183 data-nosnippet>183</a> <span class="kw">let
</span><span class="kw-2">mut </span>state = state.write().unwrap();
-<a href=#184 id=184 data-nosnippet>184</a> state
-<a href=#185 id=185 data-nosnippet>185</a> .equality_deletes
-<a href=#186 id=186 data-nosnippet>186</a>
.insert(delete_file_path, EqDelState::Loaded(eq_del));
-<a href=#187 id=187 data-nosnippet>187</a> }
-<a href=#188 id=188 data-nosnippet>188</a> notify.notify_waiters();
-<a href=#189 id=189 data-nosnippet>189</a> });
-<a href=#190 id=190 data-nosnippet>190</a> }
-<a href=#191 id=191 data-nosnippet>191</a>}
-<a href=#192 id=192 data-nosnippet>192</a>
-<a href=#193 id=193 data-nosnippet>193</a><span class="kw">pub</span>(<span
class="kw">crate</span>) <span class="kw">fn </span>is_equality_delete(f: <span
class="kw-2">&</span>FileScanTaskDeleteFile) -> bool {
-<a href=#194 id=194 data-nosnippet>194</a> <span
class="macro">matches!</span>(f.file_type, DataContentType::EqualityDeletes)
-<a href=#195 id=195 data-nosnippet>195</a>}
-<a href=#196 id=196 data-nosnippet>196</a>
-<a href=#197 id=197 data-nosnippet>197</a><span class="attr">#[cfg(test)]
-<a href=#198 id=198 data-nosnippet>198</a></span><span
class="kw">pub</span>(<span class="kw">crate</span>) <span class="kw">mod
</span>tests {
-<a href=#199 id=199 data-nosnippet>199</a> <span class="kw">use
</span>std::fs::File;
-<a href=#200 id=200 data-nosnippet>200</a> <span class="kw">use
</span>std::path::Path;
-<a href=#201 id=201 data-nosnippet>201</a> <span class="kw">use
</span>std::sync::Arc;
-<a href=#202 id=202 data-nosnippet>202</a>
-<a href=#203 id=203 data-nosnippet>203</a> <span class="kw">use
</span>arrow_array::{Int64Array, RecordBatch, StringArray};
-<a href=#204 id=204 data-nosnippet>204</a> <span class="kw">use
</span>arrow_schema::Schema <span class="kw">as </span>ArrowSchema;
-<a href=#205 id=205 data-nosnippet>205</a> <span class="kw">use
</span>parquet::arrow::{ArrowWriter, PARQUET_FIELD_ID_META_KEY};
-<a href=#206 id=206 data-nosnippet>206</a> <span class="kw">use
</span>parquet::basic::Compression;
-<a href=#207 id=207 data-nosnippet>207</a> <span class="kw">use
</span>parquet::file::properties::WriterProperties;
-<a href=#208 id=208 data-nosnippet>208</a> <span class="kw">use
</span>tempfile::TempDir;
-<a href=#209 id=209 data-nosnippet>209</a>
-<a href=#210 id=210 data-nosnippet>210</a> <span class="kw">use
super</span>::<span class="kw-2">*</span>;
-<a href=#211 id=211 data-nosnippet>211</a> <span class="kw">use
</span><span
class="kw">crate</span>::arrow::caching_delete_file_loader::CachingDeleteFileLoader;
-<a href=#212 id=212 data-nosnippet>212</a> <span class="kw">use
</span><span class="kw">crate</span>::io::FileIO;
-<a href=#213 id=213 data-nosnippet>213</a> <span class="kw">use
</span><span class="kw">crate</span>::spec::{DataFileFormat, Schema};
-<a href=#214 id=214 data-nosnippet>214</a>
-<a href=#215 id=215 data-nosnippet>215</a> <span class="kw">type
</span>ArrowSchemaRef = Arc<ArrowSchema>;
+<a href=#100 id=100 data-nosnippet>100</a> notifier.notified().<span
class="kw">await</span>;
+<a href=#101 id=101 data-nosnippet>101</a>
+<a href=#102 id=102 data-nosnippet>102</a> <span class="kw">match
</span><span
class="self">self</span>.state.read().unwrap().equality_deletes.get(file_path) {
+<a href=#103 id=103 data-nosnippet>103</a> <span
class="prelude-val">Some</span>(EqDelState::Loaded(predicate)) => <span
class="prelude-val">Some</span>(predicate.clone()),
+<a href=#104 id=104 data-nosnippet>104</a> <span class="kw">_
</span>=> <span class="macro">unreachable!</span>(<span
class="string">"Cannot be any other state than loaded"</span>),
+<a href=#105 id=105 data-nosnippet>105</a> }
+<a href=#106 id=106 data-nosnippet>106</a> }
+<a href=#107 id=107 data-nosnippet>107</a>
+<a href=#108 id=108 data-nosnippet>108</a> <span class="doccomment">///
Builds eq delete predicate for the provided task.
+<a href=#109 id=109 data-nosnippet>109</a> </span><span
class="kw">pub</span>(<span class="kw">crate</span>) <span class="kw">async fn
</span>build_equality_delete_predicate(
+<a href=#110 id=110 data-nosnippet>110</a> <span
class="kw-2">&</span><span class="self">self</span>,
+<a href=#111 id=111 data-nosnippet>111</a> file_scan_task: <span
class="kw-2">&</span>FileScanTask,
+<a href=#112 id=112 data-nosnippet>112</a> ) -> <span
class="prelude-ty">Result</span><<span
class="prelude-ty">Option</span><BoundPredicate>> {
+<a href=#113 id=113 data-nosnippet>113</a> <span class="comment">// *
Filter the task's deletes into just the Equality deletes
+<a href=#114 id=114 data-nosnippet>114</a> // * Retrieve the unbound
predicate for each from self.state.equality_deletes
+<a href=#115 id=115 data-nosnippet>115</a> // * Logical-AND them all
together to get a single combined `Predicate`
+<a href=#116 id=116 data-nosnippet>116</a> // * Bind the predicate to
the task's schema to get a `BoundPredicate`
+<a href=#117 id=117 data-nosnippet>117</a>
+<a href=#118 id=118 data-nosnippet>118</a> </span><span class="kw">let
</span><span class="kw-2">mut </span>combined_predicate = AlwaysTrue;
+<a href=#119 id=119 data-nosnippet>119</a> <span class="kw">for
</span>delete <span class="kw">in </span><span
class="kw-2">&</span>file_scan_task.deletes {
+<a href=#120 id=120 data-nosnippet>120</a> <span class="kw">if
</span>!is_equality_delete(delete) {
+<a href=#121 id=121 data-nosnippet>121</a> <span
class="kw">continue</span>;
+<a href=#122 id=122 data-nosnippet>122</a> }
+<a href=#123 id=123 data-nosnippet>123</a>
+<a href=#124 id=124 data-nosnippet>124</a> <span class="kw">let
</span><span class="prelude-val">Some</span>(predicate) = <span
class="self">self
+<a href=#125 id=125 data-nosnippet>125</a>
</span>.get_equality_delete_predicate_for_delete_file_path(<span
class="kw-2">&</span>delete.file_path)
+<a href=#126 id=126 data-nosnippet>126</a> .<span
class="kw">await
+<a href=#127 id=127 data-nosnippet>127</a> else </span>{
+<a href=#128 id=128 data-nosnippet>128</a> <span
class="kw">return </span><span class="prelude-val">Err</span>(Error::new(
+<a href=#129 id=129 data-nosnippet>129</a>
ErrorKind::Unexpected,
+<a href=#130 id=130 data-nosnippet>130</a> <span
class="macro">format!</span>(
+<a href=#131 id=131 data-nosnippet>131</a> <span
class="string">"Missing predicate for equality delete file '{}'"</span>,
+<a href=#132 id=132 data-nosnippet>132</a>
delete.file_path
+<a href=#133 id=133 data-nosnippet>133</a> ),
+<a href=#134 id=134 data-nosnippet>134</a> ));
+<a href=#135 id=135 data-nosnippet>135</a> };
+<a href=#136 id=136 data-nosnippet>136</a>
+<a href=#137 id=137 data-nosnippet>137</a> combined_predicate =
combined_predicate.and(predicate);
+<a href=#138 id=138 data-nosnippet>138</a> }
+<a href=#139 id=139 data-nosnippet>139</a>
+<a href=#140 id=140 data-nosnippet>140</a> <span class="kw">if
</span>combined_predicate == AlwaysTrue {
+<a href=#141 id=141 data-nosnippet>141</a> <span class="kw">return
</span><span class="prelude-val">Ok</span>(<span
class="prelude-val">None</span>);
+<a href=#142 id=142 data-nosnippet>142</a> }
+<a href=#143 id=143 data-nosnippet>143</a>
+<a href=#144 id=144 data-nosnippet>144</a> <span class="comment">//
TODO: handle case-insensitive case
+<a href=#145 id=145 data-nosnippet>145</a> </span><span class="kw">let
</span>bound_predicate = combined_predicate.bind(file_scan_task.schema.clone(),
<span class="bool-val">false</span>)<span class="question-mark">?</span>;
+<a href=#146 id=146 data-nosnippet>146</a> <span
class="prelude-val">Ok</span>(<span
class="prelude-val">Some</span>(bound_predicate))
+<a href=#147 id=147 data-nosnippet>147</a> }
+<a href=#148 id=148 data-nosnippet>148</a>
+<a href=#149 id=149 data-nosnippet>149</a> <span
class="kw">pub</span>(<span class="kw">crate</span>) <span class="kw">fn
</span>upsert_delete_vector(
+<a href=#150 id=150 data-nosnippet>150</a> <span class="kw-2">&mut
</span><span class="self">self</span>,
+<a href=#151 id=151 data-nosnippet>151</a> data_file_path: String,
+<a href=#152 id=152 data-nosnippet>152</a> delete_vector: DeleteVector,
+<a href=#153 id=153 data-nosnippet>153</a> ) {
+<a href=#154 id=154 data-nosnippet>154</a> <span class="kw">let
</span><span class="kw-2">mut </span>state = <span
class="self">self</span>.state.write().unwrap();
+<a href=#155 id=155 data-nosnippet>155</a>
+<a href=#156 id=156 data-nosnippet>156</a> <span class="kw">let
</span><span class="prelude-val">Some</span>(entry) =
state.delete_vectors.get_mut(<span class="kw-2">&</span>data_file_path)
<span class="kw">else </span>{
+<a href=#157 id=157 data-nosnippet>157</a> state
+<a href=#158 id=158 data-nosnippet>158</a> .delete_vectors
+<a href=#159 id=159 data-nosnippet>159</a>
.insert(data_file_path, Arc::new(Mutex::new(delete_vector)));
+<a href=#160 id=160 data-nosnippet>160</a> <span
class="kw">return</span>;
+<a href=#161 id=161 data-nosnippet>161</a> };
+<a href=#162 id=162 data-nosnippet>162</a>
+<a href=#163 id=163 data-nosnippet>163</a> <span
class="kw-2">*</span>entry.lock().unwrap() |= delete_vector;
+<a href=#164 id=164 data-nosnippet>164</a> }
+<a href=#165 id=165 data-nosnippet>165</a>
+<a href=#166 id=166 data-nosnippet>166</a> <span
class="kw">pub</span>(<span class="kw">crate</span>) <span class="kw">fn
</span>insert_equality_delete(
+<a href=#167 id=167 data-nosnippet>167</a> <span
class="kw-2">&</span><span class="self">self</span>,
+<a href=#168 id=168 data-nosnippet>168</a> delete_file_path: <span
class="kw-2">&</span>str,
+<a href=#169 id=169 data-nosnippet>169</a> eq_del:
Receiver<Predicate>,
+<a href=#170 id=170 data-nosnippet>170</a> ) {
+<a href=#171 id=171 data-nosnippet>171</a> <span class="kw">let
</span>notify = Arc::new(Notify::new());
+<a href=#172 id=172 data-nosnippet>172</a> {
+<a href=#173 id=173 data-nosnippet>173</a> <span class="kw">let
</span><span class="kw-2">mut </span>state = <span
class="self">self</span>.state.write().unwrap();
+<a href=#174 id=174 data-nosnippet>174</a>
state.equality_deletes.insert(
+<a href=#175 id=175 data-nosnippet>175</a>
delete_file_path.to_string(),
+<a href=#176 id=176 data-nosnippet>176</a>
EqDelState::Loading(notify.clone()),
+<a href=#177 id=177 data-nosnippet>177</a> );
+<a href=#178 id=178 data-nosnippet>178</a> }
+<a href=#179 id=179 data-nosnippet>179</a>
+<a href=#180 id=180 data-nosnippet>180</a> <span class="kw">let
</span>state = <span class="self">self</span>.state.clone();
+<a href=#181 id=181 data-nosnippet>181</a> <span class="kw">let
</span>delete_file_path = delete_file_path.to_string();
+<a href=#182 id=182 data-nosnippet>182</a> <span
class="kw">crate</span>::runtime::spawn(<span class="kw">async move </span>{
+<a href=#183 id=183 data-nosnippet>183</a> <span class="kw">let
</span>eq_del = eq_del.<span class="kw">await</span>.unwrap();
+<a href=#184 id=184 data-nosnippet>184</a> {
+<a href=#185 id=185 data-nosnippet>185</a> <span class="kw">let
</span><span class="kw-2">mut </span>state = state.write().unwrap();
+<a href=#186 id=186 data-nosnippet>186</a> state
+<a href=#187 id=187 data-nosnippet>187</a> .equality_deletes
+<a href=#188 id=188 data-nosnippet>188</a>
.insert(delete_file_path, EqDelState::Loaded(eq_del));
+<a href=#189 id=189 data-nosnippet>189</a> }
+<a href=#190 id=190 data-nosnippet>190</a> notify.notify_waiters();
+<a href=#191 id=191 data-nosnippet>191</a> });
+<a href=#192 id=192 data-nosnippet>192</a> }
+<a href=#193 id=193 data-nosnippet>193</a>}
+<a href=#194 id=194 data-nosnippet>194</a>
+<a href=#195 id=195 data-nosnippet>195</a><span class="kw">pub</span>(<span
class="kw">crate</span>) <span class="kw">fn </span>is_equality_delete(f: <span
class="kw-2">&</span>FileScanTaskDeleteFile) -> bool {
+<a href=#196 id=196 data-nosnippet>196</a> <span
class="macro">matches!</span>(f.file_type, DataContentType::EqualityDeletes)
+<a href=#197 id=197 data-nosnippet>197</a>}
+<a href=#198 id=198 data-nosnippet>198</a>
+<a href=#199 id=199 data-nosnippet>199</a><span class="attr">#[cfg(test)]
+<a href=#200 id=200 data-nosnippet>200</a></span><span
class="kw">pub</span>(<span class="kw">crate</span>) <span class="kw">mod
</span>tests {
+<a href=#201 id=201 data-nosnippet>201</a> <span class="kw">use
</span>std::fs::File;
+<a href=#202 id=202 data-nosnippet>202</a> <span class="kw">use
</span>std::path::Path;
+<a href=#203 id=203 data-nosnippet>203</a> <span class="kw">use
</span>std::sync::Arc;
+<a href=#204 id=204 data-nosnippet>204</a>
+<a href=#205 id=205 data-nosnippet>205</a> <span class="kw">use
</span>arrow_array::{Int64Array, RecordBatch, StringArray};
+<a href=#206 id=206 data-nosnippet>206</a> <span class="kw">use
</span>arrow_schema::Schema <span class="kw">as </span>ArrowSchema;
+<a href=#207 id=207 data-nosnippet>207</a> <span class="kw">use
</span>parquet::arrow::{ArrowWriter, PARQUET_FIELD_ID_META_KEY};
+<a href=#208 id=208 data-nosnippet>208</a> <span class="kw">use
</span>parquet::basic::Compression;
+<a href=#209 id=209 data-nosnippet>209</a> <span class="kw">use
</span>parquet::file::properties::WriterProperties;
+<a href=#210 id=210 data-nosnippet>210</a> <span class="kw">use
</span>tempfile::TempDir;
+<a href=#211 id=211 data-nosnippet>211</a>
+<a href=#212 id=212 data-nosnippet>212</a> <span class="kw">use
super</span>::<span class="kw-2">*</span>;
+<a href=#213 id=213 data-nosnippet>213</a> <span class="kw">use
</span><span
class="kw">crate</span>::arrow::caching_delete_file_loader::CachingDeleteFileLoader;
+<a href=#214 id=214 data-nosnippet>214</a> <span class="kw">use
</span><span class="kw">crate</span>::io::FileIO;
+<a href=#215 id=215 data-nosnippet>215</a> <span class="kw">use
</span><span class="kw">crate</span>::spec::{DataFileFormat, Schema};
<a href=#216 id=216 data-nosnippet>216</a>
-<a href=#217 id=217 data-nosnippet>217</a> <span class="kw">const
</span>FIELD_ID_POSITIONAL_DELETE_FILE_PATH: u64 = <span
class="number">2147483546</span>;
-<a href=#218 id=218 data-nosnippet>218</a> <span class="kw">const
</span>FIELD_ID_POSITIONAL_DELETE_POS: u64 = <span
class="number">2147483545</span>;
-<a href=#219 id=219 data-nosnippet>219</a>
-<a href=#220 id=220 data-nosnippet>220</a> <span class="attr">#[tokio::test]
-<a href=#221 id=221 data-nosnippet>221</a> </span><span class="kw">async fn
</span>test_delete_file_filter_load_deletes() {
-<a href=#222 id=222 data-nosnippet>222</a> <span class="kw">let
</span>tmp_dir = TempDir::new().unwrap();
-<a href=#223 id=223 data-nosnippet>223</a> <span class="kw">let
</span>table_location = tmp_dir.path();
-<a href=#224 id=224 data-nosnippet>224</a> <span class="kw">let
</span>file_io = FileIO::from_path(table_location.as_os_str().to_str().unwrap())
-<a href=#225 id=225 data-nosnippet>225</a> .unwrap()
-<a href=#226 id=226 data-nosnippet>226</a> .build()
-<a href=#227 id=227 data-nosnippet>227</a> .unwrap();
-<a href=#228 id=228 data-nosnippet>228</a>
-<a href=#229 id=229 data-nosnippet>229</a> <span class="kw">let
</span>delete_file_loader = CachingDeleteFileLoader::new(file_io.clone(), <span
class="number">10</span>);
+<a href=#217 id=217 data-nosnippet>217</a> <span class="kw">type
</span>ArrowSchemaRef = Arc<ArrowSchema>;
+<a href=#218 id=218 data-nosnippet>218</a>
+<a href=#219 id=219 data-nosnippet>219</a> <span class="kw">const
</span>FIELD_ID_POSITIONAL_DELETE_FILE_PATH: u64 = <span
class="number">2147483546</span>;
+<a href=#220 id=220 data-nosnippet>220</a> <span class="kw">const
</span>FIELD_ID_POSITIONAL_DELETE_POS: u64 = <span
class="number">2147483545</span>;
+<a href=#221 id=221 data-nosnippet>221</a>
+<a href=#222 id=222 data-nosnippet>222</a> <span class="attr">#[tokio::test]
+<a href=#223 id=223 data-nosnippet>223</a> </span><span class="kw">async fn
</span>test_delete_file_filter_load_deletes() {
+<a href=#224 id=224 data-nosnippet>224</a> <span class="kw">let
</span>tmp_dir = TempDir::new().unwrap();
+<a href=#225 id=225 data-nosnippet>225</a> <span class="kw">let
</span>table_location = tmp_dir.path();
+<a href=#226 id=226 data-nosnippet>226</a> <span class="kw">let
</span>file_io = FileIO::from_path(table_location.as_os_str().to_str().unwrap())
+<a href=#227 id=227 data-nosnippet>227</a> .unwrap()
+<a href=#228 id=228 data-nosnippet>228</a> .build()
+<a href=#229 id=229 data-nosnippet>229</a> .unwrap();
<a href=#230 id=230 data-nosnippet>230</a>
-<a href=#231 id=231 data-nosnippet>231</a> <span class="kw">let
</span>file_scan_tasks = setup(table_location);
+<a href=#231 id=231 data-nosnippet>231</a> <span class="kw">let
</span>delete_file_loader = CachingDeleteFileLoader::new(file_io.clone(), <span
class="number">10</span>);
<a href=#232 id=232 data-nosnippet>232</a>
-<a href=#233 id=233 data-nosnippet>233</a> <span class="kw">let
</span>delete_filter = delete_file_loader
-<a href=#234 id=234 data-nosnippet>234</a> .load_deletes(<span
class="kw-2">&</span>file_scan_tasks[<span
class="number">0</span>].deletes, file_scan_tasks[<span
class="number">0</span>].schema_ref())
-<a href=#235 id=235 data-nosnippet>235</a> .<span class="kw">await
-<a href=#236 id=236 data-nosnippet>236</a> </span>.unwrap()
-<a href=#237 id=237 data-nosnippet>237</a> .unwrap();
-<a href=#238 id=238 data-nosnippet>238</a>
-<a href=#239 id=239 data-nosnippet>239</a> <span class="kw">let
</span>result = delete_filter
-<a href=#240 id=240 data-nosnippet>240</a> .get_delete_vector(<span
class="kw-2">&</span>file_scan_tasks[<span class="number">0</span>])
-<a href=#241 id=241 data-nosnippet>241</a> .unwrap();
-<a href=#242 id=242 data-nosnippet>242</a> <span
class="macro">assert_eq!</span>(result.lock().unwrap().len(), <span
class="number">12</span>); <span class="comment">// pos dels from pos del file
1 and 2
-<a href=#243 id=243 data-nosnippet>243</a>
-<a href=#244 id=244 data-nosnippet>244</a> </span><span class="kw">let
</span>delete_filter = delete_file_loader
-<a href=#245 id=245 data-nosnippet>245</a> .load_deletes(<span
class="kw-2">&</span>file_scan_tasks[<span
class="number">1</span>].deletes, file_scan_tasks[<span
class="number">1</span>].schema_ref())
-<a href=#246 id=246 data-nosnippet>246</a> .<span class="kw">await
-<a href=#247 id=247 data-nosnippet>247</a> </span>.unwrap()
-<a href=#248 id=248 data-nosnippet>248</a> .unwrap();
-<a href=#249 id=249 data-nosnippet>249</a>
-<a href=#250 id=250 data-nosnippet>250</a> <span class="kw">let
</span>result = delete_filter
-<a href=#251 id=251 data-nosnippet>251</a> .get_delete_vector(<span
class="kw-2">&</span>file_scan_tasks[<span class="number">1</span>])
-<a href=#252 id=252 data-nosnippet>252</a> .unwrap();
-<a href=#253 id=253 data-nosnippet>253</a> <span
class="macro">assert_eq!</span>(result.lock().unwrap().len(), <span
class="number">8</span>); <span class="comment">// no pos dels for file 3
-<a href=#254 id=254 data-nosnippet>254</a> </span>}
-<a href=#255 id=255 data-nosnippet>255</a>
-<a href=#256 id=256 data-nosnippet>256</a> <span
class="kw">pub</span>(<span class="kw">crate</span>) <span class="kw">fn
</span>setup(table_location: <span class="kw-2">&</span>Path) ->
Vec<FileScanTask> {
-<a href=#257 id=257 data-nosnippet>257</a> <span class="kw">let
</span>data_file_schema = Arc::new(Schema::builder().build().unwrap());
-<a href=#258 id=258 data-nosnippet>258</a> <span class="kw">let
</span>positional_delete_schema = create_pos_del_schema();
-<a href=#259 id=259 data-nosnippet>259</a>
-<a href=#260 id=260 data-nosnippet>260</a> <span class="kw">let
</span>file_path_values = [
-<a href=#261 id=261 data-nosnippet>261</a> <span
class="macro">vec!</span>[<span class="macro">format!</span>(<span
class="string">"{}/1.parquet"</span>, table_location.to_str().unwrap()); <span
class="number">8</span>],
-<a href=#262 id=262 data-nosnippet>262</a> <span
class="macro">vec!</span>[<span class="macro">format!</span>(<span
class="string">"{}/1.parquet"</span>, table_location.to_str().unwrap()); <span
class="number">8</span>],
-<a href=#263 id=263 data-nosnippet>263</a> <span
class="macro">vec!</span>[<span class="macro">format!</span>(<span
class="string">"{}/2.parquet"</span>, table_location.to_str().unwrap()); <span
class="number">8</span>],
-<a href=#264 id=264 data-nosnippet>264</a> ];
-<a href=#265 id=265 data-nosnippet>265</a> <span class="kw">let
</span>pos_values = [
-<a href=#266 id=266 data-nosnippet>266</a> <span
class="macro">vec!</span>[<span class="number">0i64</span>, <span
class="number">1</span>, <span class="number">3</span>, <span
class="number">5</span>, <span class="number">6</span>, <span
class="number">8</span>, <span class="number">1022</span>, <span
class="number">1023</span>],
-<a href=#267 id=267 data-nosnippet>267</a> <span
class="macro">vec!</span>[<span class="number">0i64</span>, <span
class="number">1</span>, <span class="number">3</span>, <span
class="number">5</span>, <span class="number">20</span>, <span
class="number">21</span>, <span class="number">22</span>, <span
class="number">23</span>],
+<a href=#233 id=233 data-nosnippet>233</a> <span class="kw">let
</span>file_scan_tasks = setup(table_location);
+<a href=#234 id=234 data-nosnippet>234</a>
+<a href=#235 id=235 data-nosnippet>235</a> <span class="kw">let
</span>delete_filter = delete_file_loader
+<a href=#236 id=236 data-nosnippet>236</a> .load_deletes(<span
class="kw-2">&</span>file_scan_tasks[<span
class="number">0</span>].deletes, file_scan_tasks[<span
class="number">0</span>].schema_ref())
+<a href=#237 id=237 data-nosnippet>237</a> .<span class="kw">await
+<a href=#238 id=238 data-nosnippet>238</a> </span>.unwrap()
+<a href=#239 id=239 data-nosnippet>239</a> .unwrap();
+<a href=#240 id=240 data-nosnippet>240</a>
+<a href=#241 id=241 data-nosnippet>241</a> <span class="kw">let
</span>result = delete_filter
+<a href=#242 id=242 data-nosnippet>242</a> .get_delete_vector(<span
class="kw-2">&</span>file_scan_tasks[<span class="number">0</span>])
+<a href=#243 id=243 data-nosnippet>243</a> .unwrap();
+<a href=#244 id=244 data-nosnippet>244</a> <span
class="macro">assert_eq!</span>(result.lock().unwrap().len(), <span
class="number">12</span>); <span class="comment">// pos dels from pos del file
1 and 2
+<a href=#245 id=245 data-nosnippet>245</a>
+<a href=#246 id=246 data-nosnippet>246</a> </span><span class="kw">let
</span>delete_filter = delete_file_loader
+<a href=#247 id=247 data-nosnippet>247</a> .load_deletes(<span
class="kw-2">&</span>file_scan_tasks[<span
class="number">1</span>].deletes, file_scan_tasks[<span
class="number">1</span>].schema_ref())
+<a href=#248 id=248 data-nosnippet>248</a> .<span class="kw">await
+<a href=#249 id=249 data-nosnippet>249</a> </span>.unwrap()
+<a href=#250 id=250 data-nosnippet>250</a> .unwrap();
+<a href=#251 id=251 data-nosnippet>251</a>
+<a href=#252 id=252 data-nosnippet>252</a> <span class="kw">let
</span>result = delete_filter
+<a href=#253 id=253 data-nosnippet>253</a> .get_delete_vector(<span
class="kw-2">&</span>file_scan_tasks[<span class="number">1</span>])
+<a href=#254 id=254 data-nosnippet>254</a> .unwrap();
+<a href=#255 id=255 data-nosnippet>255</a> <span
class="macro">assert_eq!</span>(result.lock().unwrap().len(), <span
class="number">8</span>); <span class="comment">// no pos dels for file 3
+<a href=#256 id=256 data-nosnippet>256</a> </span>}
+<a href=#257 id=257 data-nosnippet>257</a>
+<a href=#258 id=258 data-nosnippet>258</a> <span
class="kw">pub</span>(<span class="kw">crate</span>) <span class="kw">fn
</span>setup(table_location: <span class="kw-2">&</span>Path) ->
Vec<FileScanTask> {
+<a href=#259 id=259 data-nosnippet>259</a> <span class="kw">let
</span>data_file_schema = Arc::new(Schema::builder().build().unwrap());
+<a href=#260 id=260 data-nosnippet>260</a> <span class="kw">let
</span>positional_delete_schema = create_pos_del_schema();
+<a href=#261 id=261 data-nosnippet>261</a>
+<a href=#262 id=262 data-nosnippet>262</a> <span class="kw">let
</span>file_path_values = [
+<a href=#263 id=263 data-nosnippet>263</a> <span
class="macro">vec!</span>[<span class="macro">format!</span>(<span
class="string">"{}/1.parquet"</span>, table_location.to_str().unwrap()); <span
class="number">8</span>],
+<a href=#264 id=264 data-nosnippet>264</a> <span
class="macro">vec!</span>[<span class="macro">format!</span>(<span
class="string">"{}/1.parquet"</span>, table_location.to_str().unwrap()); <span
class="number">8</span>],
+<a href=#265 id=265 data-nosnippet>265</a> <span
class="macro">vec!</span>[<span class="macro">format!</span>(<span
class="string">"{}/2.parquet"</span>, table_location.to_str().unwrap()); <span
class="number">8</span>],
+<a href=#266 id=266 data-nosnippet>266</a> ];
+<a href=#267 id=267 data-nosnippet>267</a> <span class="kw">let
</span>pos_values = [
<a href=#268 id=268 data-nosnippet>268</a> <span
class="macro">vec!</span>[<span class="number">0i64</span>, <span
class="number">1</span>, <span class="number">3</span>, <span
class="number">5</span>, <span class="number">6</span>, <span
class="number">8</span>, <span class="number">1022</span>, <span
class="number">1023</span>],
-<a href=#269 id=269 data-nosnippet>269</a> ];
-<a href=#270 id=270 data-nosnippet>270</a>
-<a href=#271 id=271 data-nosnippet>271</a> <span class="kw">let
</span>props = WriterProperties::builder()
-<a href=#272 id=272 data-nosnippet>272</a>
.set_compression(Compression::SNAPPY)
-<a href=#273 id=273 data-nosnippet>273</a> .build();
-<a href=#274 id=274 data-nosnippet>274</a>
-<a href=#275 id=275 data-nosnippet>275</a> <span class="kw">for
</span>n <span class="kw">in </span><span class="number">1</span>..=<span
class="number">3 </span>{
-<a href=#276 id=276 data-nosnippet>276</a> <span class="kw">let
</span>file_path_vals = file_path_values.get(n - <span
class="number">1</span>).unwrap();
-<a href=#277 id=277 data-nosnippet>277</a> <span class="kw">let
</span>file_path_col = Arc::new(StringArray::from_iter_values(file_path_vals));
-<a href=#278 id=278 data-nosnippet>278</a>
-<a href=#279 id=279 data-nosnippet>279</a> <span class="kw">let
</span>pos_vals = pos_values.get(n - <span class="number">1</span>).unwrap();
-<a href=#280 id=280 data-nosnippet>280</a> <span class="kw">let
</span>pos_col = Arc::new(Int64Array::from_iter_values(pos_vals.clone()));
-<a href=#281 id=281 data-nosnippet>281</a>
-<a href=#282 id=282 data-nosnippet>282</a> <span class="kw">let
</span>positional_deletes_to_write =
-<a href=#283 id=283 data-nosnippet>283</a>
RecordBatch::try_new(positional_delete_schema.clone(), <span
class="macro">vec!</span>[
-<a href=#284 id=284 data-nosnippet>284</a>
file_path_col.clone(),
-<a href=#285 id=285 data-nosnippet>285</a> pos_col.clone(),
-<a href=#286 id=286 data-nosnippet>286</a> ])
-<a href=#287 id=287 data-nosnippet>287</a> .unwrap();
-<a href=#288 id=288 data-nosnippet>288</a>
-<a href=#289 id=289 data-nosnippet>289</a> <span class="kw">let
</span>file = File::create(<span class="macro">format!</span>(
-<a href=#290 id=290 data-nosnippet>290</a> <span
class="string">"{}/pos-del-{}.parquet"</span>,
-<a href=#291 id=291 data-nosnippet>291</a>
table_location.to_str().unwrap(),
-<a href=#292 id=292 data-nosnippet>292</a> n
-<a href=#293 id=293 data-nosnippet>293</a> ))
-<a href=#294 id=294 data-nosnippet>294</a> .unwrap();
-<a href=#295 id=295 data-nosnippet>295</a> <span class="kw">let
</span><span class="kw-2">mut </span>writer = ArrowWriter::try_new(
-<a href=#296 id=296 data-nosnippet>296</a> file,
-<a href=#297 id=297 data-nosnippet>297</a>
positional_deletes_to_write.schema(),
-<a href=#298 id=298 data-nosnippet>298</a> <span
class="prelude-val">Some</span>(props.clone()),
-<a href=#299 id=299 data-nosnippet>299</a> )
-<a href=#300 id=300 data-nosnippet>300</a> .unwrap();
-<a href=#301 id=301 data-nosnippet>301</a>
-<a href=#302 id=302 data-nosnippet>302</a> writer
-<a href=#303 id=303 data-nosnippet>303</a> .write(<span
class="kw-2">&</span>positional_deletes_to_write)
-<a href=#304 id=304 data-nosnippet>304</a> .expect(<span
class="string">"Writing batch"</span>);
-<a href=#305 id=305 data-nosnippet>305</a>
-<a href=#306 id=306 data-nosnippet>306</a> <span class="comment">//
writer must be closed to write footer
-<a href=#307 id=307 data-nosnippet>307</a>
</span>writer.close().unwrap();
-<a href=#308 id=308 data-nosnippet>308</a> }
-<a href=#309 id=309 data-nosnippet>309</a>
-<a href=#310 id=310 data-nosnippet>310</a> <span class="kw">let
</span>pos_del_1 = FileScanTaskDeleteFile {
-<a href=#311 id=311 data-nosnippet>311</a> file_path: <span
class="macro">format!</span>(<span
class="string">"{}/pos-del-1.parquet"</span>, table_location.to_str().unwrap()),
-<a href=#312 id=312 data-nosnippet>312</a> file_type:
DataContentType::PositionDeletes,
-<a href=#313 id=313 data-nosnippet>313</a> partition_spec_id: <span
class="number">0</span>,
-<a href=#314 id=314 data-nosnippet>314</a> equality_ids: <span
class="prelude-val">None</span>,
-<a href=#315 id=315 data-nosnippet>315</a> };
-<a href=#316 id=316 data-nosnippet>316</a>
-<a href=#317 id=317 data-nosnippet>317</a> <span class="kw">let
</span>pos_del_2 = FileScanTaskDeleteFile {
-<a href=#318 id=318 data-nosnippet>318</a> file_path: <span
class="macro">format!</span>(<span
class="string">"{}/pos-del-2.parquet"</span>, table_location.to_str().unwrap()),
-<a href=#319 id=319 data-nosnippet>319</a> file_type:
DataContentType::PositionDeletes,
-<a href=#320 id=320 data-nosnippet>320</a> partition_spec_id: <span
class="number">0</span>,
-<a href=#321 id=321 data-nosnippet>321</a> equality_ids: <span
class="prelude-val">None</span>,
-<a href=#322 id=322 data-nosnippet>322</a> };
-<a href=#323 id=323 data-nosnippet>323</a>
-<a href=#324 id=324 data-nosnippet>324</a> <span class="kw">let
</span>pos_del_3 = FileScanTaskDeleteFile {
-<a href=#325 id=325 data-nosnippet>325</a> file_path: <span
class="macro">format!</span>(<span
class="string">"{}/pos-del-3.parquet"</span>, table_location.to_str().unwrap()),
-<a href=#326 id=326 data-nosnippet>326</a> file_type:
DataContentType::PositionDeletes,
-<a href=#327 id=327 data-nosnippet>327</a> partition_spec_id: <span
class="number">0</span>,
-<a href=#328 id=328 data-nosnippet>328</a> equality_ids: <span
class="prelude-val">None</span>,
-<a href=#329 id=329 data-nosnippet>329</a> };
-<a href=#330 id=330 data-nosnippet>330</a>
-<a href=#331 id=331 data-nosnippet>331</a> <span class="kw">let
</span>file_scan_tasks = <span class="macro">vec!</span>[
-<a href=#332 id=332 data-nosnippet>332</a> FileScanTask {
-<a href=#333 id=333 data-nosnippet>333</a> start: <span
class="number">0</span>,
-<a href=#334 id=334 data-nosnippet>334</a> length: <span
class="number">0</span>,
-<a href=#335 id=335 data-nosnippet>335</a> record_count: <span
class="prelude-val">None</span>,
-<a href=#336 id=336 data-nosnippet>336</a> data_file_path:
<span class="macro">format!</span>(<span class="string">"{}/1.parquet"</span>,
table_location.to_str().unwrap()),
-<a href=#337 id=337 data-nosnippet>337</a> data_file_format:
DataFileFormat::Parquet,
-<a href=#338 id=338 data-nosnippet>338</a> schema:
data_file_schema.clone(),
-<a href=#339 id=339 data-nosnippet>339</a> project_field_ids:
<span class="macro">vec!</span>[],
-<a href=#340 id=340 data-nosnippet>340</a> predicate: <span
class="prelude-val">None</span>,
-<a href=#341 id=341 data-nosnippet>341</a> deletes: <span
class="macro">vec!</span>[pos_del_1, pos_del_2.clone()],
-<a href=#342 id=342 data-nosnippet>342</a> },
-<a href=#343 id=343 data-nosnippet>343</a> FileScanTask {
-<a href=#344 id=344 data-nosnippet>344</a> start: <span
class="number">0</span>,
-<a href=#345 id=345 data-nosnippet>345</a> length: <span
class="number">0</span>,
-<a href=#346 id=346 data-nosnippet>346</a> record_count: <span
class="prelude-val">None</span>,
-<a href=#347 id=347 data-nosnippet>347</a> data_file_path:
<span class="macro">format!</span>(<span class="string">"{}/2.parquet"</span>,
table_location.to_str().unwrap()),
-<a href=#348 id=348 data-nosnippet>348</a> data_file_format:
DataFileFormat::Parquet,
-<a href=#349 id=349 data-nosnippet>349</a> schema:
data_file_schema.clone(),
-<a href=#350 id=350 data-nosnippet>350</a> project_field_ids:
<span class="macro">vec!</span>[],
-<a href=#351 id=351 data-nosnippet>351</a> predicate: <span
class="prelude-val">None</span>,
-<a href=#352 id=352 data-nosnippet>352</a> deletes: <span
class="macro">vec!</span>[pos_del_3],
-<a href=#353 id=353 data-nosnippet>353</a> },
-<a href=#354 id=354 data-nosnippet>354</a> ];
-<a href=#355 id=355 data-nosnippet>355</a>
-<a href=#356 id=356 data-nosnippet>356</a> file_scan_tasks
-<a href=#357 id=357 data-nosnippet>357</a> }
-<a href=#358 id=358 data-nosnippet>358</a>
-<a href=#359 id=359 data-nosnippet>359</a> <span
class="kw">pub</span>(<span class="kw">crate</span>) <span class="kw">fn
</span>create_pos_del_schema() -> ArrowSchemaRef {
-<a href=#360 id=360 data-nosnippet>360</a> <span class="kw">let
</span>fields = <span class="macro">vec!</span>[
-<a href=#361 id=361 data-nosnippet>361</a>
arrow_schema::Field::new(<span class="string">"file_path"</span>,
arrow_schema::DataType::Utf8, <span class="bool-val">false</span>)
-<a href=#362 id=362 data-nosnippet>362</a>
.with_metadata(HashMap::from([(
-<a href=#363 id=363 data-nosnippet>363</a>
PARQUET_FIELD_ID_META_KEY.to_string(),
-<a href=#364 id=364 data-nosnippet>364</a>
FIELD_ID_POSITIONAL_DELETE_FILE_PATH.to_string(),
-<a href=#365 id=365 data-nosnippet>365</a> )])),
-<a href=#366 id=366 data-nosnippet>366</a>
arrow_schema::Field::new(<span class="string">"pos"</span>,
arrow_schema::DataType::Int64, <span
class="bool-val">false</span>).with_metadata(
-<a href=#367 id=367 data-nosnippet>367</a> HashMap::from([(
-<a href=#368 id=368 data-nosnippet>368</a>
PARQUET_FIELD_ID_META_KEY.to_string(),
-<a href=#369 id=369 data-nosnippet>369</a>
FIELD_ID_POSITIONAL_DELETE_POS.to_string(),
-<a href=#370 id=370 data-nosnippet>370</a> )]),
-<a href=#371 id=371 data-nosnippet>371</a> ),
-<a href=#372 id=372 data-nosnippet>372</a> ];
-<a href=#373 id=373 data-nosnippet>373</a>
Arc::new(arrow_schema::Schema::new(fields))
-<a href=#374 id=374 data-nosnippet>374</a> }
-<a href=#375 id=375
data-nosnippet>375</a>}</code></pre></div></section></main></body></html>
\ No newline at end of file
+<a href=#269 id=269 data-nosnippet>269</a> <span
class="macro">vec!</span>[<span class="number">0i64</span>, <span
class="number">1</span>, <span class="number">3</span>, <span
class="number">5</span>, <span class="number">20</span>, <span
class="number">21</span>, <span class="number">22</span>, <span
class="number">23</span>],
+<a href=#270 id=270 data-nosnippet>270</a> <span
class="macro">vec!</span>[<span class="number">0i64</span>, <span
class="number">1</span>, <span class="number">3</span>, <span
class="number">5</span>, <span class="number">6</span>, <span
class="number">8</span>, <span class="number">1022</span>, <span
class="number">1023</span>],
+<a href=#271 id=271 data-nosnippet>271</a> ];
+<a href=#272 id=272 data-nosnippet>272</a>
+<a href=#273 id=273 data-nosnippet>273</a> <span class="kw">let
</span>props = WriterProperties::builder()
+<a href=#274 id=274 data-nosnippet>274</a>
.set_compression(Compression::SNAPPY)
+<a href=#275 id=275 data-nosnippet>275</a> .build();
+<a href=#276 id=276 data-nosnippet>276</a>
+<a href=#277 id=277 data-nosnippet>277</a> <span class="kw">for
</span>n <span class="kw">in </span><span class="number">1</span>..=<span
class="number">3 </span>{
+<a href=#278 id=278 data-nosnippet>278</a> <span class="kw">let
</span>file_path_vals = file_path_values.get(n - <span
class="number">1</span>).unwrap();
+<a href=#279 id=279 data-nosnippet>279</a> <span class="kw">let
</span>file_path_col = Arc::new(StringArray::from_iter_values(file_path_vals));
+<a href=#280 id=280 data-nosnippet>280</a>
+<a href=#281 id=281 data-nosnippet>281</a> <span class="kw">let
</span>pos_vals = pos_values.get(n - <span class="number">1</span>).unwrap();
+<a href=#282 id=282 data-nosnippet>282</a> <span class="kw">let
</span>pos_col = Arc::new(Int64Array::from_iter_values(pos_vals.clone()));
+<a href=#283 id=283 data-nosnippet>283</a>
+<a href=#284 id=284 data-nosnippet>284</a> <span class="kw">let
</span>positional_deletes_to_write =
+<a href=#285 id=285 data-nosnippet>285</a>
RecordBatch::try_new(positional_delete_schema.clone(), <span
class="macro">vec!</span>[
+<a href=#286 id=286 data-nosnippet>286</a>
file_path_col.clone(),
+<a href=#287 id=287 data-nosnippet>287</a> pos_col.clone(),
+<a href=#288 id=288 data-nosnippet>288</a> ])
+<a href=#289 id=289 data-nosnippet>289</a> .unwrap();
+<a href=#290 id=290 data-nosnippet>290</a>
+<a href=#291 id=291 data-nosnippet>291</a> <span class="kw">let
</span>file = File::create(<span class="macro">format!</span>(
+<a href=#292 id=292 data-nosnippet>292</a> <span
class="string">"{}/pos-del-{}.parquet"</span>,
+<a href=#293 id=293 data-nosnippet>293</a>
table_location.to_str().unwrap(),
+<a href=#294 id=294 data-nosnippet>294</a> n
+<a href=#295 id=295 data-nosnippet>295</a> ))
+<a href=#296 id=296 data-nosnippet>296</a> .unwrap();
+<a href=#297 id=297 data-nosnippet>297</a> <span class="kw">let
</span><span class="kw-2">mut </span>writer = ArrowWriter::try_new(
+<a href=#298 id=298 data-nosnippet>298</a> file,
+<a href=#299 id=299 data-nosnippet>299</a>
positional_deletes_to_write.schema(),
+<a href=#300 id=300 data-nosnippet>300</a> <span
class="prelude-val">Some</span>(props.clone()),
+<a href=#301 id=301 data-nosnippet>301</a> )
+<a href=#302 id=302 data-nosnippet>302</a> .unwrap();
+<a href=#303 id=303 data-nosnippet>303</a>
+<a href=#304 id=304 data-nosnippet>304</a> writer
+<a href=#305 id=305 data-nosnippet>305</a> .write(<span
class="kw-2">&</span>positional_deletes_to_write)
+<a href=#306 id=306 data-nosnippet>306</a> .expect(<span
class="string">"Writing batch"</span>);
+<a href=#307 id=307 data-nosnippet>307</a>
+<a href=#308 id=308 data-nosnippet>308</a> <span class="comment">//
writer must be closed to write footer
+<a href=#309 id=309 data-nosnippet>309</a>
</span>writer.close().unwrap();
+<a href=#310 id=310 data-nosnippet>310</a> }
+<a href=#311 id=311 data-nosnippet>311</a>
+<a href=#312 id=312 data-nosnippet>312</a> <span class="kw">let
</span>pos_del_1 = FileScanTaskDeleteFile {
+<a href=#313 id=313 data-nosnippet>313</a> file_path: <span
class="macro">format!</span>(<span
class="string">"{}/pos-del-1.parquet"</span>, table_location.to_str().unwrap()),
+<a href=#314 id=314 data-nosnippet>314</a> file_type:
DataContentType::PositionDeletes,
+<a href=#315 id=315 data-nosnippet>315</a> partition_spec_id: <span
class="number">0</span>,
+<a href=#316 id=316 data-nosnippet>316</a> equality_ids: <span
class="prelude-val">None</span>,
+<a href=#317 id=317 data-nosnippet>317</a> };
+<a href=#318 id=318 data-nosnippet>318</a>
+<a href=#319 id=319 data-nosnippet>319</a> <span class="kw">let
</span>pos_del_2 = FileScanTaskDeleteFile {
+<a href=#320 id=320 data-nosnippet>320</a> file_path: <span
class="macro">format!</span>(<span
class="string">"{}/pos-del-2.parquet"</span>, table_location.to_str().unwrap()),
+<a href=#321 id=321 data-nosnippet>321</a> file_type:
DataContentType::PositionDeletes,
+<a href=#322 id=322 data-nosnippet>322</a> partition_spec_id: <span
class="number">0</span>,
+<a href=#323 id=323 data-nosnippet>323</a> equality_ids: <span
class="prelude-val">None</span>,
+<a href=#324 id=324 data-nosnippet>324</a> };
+<a href=#325 id=325 data-nosnippet>325</a>
+<a href=#326 id=326 data-nosnippet>326</a> <span class="kw">let
</span>pos_del_3 = FileScanTaskDeleteFile {
+<a href=#327 id=327 data-nosnippet>327</a> file_path: <span
class="macro">format!</span>(<span
class="string">"{}/pos-del-3.parquet"</span>, table_location.to_str().unwrap()),
+<a href=#328 id=328 data-nosnippet>328</a> file_type:
DataContentType::PositionDeletes,
+<a href=#329 id=329 data-nosnippet>329</a> partition_spec_id: <span
class="number">0</span>,
+<a href=#330 id=330 data-nosnippet>330</a> equality_ids: <span
class="prelude-val">None</span>,
+<a href=#331 id=331 data-nosnippet>331</a> };
+<a href=#332 id=332 data-nosnippet>332</a>
+<a href=#333 id=333 data-nosnippet>333</a> <span class="kw">let
</span>file_scan_tasks = <span class="macro">vec!</span>[
+<a href=#334 id=334 data-nosnippet>334</a> FileScanTask {
+<a href=#335 id=335 data-nosnippet>335</a> start: <span
class="number">0</span>,
+<a href=#336 id=336 data-nosnippet>336</a> length: <span
class="number">0</span>,
+<a href=#337 id=337 data-nosnippet>337</a> record_count: <span
class="prelude-val">None</span>,
+<a href=#338 id=338 data-nosnippet>338</a> data_file_path:
<span class="macro">format!</span>(<span class="string">"{}/1.parquet"</span>,
table_location.to_str().unwrap()),
+<a href=#339 id=339 data-nosnippet>339</a> data_file_format:
DataFileFormat::Parquet,
+<a href=#340 id=340 data-nosnippet>340</a> schema:
data_file_schema.clone(),
+<a href=#341 id=341 data-nosnippet>341</a> project_field_ids:
<span class="macro">vec!</span>[],
+<a href=#342 id=342 data-nosnippet>342</a> predicate: <span
class="prelude-val">None</span>,
+<a href=#343 id=343 data-nosnippet>343</a> deletes: <span
class="macro">vec!</span>[pos_del_1, pos_del_2.clone()],
+<a href=#344 id=344 data-nosnippet>344</a> },
+<a href=#345 id=345 data-nosnippet>345</a> FileScanTask {
+<a href=#346 id=346 data-nosnippet>346</a> start: <span
class="number">0</span>,
+<a href=#347 id=347 data-nosnippet>347</a> length: <span
class="number">0</span>,
+<a href=#348 id=348 data-nosnippet>348</a> record_count: <span
class="prelude-val">None</span>,
+<a href=#349 id=349 data-nosnippet>349</a> data_file_path:
<span class="macro">format!</span>(<span class="string">"{}/2.parquet"</span>,
table_location.to_str().unwrap()),
+<a href=#350 id=350 data-nosnippet>350</a> data_file_format:
DataFileFormat::Parquet,
+<a href=#351 id=351 data-nosnippet>351</a> schema:
data_file_schema.clone(),
+<a href=#352 id=352 data-nosnippet>352</a> project_field_ids:
<span class="macro">vec!</span>[],
+<a href=#353 id=353 data-nosnippet>353</a> predicate: <span
class="prelude-val">None</span>,
+<a href=#354 id=354 data-nosnippet>354</a> deletes: <span
class="macro">vec!</span>[pos_del_3],
+<a href=#355 id=355 data-nosnippet>355</a> },
+<a href=#356 id=356 data-nosnippet>356</a> ];
+<a href=#357 id=357 data-nosnippet>357</a>
+<a href=#358 id=358 data-nosnippet>358</a> file_scan_tasks
+<a href=#359 id=359 data-nosnippet>359</a> }
+<a href=#360 id=360 data-nosnippet>360</a>
+<a href=#361 id=361 data-nosnippet>361</a> <span
class="kw">pub</span>(<span class="kw">crate</span>) <span class="kw">fn
</span>create_pos_del_schema() -> ArrowSchemaRef {
+<a href=#362 id=362 data-nosnippet>362</a> <span class="kw">let
</span>fields = <span class="macro">vec!</span>[
+<a href=#363 id=363 data-nosnippet>363</a>
arrow_schema::Field::new(<span class="string">"file_path"</span>,
arrow_schema::DataType::Utf8, <span class="bool-val">false</span>)
+<a href=#364 id=364 data-nosnippet>364</a>
.with_metadata(HashMap::from([(
+<a href=#365 id=365 data-nosnippet>365</a>
PARQUET_FIELD_ID_META_KEY.to_string(),
+<a href=#366 id=366 data-nosnippet>366</a>
FIELD_ID_POSITIONAL_DELETE_FILE_PATH.to_string(),
+<a href=#367 id=367 data-nosnippet>367</a> )])),
+<a href=#368 id=368 data-nosnippet>368</a>
arrow_schema::Field::new(<span class="string">"pos"</span>,
arrow_schema::DataType::Int64, <span
class="bool-val">false</span>).with_metadata(
+<a href=#369 id=369 data-nosnippet>369</a> HashMap::from([(
+<a href=#370 id=370 data-nosnippet>370</a>
PARQUET_FIELD_ID_META_KEY.to_string(),
+<a href=#371 id=371 data-nosnippet>371</a>
FIELD_ID_POSITIONAL_DELETE_POS.to_string(),
+<a href=#372 id=372 data-nosnippet>372</a> )]),
+<a href=#373 id=373 data-nosnippet>373</a> ),
+<a href=#374 id=374 data-nosnippet>374</a> ];
+<a href=#375 id=375 data-nosnippet>375</a>
Arc::new(arrow_schema::Schema::new(fields))
+<a href=#376 id=376 data-nosnippet>376</a> }
+<a href=#377 id=377
data-nosnippet>377</a>}</code></pre></div></section></main></body></html>
\ No newline at end of file