This is an automated email from the ASF dual-hosted git repository.
fokko pushed a commit to branch parquet-1.14.x
in repository https://gitbox.apache.org/repos/asf/parquet-mr.git
The following commit(s) were added to refs/heads/parquet-1.14.x by this push:
new bb8c72d63 PARQUET-2465: Fall back to HadoopConfig (#1339) (#1342)
bb8c72d63 is described below
commit bb8c72d633c3dbe661776b89279cf4d7d6afcc19
Author: Fokko Driesprong <[email protected]>
AuthorDate: Fri May 3 12:58:30 2024 +0200
PARQUET-2465: Fall back to HadoopConfig (#1339) (#1342)
Add fallback logic
We see that this causes the 1.14 to be incompatible
with the previous releases. The config will be created
and right after that the `getWriteSupport(conf)` is called.
But since this method is freshly introduced:
```java
protected WriteSupport<T> getWriteSupport(ParquetConfiguration conf) {
throw new UnsupportedOperationException(
"Override
ParquetWriter$Builder#getWriteSupport(ParquetConfiguration)");
}
```
---
.../main/java/org/apache/parquet/hadoop/ParquetWriter.java | 5 +++--
.../main/java/org/apache/parquet/hadoop/api/InitContext.java | 2 ++
.../main/java/org/apache/parquet/hadoop/api/ReadSupport.java | 11 +++++++----
.../main/java/org/apache/parquet/hadoop/api/WriteSupport.java | 5 ++++-
4 files changed, 16 insertions(+), 7 deletions(-)
diff --git
a/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/ParquetWriter.java
b/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/ParquetWriter.java
index a76b843e7..5c7fcaa22 100644
--- a/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/ParquetWriter.java
+++ b/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/ParquetWriter.java
@@ -495,7 +495,9 @@ public class ParquetWriter<T> implements Closeable {
/**
* @param conf a configuration
* @return an appropriate WriteSupport for the object model.
+ * @deprecated Use {@link #getWriteSupport(ParquetConfiguration)} instead
*/
+ @Deprecated
protected abstract WriteSupport<T> getWriteSupport(Configuration conf);
/**
@@ -503,8 +505,7 @@ public class ParquetWriter<T> implements Closeable {
* @return an appropriate WriteSupport for the object model.
*/
protected WriteSupport<T> getWriteSupport(ParquetConfiguration conf) {
- throw new UnsupportedOperationException(
- "Override
ParquetWriter$Builder#getWriteSupport(ParquetConfiguration)");
+ return
getWriteSupport(ConfigurationUtil.createHadoopConfiguration(conf));
}
/**
diff --git
a/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/api/InitContext.java
b/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/api/InitContext.java
index 06efbcf6a..a9ee43f7f 100644
---
a/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/api/InitContext.java
+++
b/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/api/InitContext.java
@@ -79,7 +79,9 @@ public class InitContext {
/**
* @return the configuration for this job
+ * @deprecated Use {@link #getParquetConfiguration()} instead
*/
+ @Deprecated
public Configuration getConfiguration() {
return ConfigurationUtil.createHadoopConfiguration(configuration);
}
diff --git
a/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/api/ReadSupport.java
b/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/api/ReadSupport.java
index 904def186..1366b6060 100644
---
a/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/api/ReadSupport.java
+++
b/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/api/ReadSupport.java
@@ -21,6 +21,7 @@ package org.apache.parquet.hadoop.api;
import java.util.Map;
import org.apache.hadoop.conf.Configuration;
import org.apache.parquet.conf.ParquetConfiguration;
+import org.apache.parquet.hadoop.util.ConfigurationUtil;
import org.apache.parquet.io.api.RecordMaterializer;
import org.apache.parquet.schema.MessageType;
import org.apache.parquet.schema.MessageTypeParser;
@@ -76,12 +77,12 @@ public abstract class ReadSupport<T> {
* @param keyValueMetaData the app specific metadata from the file
* @param fileSchema the schema of the file
* @return the readContext that defines how to read the file
- * @deprecated override {@link ReadSupport#init(InitContext)} instead
+ * @deprecated override {@link #init(InitContext)} instead
*/
@Deprecated
public ReadContext init(
ParquetConfiguration configuration, Map<String, String>
keyValueMetaData, MessageType fileSchema) {
- throw new UnsupportedOperationException("Override
ReadSupport.init(InitContext)");
+ return init(ConfigurationUtil.createHadoopConfiguration(configuration),
keyValueMetaData, fileSchema);
}
/**
@@ -103,7 +104,9 @@ public abstract class ReadSupport<T> {
* @param fileSchema the schema of the file
* @param readContext returned by the init method
* @return the recordMaterializer that will materialize the records
+ * @deprecated override {@link
#prepareForRead(ParquetConfiguration,Map,MessageType,ReadContext)} instead
*/
+ @Deprecated
public abstract RecordMaterializer<T> prepareForRead(
Configuration configuration,
Map<String, String> keyValueMetaData,
@@ -125,8 +128,8 @@ public abstract class ReadSupport<T> {
Map<String, String> keyValueMetaData,
MessageType fileSchema,
ReadContext readContext) {
- throw new UnsupportedOperationException(
- "Override ReadSupport.prepareForRead(ParquetConfiguration, Map<String,
String>, MessageType, ReadContext)");
+ return prepareForRead(
+ ConfigurationUtil.createHadoopConfiguration(configuration),
keyValueMetaData, fileSchema, readContext);
}
/**
diff --git
a/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/api/WriteSupport.java
b/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/api/WriteSupport.java
index 3a0b35f4f..140206867 100644
---
a/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/api/WriteSupport.java
+++
b/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/api/WriteSupport.java
@@ -24,6 +24,7 @@ import java.util.Map;
import java.util.Objects;
import org.apache.hadoop.conf.Configuration;
import org.apache.parquet.conf.ParquetConfiguration;
+import org.apache.parquet.hadoop.util.ConfigurationUtil;
import org.apache.parquet.io.api.RecordConsumer;
import org.apache.parquet.schema.MessageType;
@@ -99,7 +100,9 @@ public abstract class WriteSupport<T> {
*
* @param configuration the job's configuration
* @return the information needed to write the file
+ * @deprecated override {@link #init(ParquetConfiguration)} instead
*/
+ @Deprecated
public abstract WriteContext init(Configuration configuration);
/**
@@ -109,7 +112,7 @@ public abstract class WriteSupport<T> {
* @return the information needed to write the file
*/
public WriteContext init(ParquetConfiguration configuration) {
- throw new UnsupportedOperationException("Override
WriteSupport#init(ParquetConfiguration)");
+ return init(ConfigurationUtil.createHadoopConfiguration(configuration));
}
/**