[ 
https://issues.apache.org/jira/browse/HUDI-4369?page=com.atlassian.jira.plugin.system.issuetabpanels:all-tabpanel
 ]

Vishal Agarwal updated HUDI-4369:
---------------------------------
    Description: 
Hi team,

I am trying to use the Hudi sink connector with Kafka Connect to write to a GCS
bucket, but I am getting an error regarding the "gs" file scheme. I have added
all GCS-related properties in core-site.xml and the corresponding gcs-connector
jar in the plugin path, but I am still facing the issue.

The issue was already reported for S3 in Jira
https://issues.apache.org/jira/browse/HUDI-3610, but I am unable to find a
resolution there.

Happy to discuss this!

Thanks


*StackTrace-*

%d [%thread] %-5level %logger - %msg%n 
org.apache.hudi.exception.HoodieException: Fatal error instantiating Hudi Write 
Provider 

 at 
org.apache.hudi.connect.writers.KafkaConnectWriterProvider.<init>(KafkaConnectWriterProvider.java:103)
 ~[connectors-uber.jar:?]

 at 
org.apache.hudi.connect.transaction.ConnectTransactionParticipant.<init>(ConnectTransactionParticipant.java:65)
 ~[connectors-uber.jar:?]

 at org.apache.hudi.connect.HoodieSinkTask.bootstrap(HoodieSinkTask.java:198) 
[connectors-uber.jar:?]

 at org.apache.hudi.connect.HoodieSinkTask.open(HoodieSinkTask.java:151) 
[connectors-uber.jar:?]

 at 
org.apache.kafka.connect.runtime.WorkerSinkTask.openPartitions(WorkerSinkTask.java:587)
 [connect-runtime-2.4.1.jar:?]

 at 
org.apache.kafka.connect.runtime.WorkerSinkTask.access$1100(WorkerSinkTask.java:67)
 [connect-runtime-2.4.1.jar:?]

 at 
org.apache.kafka.connect.runtime.WorkerSinkTask$HandleRebalance.onPartitionsAssigned(WorkerSinkTask.java:652)
 [connect-runtime-2.4.1.jar:?]

 at 
org.apache.kafka.clients.consumer.internals.ConsumerCoordinator.invokePartitionsAssigned(ConsumerCoordinator.java:272)
 [kafka-clients-2.4.1.jar:?]

 at 
org.apache.kafka.clients.consumer.internals.ConsumerCoordinator.onJoinComplete(ConsumerCoordinator.java:400)
 [kafka-clients-2.4.1.jar:?]

 at 
org.apache.kafka.clients.consumer.internals.AbstractCoordinator.joinGroupIfNeeded(AbstractCoordinator.java:421)
 [kafka-clients-2.4.1.jar:?]

 at 
org.apache.kafka.clients.consumer.internals.AbstractCoordinator.ensureActiveGroup(AbstractCoordinator.java:340)
 [kafka-clients-2.4.1.jar:?]

 at 
org.apache.kafka.clients.consumer.internals.ConsumerCoordinator.poll(ConsumerCoordinator.java:471)
 [kafka-clients-2.4.1.jar:?]

 at 
org.apache.kafka.clients.consumer.KafkaConsumer.updateAssignmentMetadataIfNeeded(KafkaConsumer.java:1267)
 [kafka-clients-2.4.1.jar:?]

 at 
org.apache.kafka.clients.consumer.KafkaConsumer.poll(KafkaConsumer.java:1231) 
[kafka-clients-2.4.1.jar:?]

 at 
org.apache.kafka.clients.consumer.KafkaConsumer.poll(KafkaConsumer.java:1211) 
[kafka-clients-2.4.1.jar:?]

 at 
org.apache.kafka.connect.runtime.WorkerSinkTask.pollConsumer(WorkerSinkTask.java:444)
 [connect-runtime-2.4.1.jar:?]

 at 
org.apache.kafka.connect.runtime.WorkerSinkTask.poll(WorkerSinkTask.java:317) 
[connect-runtime-2.4.1.jar:?]

 at 
org.apache.kafka.connect.runtime.WorkerSinkTask.iteration(WorkerSinkTask.java:224)
 [connect-runtime-2.4.1.jar:?]

 at 
org.apache.kafka.connect.runtime.WorkerSinkTask.execute(WorkerSinkTask.java:192)
 [connect-runtime-2.4.1.jar:?]

 at org.apache.kafka.connect.runtime.WorkerTask.doRun(WorkerTask.java:177) 
[connect-runtime-2.4.1.jar:?]

 at org.apache.kafka.connect.runtime.WorkerTask.run(WorkerTask.java:227) 
[connect-runtime-2.4.1.jar:?]

 at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:511) 
[?:1.8.0_331]

 at java.util.concurrent.FutureTask.run(FutureTask.java:266) [?:1.8.0_331]

 at 
java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149) 
[?:1.8.0_331]

 at 
java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624) 
[?:1.8.0_331]

 at java.lang.Thread.run(Thread.java:750) [?:1.8.0_331]

Caused by: org.apache.hudi.exception.HoodieIOException: Failed to get instance 
of org.apache.hadoop.fs.FileSystem

 at org.apache.hudi.common.fs.FSUtils.getFs(FSUtils.java:109) 
~[connectors-uber.jar:?]

 at org.apache.hudi.common.fs.FSUtils.getFs(FSUtils.java:100) 
~[connectors-uber.jar:?]

 at org.apache.hudi.client.BaseHoodieClient.<init>(BaseHoodieClient.java:69) 
~[connectors-uber.jar:?]

 at 
org.apache.hudi.client.BaseHoodieWriteClient.<init>(BaseHoodieWriteClient.java:175)
 ~[connectors-uber.jar:?]

 at 
org.apache.hudi.client.BaseHoodieWriteClient.<init>(BaseHoodieWriteClient.java:160)
 ~[connectors-uber.jar:?]

 at 
org.apache.hudi.client.HoodieJavaWriteClient.<init>(HoodieJavaWriteClient.java:55)
 ~[connectors-uber.jar:?]

 at 
org.apache.hudi.connect.writers.KafkaConnectWriterProvider.<init>(KafkaConnectWriterProvider.java:101)
 ~[connectors-uber.jar:?]

 ... 25 more

Caused by: org.apache.hadoop.fs.UnsupportedFileSystemException: No FileSystem 
for scheme "gs"

 at org.apache.hadoop.fs.FileSystem.getFileSystemClass(FileSystem.java:3225) 
~[connectors-uber.jar:?]

 at org.apache.hadoop.fs.FileSystem.createFileSystem(FileSystem.java:3245) 
~[connectors-uber.jar:?]

 at org.apache.hadoop.fs.FileSystem.access$200(FileSystem.java:121) 
~[connectors-uber.jar:?]

 at org.apache.hadoop.fs.FileSystem$Cache.getInternal(FileSystem.java:3296) 
~[connectors-uber.jar:?]

 at org.apache.hadoop.fs.FileSystem$Cache.get(FileSystem.java:3264) 
~[connectors-uber.jar:?]

 at org.apache.hadoop.fs.FileSystem.get(FileSystem.java:475) 
~[connectors-uber.jar:?]

 at org.apache.hadoop.fs.Path.getFileSystem(Path.java:356) 
~[connectors-uber.jar:?]

 at org.apache.hudi.common.fs.FSUtils.getFs(FSUtils.java:107) 
~[connectors-uber.jar:?]

 at org.apache.hudi.common.fs.FSUtils.getFs(FSUtils.java:100) 
~[connectors-uber.jar:?]

 at org.apache.hudi.client.BaseHoodieClient.<init>(BaseHoodieClient.java:69) 
~[connectors-uber.jar:?]

 at 
org.apache.hudi.client.BaseHoodieWriteClient.<init>(BaseHoodieWriteClient.java:175)
 ~[connectors-uber.jar:?]

 at 
org.apache.hudi.client.BaseHoodieWriteClient.<init>(BaseHoodieWriteClient.java:160)
 ~[connectors-uber.jar:?]

 at 
org.apache.hudi.client.HoodieJavaWriteClient.<init>(HoodieJavaWriteClient.java:55)
 ~[connectors-uber.jar:?]

 at 
org.apache.hudi.connect.writers.KafkaConnectWriterProvider.<init>(KafkaConnectWriterProvider.java:101)
 ~[connectors-uber.jar:?]

 ... 25 more

> Hudi Kafka Connect Sink writing to GCS bucket
> ---------------------------------------------
>
>                 Key: HUDI-4369
>                 URL: https://issues.apache.org/jira/browse/HUDI-4369
>             Project: Apache Hudi
>          Issue Type: Bug
>          Components: kafka-connect
>            Reporter: Vishal Agarwal
>            Priority: Critical
>
> Hi team,
> I am trying to use the Hudi sink connector with Kafka Connect to write to a
> GCS bucket, but I am getting an error regarding the "gs" file scheme. I have
> added all GCS-related properties in core-site.xml and the corresponding
> gcs-connector jar in the plugin path, but I am still facing the issue.
> The issue was already reported for S3 in Jira
> https://issues.apache.org/jira/browse/HUDI-3610, but I am unable to find a
> resolution there.
> Happy to discuss this!
> Thanks
> *StackTrace-*
> %d [%thread] %-5level %logger - %msg%n 
> org.apache.hudi.exception.HoodieException: Fatal error instantiating Hudi 
> Write Provider 
>  at 
> org.apache.hudi.connect.writers.KafkaConnectWriterProvider.<init>(KafkaConnectWriterProvider.java:103)
>  ~[connectors-uber.jar:?]
>  at 
> org.apache.hudi.connect.transaction.ConnectTransactionParticipant.<init>(ConnectTransactionParticipant.java:65)
>  ~[connectors-uber.jar:?]
>  at org.apache.hudi.connect.HoodieSinkTask.bootstrap(HoodieSinkTask.java:198) 
> [connectors-uber.jar:?]
>  at org.apache.hudi.connect.HoodieSinkTask.open(HoodieSinkTask.java:151) 
> [connectors-uber.jar:?]
>  at 
> org.apache.kafka.connect.runtime.WorkerSinkTask.openPartitions(WorkerSinkTask.java:587)
>  [connect-runtime-2.4.1.jar:?]
>  at 
> org.apache.kafka.connect.runtime.WorkerSinkTask.access$1100(WorkerSinkTask.java:67)
>  [connect-runtime-2.4.1.jar:?]
>  at 
> org.apache.kafka.connect.runtime.WorkerSinkTask$HandleRebalance.onPartitionsAssigned(WorkerSinkTask.java:652)
>  [connect-runtime-2.4.1.jar:?]
>  at 
> org.apache.kafka.clients.consumer.internals.ConsumerCoordinator.invokePartitionsAssigned(ConsumerCoordinator.java:272)
>  [kafka-clients-2.4.1.jar:?]
>  at 
> org.apache.kafka.clients.consumer.internals.ConsumerCoordinator.onJoinComplete(ConsumerCoordinator.java:400)
>  [kafka-clients-2.4.1.jar:?]
>  at 
> org.apache.kafka.clients.consumer.internals.AbstractCoordinator.joinGroupIfNeeded(AbstractCoordinator.java:421)
>  [kafka-clients-2.4.1.jar:?]
>  at 
> org.apache.kafka.clients.consumer.internals.AbstractCoordinator.ensureActiveGroup(AbstractCoordinator.java:340)
>  [kafka-clients-2.4.1.jar:?]
>  at 
> org.apache.kafka.clients.consumer.internals.ConsumerCoordinator.poll(ConsumerCoordinator.java:471)
>  [kafka-clients-2.4.1.jar:?]
>  at 
> org.apache.kafka.clients.consumer.KafkaConsumer.updateAssignmentMetadataIfNeeded(KafkaConsumer.java:1267)
>  [kafka-clients-2.4.1.jar:?]
>  at 
> org.apache.kafka.clients.consumer.KafkaConsumer.poll(KafkaConsumer.java:1231) 
> [kafka-clients-2.4.1.jar:?]
>  at 
> org.apache.kafka.clients.consumer.KafkaConsumer.poll(KafkaConsumer.java:1211) 
> [kafka-clients-2.4.1.jar:?]
>  at 
> org.apache.kafka.connect.runtime.WorkerSinkTask.pollConsumer(WorkerSinkTask.java:444)
>  [connect-runtime-2.4.1.jar:?]
>  at 
> org.apache.kafka.connect.runtime.WorkerSinkTask.poll(WorkerSinkTask.java:317) 
> [connect-runtime-2.4.1.jar:?]
>  at 
> org.apache.kafka.connect.runtime.WorkerSinkTask.iteration(WorkerSinkTask.java:224)
>  [connect-runtime-2.4.1.jar:?]
>  at 
> org.apache.kafka.connect.runtime.WorkerSinkTask.execute(WorkerSinkTask.java:192)
>  [connect-runtime-2.4.1.jar:?]
>  at org.apache.kafka.connect.runtime.WorkerTask.doRun(WorkerTask.java:177) 
> [connect-runtime-2.4.1.jar:?]
>  at org.apache.kafka.connect.runtime.WorkerTask.run(WorkerTask.java:227) 
> [connect-runtime-2.4.1.jar:?]
>  at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:511) 
> [?:1.8.0_331]
>  at java.util.concurrent.FutureTask.run(FutureTask.java:266) [?:1.8.0_331]
>  at 
> java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
>  [?:1.8.0_331]
>  at 
> java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
>  [?:1.8.0_331]
>  at java.lang.Thread.run(Thread.java:750) [?:1.8.0_331]
> Caused by: org.apache.hudi.exception.HoodieIOException: Failed to get 
> instance of org.apache.hadoop.fs.FileSystem
>  at org.apache.hudi.common.fs.FSUtils.getFs(FSUtils.java:109) 
> ~[connectors-uber.jar:?]
>  at org.apache.hudi.common.fs.FSUtils.getFs(FSUtils.java:100) 
> ~[connectors-uber.jar:?]
>  at org.apache.hudi.client.BaseHoodieClient.<init>(BaseHoodieClient.java:69) 
> ~[connectors-uber.jar:?]
>  at 
> org.apache.hudi.client.BaseHoodieWriteClient.<init>(BaseHoodieWriteClient.java:175)
>  ~[connectors-uber.jar:?]
>  at 
> org.apache.hudi.client.BaseHoodieWriteClient.<init>(BaseHoodieWriteClient.java:160)
>  ~[connectors-uber.jar:?]
>  at 
> org.apache.hudi.client.HoodieJavaWriteClient.<init>(HoodieJavaWriteClient.java:55)
>  ~[connectors-uber.jar:?]
>  at 
> org.apache.hudi.connect.writers.KafkaConnectWriterProvider.<init>(KafkaConnectWriterProvider.java:101)
>  ~[connectors-uber.jar:?]
>  ... 25 more
> Caused by: org.apache.hadoop.fs.UnsupportedFileSystemException: No FileSystem 
> for scheme "gs"
>  at org.apache.hadoop.fs.FileSystem.getFileSystemClass(FileSystem.java:3225) 
> ~[connectors-uber.jar:?]
>  at org.apache.hadoop.fs.FileSystem.createFileSystem(FileSystem.java:3245) 
> ~[connectors-uber.jar:?]
>  at org.apache.hadoop.fs.FileSystem.access$200(FileSystem.java:121) 
> ~[connectors-uber.jar:?]
>  at org.apache.hadoop.fs.FileSystem$Cache.getInternal(FileSystem.java:3296) 
> ~[connectors-uber.jar:?]
>  at org.apache.hadoop.fs.FileSystem$Cache.get(FileSystem.java:3264) 
> ~[connectors-uber.jar:?]
>  at org.apache.hadoop.fs.FileSystem.get(FileSystem.java:475) 
> ~[connectors-uber.jar:?]
>  at org.apache.hadoop.fs.Path.getFileSystem(Path.java:356) 
> ~[connectors-uber.jar:?]
>  at org.apache.hudi.common.fs.FSUtils.getFs(FSUtils.java:107) 
> ~[connectors-uber.jar:?]
>  at org.apache.hudi.common.fs.FSUtils.getFs(FSUtils.java:100) 
> ~[connectors-uber.jar:?]
>  at org.apache.hudi.client.BaseHoodieClient.<init>(BaseHoodieClient.java:69) 
> ~[connectors-uber.jar:?]
>  at 
> org.apache.hudi.client.BaseHoodieWriteClient.<init>(BaseHoodieWriteClient.java:175)
>  ~[connectors-uber.jar:?]
>  at 
> org.apache.hudi.client.BaseHoodieWriteClient.<init>(BaseHoodieWriteClient.java:160)
>  ~[connectors-uber.jar:?]
>  at 
> org.apache.hudi.client.HoodieJavaWriteClient.<init>(HoodieJavaWriteClient.java:55)
>  ~[connectors-uber.jar:?]
>  at 
> org.apache.hudi.connect.writers.KafkaConnectWriterProvider.<init>(KafkaConnectWriterProvider.java:101)
>  ~[connectors-uber.jar:?]
>  ... 25 more



--
This message was sent by Atlassian Jira
(v8.20.10#820010)

Reply via email to