[
https://issues.apache.org/jira/browse/HIVE-27669?page=com.atlassian.jira.plugin.system.issuetabpanels:all-tabpanel
]
Work on HIVE-27669 started by Harshal Patel.
--------------------------------------------
> Hive Acid CTAS fails incremental if no of rows inserted is > INT_MAX
> --------------------------------------------------------------------
>
> Key: HIVE-27669
> URL: https://issues.apache.org/jira/browse/HIVE-27669
> Project: Hive
> Issue Type: Bug
> Reporter: Harshal Patel
> Assignee: Harshal Patel
> Priority: Major
>
> * If a table is created using CTAS with more than INT_MAX rows, beeline
> swallows the thrown error.
> * Since replication uses the same infrastructure, it should do the same
> instead of failing with a NumberFormatException.
> *Note:* This happens consistently in the customer's environment, but we
> have not been able to reproduce it. We have therefore gone through the whole
> code flow and handled the error accordingly.
>
> Error message during incremental replication:
> {code:java}
> 4:12:03.230 PM INFO Driver [Scheduled Query
> Executor(schedule:repl_sample_acid_1, execution_id:49625)]: Starting task
> [Stage-10066:REPL_STATE_LOG] in serial mode4:12:03.231 PM INFO
> ReplState [Scheduled Query Executor(schedule:repl_sample_acid_1,
> execution_id:49625)]: REPL::EVENT_LOAD:
> {"dbName":"sample","eventId":"50442182","eventType":"EVENT_ALLOC_WRITE_ID","eventsLoadProgress":"2443/20424","loadTime":1687187523,"eventDuration":"159
> ms"}4:12:03.231 PM INFO Driver [Scheduled Query
> Executor(schedule:repl_sample_acid_1, execution_id:49625)]: Starting task
> [Stage-10067:COLUMNSTATS] in serial mode4:12:03.488 PM INFO Driver
> [Scheduled Query Executor(schedule:repl_sample_acid_1, execution_id:49625)]:
> Starting task [Stage-10068:DEPENDENCY_COLLECTION] in serial mode4:12:03.488
> PM INFO Driver [Scheduled Query Executor(schedule:repl_sample_acid_1,
> execution_id:49625)]: Starting task [Stage-10069:DDL] in serial
> mode4:12:03.504 PM INFO Driver [Scheduled Query
> Executor(schedule:repl_sample_acid_1, execution_id:49625)]: Starting task
> [Stage-10070:REPL_STATE_LOG] in serial mode4:12:03.504 PM INFO
> ReplState [Scheduled Query Executor(schedule:repl_sample_acid_1,
> execution_id:49625)]: REPL::EVENT_LOAD:
> {"dbName":"sample","eventId":"50442183","eventType":"EVENT_UPDATE_TABLE_COL_STAT","eventsLoadProgress":"2444/20424","loadTime":1687187523,"eventDuration":"273
> ms"}4:12:03.504 PM INFO Driver [Scheduled Query
> Executor(schedule:repl_sample_acid_1, execution_id:49625)]: Starting task
> [Stage-10071:DDL] in serial mode4:12:03.596 PM ERROR Task
> [Scheduled Query Executor(schedule:repl_sample_acid_1, execution_id:49625)]:
> Failedorg.apache.hadoop.hive.ql.metadata.HiveException: Unable to alter
> table. java.lang.NumberFormatException: For input string: "5744479373" at
> org.apache.hadoop.hive.ql.metadata.Hive.alterTable(Hive.java:854)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.ddl.table.create.CreateTableOperation.createTableReplaceMode(CreateTableOperation.java:127)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.ddl.table.create.CreateTableOperation.execute(CreateTableOperation.java:90)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.ddl.DDLTask.execute(DDLTask.java:82)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.exec.Task.executeTask(Task.java:213)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.exec.TaskRunner.runSequential(TaskRunner.java:105)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.Executor.launchTask(Executor.java:357)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.Executor.launchTasks(Executor.java:330)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.Executor.runTasks(Executor.java:246)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.Executor.execute(Executor.java:109)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.Driver.runInternal(Driver.java:772)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.Driver.run(Driver.java:511)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.Driver.run(Driver.java:505)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.reexec.ReExecDriver.run(ReExecDriver.java:166)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.reexec.ReExecDriver.run(ReExecDriver.java:232)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.scheduled.ScheduledQueryExecutionService$ScheduledQueryExecutor.processQuery(ScheduledQueryExecutionService.java:240)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.scheduled.ScheduledQueryExecutionService$ScheduledQueryExecutor.run(ScheduledQueryExecutionService.java:193)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:511)
> ~[?:1.8.0_342] at
> java.util.concurrent.FutureTask.run(FutureTask.java:266) ~[?:1.8.0_342]
> at
> java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
> ~[?:1.8.0_342] at
> java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
> ~[?:1.8.0_342] at java.lang.Thread.run(Thread.java:750)
> ~[?:1.8.0_342]Caused by: org.apache.hadoop.hive.metastore.api.MetaException:
> java.lang.NumberFormatException: For input string: "5744479373" at
> org.apache.hadoop.hive.metastore.api.ThriftHiveMetastore$alter_table_req_result$alter_table_req_resultStandardScheme.read(ThriftHiveMetastore.java)
> ~[hive-standalone-metastore-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.metastore.api.ThriftHiveMetastore$alter_table_req_result$alter_table_req_resultStandardScheme.read(ThriftHiveMetastore.java)
> ~[hive-standalone-metastore-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.metastore.api.ThriftHiveMetastore$alter_table_req_result.read(ThriftHiveMetastore.java)
> ~[hive-standalone-metastore-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5]
> at org.apache.thrift.TServiceClient.receiveBase(TServiceClient.java:88)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.metastore.api.ThriftHiveMetastore$Client.recv_alter_table_req(ThriftHiveMetastore.java:2628)
> ~[hive-standalone-metastore-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.metastore.api.ThriftHiveMetastore$Client.alter_table_req(ThriftHiveMetastore.java:2615)
> ~[hive-standalone-metastore-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5]
> at
> org.apache.hadoop.hive.metastore.HiveMetaStoreClient.alter_table(HiveMetaStoreClient.java:494)
> ~[hive-standalone-metastore-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5]
> at
> org.apache.hadoop.hive.ql.metadata.SessionHiveMetaStoreClient.alter_table(SessionHiveMetaStoreClient.java:447)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> sun.reflect.GeneratedMethodAccessor456.invoke(Unknown Source) ~[?:?] at
> sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)
> ~[?:1.8.0_342] at java.lang.reflect.Method.invoke(Method.java:498)
> ~[?:1.8.0_342] at
> org.apache.hadoop.hive.metastore.RetryingMetaStoreClient.invoke(RetryingMetaStoreClient.java:213)
> ~[hive-standalone-metastore-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5]
> at com.sun.proxy.$Proxy52.alter_table(Unknown Source) ~[?:?] at
> sun.reflect.GeneratedMethodAccessor456.invoke(Unknown Source) ~[?:?] at
> sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)
> ~[?:1.8.0_342] at java.lang.reflect.Method.invoke(Method.java:498)
> ~[?:1.8.0_342] at
> org.apache.hadoop.hive.metastore.HiveMetaStoreClient$SynchronizedHandler.invoke(HiveMetaStoreClient.java:3546)
> ~[hive-standalone-metastore-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5]
> at com.sun.proxy.$Proxy52.alter_table(Unknown Source) ~[?:?] at
> org.apache.hadoop.hive.ql.metadata.Hive.alterTable(Hive.java:850)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] ... 21
> more4:12:03.600 PM ERROR Task [Scheduled Query
> Executor(schedule:repl_sample_acid_1, execution_id:49625)]: DDLTask failed,
> DDL Operation: class
> org.apache.hadoop.hive.ql.ddl.table.create.CreateTableOperationorg.apache.hadoop.hive.ql.metadata.HiveException:
> Unable to alter table. java.lang.NumberFormatException: For input string:
> "5744479373" at
> org.apache.hadoop.hive.ql.metadata.Hive.alterTable(Hive.java:854)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.ddl.table.create.CreateTableOperation.createTableReplaceMode(CreateTableOperation.java:127)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.ddl.table.create.CreateTableOperation.execute(CreateTableOperation.java:90)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.ddl.DDLTask.execute(DDLTask.java:82)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.exec.Task.executeTask(Task.java:213)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.exec.TaskRunner.runSequential(TaskRunner.java:105)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.Executor.launchTask(Executor.java:357)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.Executor.launchTasks(Executor.java:330)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.Executor.runTasks(Executor.java:246)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.Executor.execute(Executor.java:109)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.Driver.runInternal(Driver.java:772)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.Driver.run(Driver.java:511)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.Driver.run(Driver.java:505)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.reexec.ReExecDriver.run(ReExecDriver.java:166)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.reexec.ReExecDriver.run(ReExecDriver.java:232)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.scheduled.ScheduledQueryExecutionService$ScheduledQueryExecutor.processQuery(ScheduledQueryExecutionService.java:240)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.ql.scheduled.ScheduledQueryExecutionService$ScheduledQueryExecutor.run(ScheduledQueryExecutionService.java:193)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:511)
> ~[?:1.8.0_342] at
> java.util.concurrent.FutureTask.run(FutureTask.java:266) ~[?:1.8.0_342]
> at
> java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
> ~[?:1.8.0_342] at
> java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
> ~[?:1.8.0_342] at java.lang.Thread.run(Thread.java:750)
> ~[?:1.8.0_342]Caused by: org.apache.hadoop.hive.metastore.api.MetaException:
> java.lang.NumberFormatException: For input string: "5744479373" at
> org.apache.hadoop.hive.metastore.api.ThriftHiveMetastore$alter_table_req_result$alter_table_req_resultStandardScheme.read(ThriftHiveMetastore.java)
> ~[hive-standalone-metastore-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.metastore.api.ThriftHiveMetastore$alter_table_req_result$alter_table_req_resultStandardScheme.read(ThriftHiveMetastore.java)
> ~[hive-standalone-metastore-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.metastore.api.ThriftHiveMetastore$alter_table_req_result.read(ThriftHiveMetastore.java)
> ~[hive-standalone-metastore-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5]
> at org.apache.thrift.TServiceClient.receiveBase(TServiceClient.java:88)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.metastore.api.ThriftHiveMetastore$Client.recv_alter_table_req(ThriftHiveMetastore.java:2628)
> ~[hive-standalone-metastore-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> org.apache.hadoop.hive.metastore.api.ThriftHiveMetastore$Client.alter_table_req(ThriftHiveMetastore.java:2615)
> ~[hive-standalone-metastore-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5]
> at
> org.apache.hadoop.hive.metastore.HiveMetaStoreClient.alter_table(HiveMetaStoreClient.java:494)
> ~[hive-standalone-metastore-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5]
> at
> org.apache.hadoop.hive.ql.metadata.SessionHiveMetaStoreClient.alter_table(SessionHiveMetaStoreClient.java:447)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] at
> sun.reflect.GeneratedMethodAccessor456.invoke(Unknown Source) ~[?:?] at
> sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)
> ~[?:1.8.0_342] at java.lang.reflect.Method.invoke(Method.java:498)
> ~[?:1.8.0_342] at
> org.apache.hadoop.hive.metastore.RetryingMetaStoreClient.invoke(RetryingMetaStoreClient.java:213)
> ~[hive-standalone-metastore-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5]
> at com.sun.proxy.$Proxy52.alter_table(Unknown Source) ~[?:?] at
> sun.reflect.GeneratedMethodAccessor456.invoke(Unknown Source) ~[?:?] at
> sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)
> ~[?:1.8.0_342] at java.lang.reflect.Method.invoke(Method.java:498)
> ~[?:1.8.0_342] at
> org.apache.hadoop.hive.metastore.HiveMetaStoreClient$SynchronizedHandler.invoke(HiveMetaStoreClient.java:3546)
> ~[hive-standalone-metastore-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5]
> at com.sun.proxy.$Proxy52.alter_table(Unknown Source) ~[?:?] at
> org.apache.hadoop.hive.ql.metadata.Hive.alterTable(Hive.java:850)
> ~[hive-exec-3.1.3000.7.1.8.15-5.jar:3.1.3000.7.1.8.15-5] ... 21
> more4:12:03.681 PM INFO ReplicationMetricCollector [Scheduled
> Query Executor(schedule:repl_sample_acid_1, execution_id:49625)]: End
> FAILED_ADMIN4:12:03.681 PM INFO ReOptimizePlugin [Scheduled
> Query Executor(schedule:repl_sample_acid_1, execution_id:49625)]:
> ReOptimization: retryPossible: false4:12:03.685 PM ERROR Driver [Scheduled
> Query Executor(schedule:repl_sample_acid_1, execution_id:49625)]: FAILED:
> Execution Error, return code 40013 from
> org.apache.hadoop.hive.ql.ddl.DDLTask. Unable to alter table.
> java.lang.NumberFormatException: For input string: "5744479373"4:12:03.686 PM
> INFO Driver [Scheduled Query Executor(schedule:repl_sample_acid_1,
> execution_id:49625)]: Completed executing
> command(queryId=eup1hive_20230619160006_d5a7e666-480f-4f55-a083-5aabcee41711);
> Time taken: 711.336 seconds4:12:03.686 PM INFO Driver [Scheduled
> Query Executor(schedule:repl_sample_acid_1, execution_id:49625)]: OK {code}
>
>
>
--
This message was sent by Atlassian Jira
(v8.20.10#820010)