[
https://issues.apache.org/jira/browse/DRILL-7853?page=com.atlassian.jira.plugin.system.issuetabpanels:all-tabpanel
]
Nick Venenga updated DRILL-7853:
--------------------------------
Description:
Exception when attempting to parse strings to timestamp using logRegex
{noformat}
$ tree data
data
└── 2021
└── 01
└── 20
└── sample.log.gz
{noformat}
{code:java}
{
"type": "file",
"connection": "file:///",
"config": {},
"workspaces": {
"tmp": {
"location": "/tmp",
"writable": true,
"defaultInputFormat": null,
"allowAccessOutsideWorkspace": false
},
"root": {
"location": "/data",
"writable": false,
"defaultInputFormat": null,
"allowAccessOutsideWorkspace": false
}
},
"formats": {
"log": {
"type": "logRegex",
"regex": "([^ ]*) ([^ ]*) ([^ ]*) ([^ ]*):([0-9]*) ([^ ]*)[:-]([0-9]*)
([-.0-9]*) ([-.0-9]*) ([-.0-9]*) (|[-0-9]*) (-|[-0-9]*) ([-0-9]*) ([-0-9]*)
\"([^ ]*) ([^ ]*) (- |[^ ]*)\" \"([^\"]*)\" ([A-Z0-9-]+) ([A-Za-z0-9.-]*) ([^
]*) \"([^\"]*)\" \"([^\"]*)\" \"([^\"]*)\" ([-.0-9]*) ([^ ]*) \"([^\"]*)\"($|
\"[^ ]*\")(.*)",
"extension": "gz",
"maxErrors": 10,
"schema": [
{
"fieldName": "type"
},
{
"fieldName": "time",
"fieldType": "TIMESTAMP",
"format": "yyyy-MM-dd''T''HH:mm:ssZ"
},
{
"fieldName": "elb"
},
{
"fieldName": "client_ip"
},
{
"fieldName": "client_port",
"fieldType": "INT"
},
{
"fieldName": "target_ip"
},
{
"fieldName": "target_port",
"fieldType": "INT"
},
{
"fieldName": "request_processing_time",
"fieldType": "FLOAT8"
},
{
"fieldName": "target_processing_time",
"fieldType": "FLOAT8"
},
{
"fieldName": "response_processing_time",
"fieldType": "FLOAT8"
},
{
"fieldName": "elb_status_code"
},
{
"fieldName": "target_status_code"
},
{
"fieldName": "received_bytes",
"fieldType": "BIGINT"
},
{
"fieldName": "sent_bytes",
"fieldType": "BIGINT"
},
{
"fieldName": "request_verb"
},
{
"fieldName": "request_url"
},
{
"fieldName": "request_proto"
},
{
"fieldName": "user_agent"
},
{
"fieldName": "ssl_cipher"
},
{
"fieldName": "ssl_protocol"
},
{
"fieldName": "target_group_arn"
},
{
"fieldName": "trace_id"
},
{
"fieldName": "domain_name"
},
{
"fieldName": "chosen_cert_arn"
},
{
"fieldName": "matched_rule_priority"
},
{
"fieldName": "request_creation_time"
},
{
"fieldName": "actions_executed"
},
{
"fieldName": "redirect_url"
},
{
"fieldName": "new_field"
}
]
}
},
"enabled": true
}
{code}
{noformat}
apache drill> select * from dfs.root.`2021` limit 5;
{noformat}
{noformat}
Caused by: java.lang.IllegalStateException: java.lang.NoSuchMethodException:
org.apache.drill.exec.physical.impl.scan.convert.ConvertStringToTimeStamp.<init>(org.apache.drill.exec.vector.accessor.ScalarWriter)
at
org.apache.drill.exec.physical.impl.scan.convert.StandardConversions.newInstance(StandardConversions.java:197)
at
org.apache.drill.exec.physical.impl.scan.convert.StandardConversions.newInstance(StandardConversions.java:188)
at
org.apache.drill.exec.physical.impl.scan.convert.StandardConversions.converterFor(StandardConversions.java:429)
at
org.apache.drill.exec.physical.impl.scan.convert.StandardConversions.converterFor(StandardConversions.java:446)
at
org.apache.drill.exec.store.log.LogBatchReader$ScalarGroupWriter.<init>(LogBatchReader.java:93)
at
org.apache.drill.exec.store.log.LogBatchReader.bindColumns(LogBatchReader.java:184)
at
org.apache.drill.exec.store.log.LogBatchReader.open(LogBatchReader.java:148)
at
org.apache.drill.exec.store.log.LogBatchReader.open(LogBatchReader.java:44)
at
org.apache.drill.exec.physical.impl.scan.framework.ManagedScanFramework.open(ManagedScanFramework.java:208)
at
org.apache.drill.exec.physical.impl.scan.file.FileScanFramework.open(FileScanFramework.java:268)
at
org.apache.drill.exec.physical.impl.scan.framework.ShimBatchReader.open(ShimBatchReader.java:75)
at
org.apache.drill.exec.physical.impl.scan.ReaderState.open(ReaderState.java:229)
at
org.apache.drill.exec.physical.impl.scan.ScanOperatorExec.nextAction(ScanOperatorExec.java:273)
at
org.apache.drill.exec.physical.impl.scan.ScanOperatorExec.next(ScanOperatorExec.java:229)
at
org.apache.drill.exec.physical.impl.protocol.OperatorDriver.doNext(OperatorDriver.java:201)
at
org.apache.drill.exec.physical.impl.protocol.OperatorDriver.start(OperatorDriver.java:179)
at
org.apache.drill.exec.physical.impl.protocol.OperatorDriver.next(OperatorDriver.java:129)
at
org.apache.drill.exec.physical.impl.protocol.OperatorRecordBatch.next(OperatorRecordBatch.java:149)
at
org.apache.drill.exec.record.AbstractRecordBatch.next(AbstractRecordBatch.java:119)
at
org.apache.drill.exec.record.AbstractRecordBatch.next(AbstractRecordBatch.java:111)
at
org.apache.drill.exec.record.AbstractUnaryRecordBatch.innerNext(AbstractUnaryRecordBatch.java:59)
at
org.apache.drill.exec.physical.impl.limit.LimitRecordBatch.innerNext(LimitRecordBatch.java:93)
at
org.apache.drill.exec.record.AbstractRecordBatch.next(AbstractRecordBatch.java:170)
at
org.apache.drill.exec.record.AbstractRecordBatch.next(AbstractRecordBatch.java:119)
at
org.apache.drill.exec.record.AbstractRecordBatch.next(AbstractRecordBatch.java:111)
at
org.apache.drill.exec.record.AbstractUnaryRecordBatch.innerNext(AbstractUnaryRecordBatch.java:59)
at
org.apache.drill.exec.record.AbstractRecordBatch.next(AbstractRecordBatch.java:170)
at
org.apache.drill.exec.physical.impl.BaseRootExec.next(BaseRootExec.java:103)
at
org.apache.drill.exec.physical.impl.SingleSenderCreator$SingleSenderRootExec.innerNext(SingleSenderCreator.java:87)
at
org.apache.drill.exec.physical.impl.BaseRootExec.next(BaseRootExec.java:93)
at
org.apache.drill.exec.work.fragment.FragmentExecutor$1.run(FragmentExecutor.java:323)
at
org.apache.drill.exec.work.fragment.FragmentExecutor$1.run(FragmentExecutor.java:310)
at .......(:0) at
org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1730)
at
org.apache.drill.exec.work.fragment.FragmentExecutor.run(FragmentExecutor.java:310)
at
org.apache.drill.common.SelfCleaningRunnable.run(SelfCleaningRunnable.java:38)
at .......(:0)Caused by: java.lang.NoSuchMethodException:
org.apache.drill.exec.physical.impl.scan.convert.ConvertStringToTimeStamp.<init>(org.apache.drill.exec.vector.accessor.ScalarWriter)
at .......(:0) at
org.apache.drill.exec.physical.impl.scan.convert.StandardConversions.newInstance(StandardConversions.java:194)
... 36 common frames omitted{noformat}
was:
Exception when attempting to parse strings to timestamp using logRegex
{noformat}
$ tree data
data
└── 2021
└── 01
└── 20
└── sample.log.gz
{noformat}
{code:java}
{
"type": "file",
"connection": "file:///",
"config": {},
"workspaces": {
"tmp": {
"location": "/tmp",
"writable": true,
"defaultInputFormat": null,
"allowAccessOutsideWorkspace": false
},
"root": {
"location": "/data",
"writable": false,
"defaultInputFormat": null,
"allowAccessOutsideWorkspace": false
}
},
"formats": {
"log": {
"type": "logRegex",
"regex": "([^ ]*) ([^ ]*) ([^ ]*) ([^ ]*):([0-9]*) ([^ ]*)[:-]([0-9]*)
([-.0-9]*) ([-.0-9]*) ([-.0-9]*) (|[-0-9]*) (-|[-0-9]*) ([-0-9]*) ([-0-9]*)
\"([^ ]*) ([^ ]*) (- |[^ ]*)\" \"([^\"]*)\" ([A-Z0-9-]+) ([A-Za-z0-9.-]*) ([^
]*) \"([^\"]*)\" \"([^\"]*)\" \"([^\"]*)\" ([-.0-9]*) ([^ ]*) \"([^\"]*)\"($|
\"[^ ]*\")(.*)",
"extension": "gz",
"maxErrors": 10,
"schema": [
{
"fieldName": "type"
},
{
"fieldName": "time",
"fieldType": "TIMESTAMP",
"format": "yyyy-MM-dd''T''HH:mm:ssZ"
},
{
"fieldName": "elb"
},
{
"fieldName": "client_ip"
},
{
"fieldName": "client_port",
"fieldType": "INT"
},
{
"fieldName": "target_ip"
},
{
"fieldName": "target_port",
"fieldType": "INT"
},
{
"fieldName": "request_processing_time",
"fieldType": "FLOAT8"
},
{
"fieldName": "target_processing_time",
"fieldType": "FLOAT8"
},
{
"fieldName": "response_processing_time",
"fieldType": "FLOAT8"
},
{
"fieldName": "elb_status_code"
},
{
"fieldName": "target_status_code"
},
{
"fieldName": "received_bytes",
"fieldType": "BIGINT"
},
{
"fieldName": "sent_bytes",
"fieldType": "BIGINT"
},
{
"fieldName": "request_verb"
},
{
"fieldName": "request_url"
},
{
"fieldName": "request_proto"
},
{
"fieldName": "user_agent"
},
{
"fieldName": "ssl_cipher"
},
{
"fieldName": "ssl_protocol"
},
{
"fieldName": "target_group_arn"
},
{
"fieldName": "trace_id"
},
{
"fieldName": "domain_name"
},
{
"fieldName": "chosen_cert_arn"
},
{
"fieldName": "matched_rule_priority"
},
{
"fieldName": "request_creation_time"
},
{
"fieldName": "actions_executed"
},
{
"fieldName": "redirect_url"
},
{
"fieldName": "new_field"
}
]
}
},
"enabled": true
}
{code}
{noformat}
apache drill> select * from dfs.root.`2021` limit 5;
{noformat}
> java.lang.NoSuchMethodException:
> org.apache.drill.exec.physical.impl.scan.convert.ConvertStringToTimeStamp.<init>(org.apache.drill.exec.vector.accessor.ScalarWriter)
> ---------------------------------------------------------------------------------------------------------------------------------------------------------------------
>
> Key: DRILL-7853
> URL: https://issues.apache.org/jira/browse/DRILL-7853
> Project: Apache Drill
> Issue Type: Bug
> Affects Versions: 1.18.0
> Reporter: Nick Venenga
> Priority: Major
> Attachments: sample.log.gz
>
>
> Exception when attempting to parse strings to timestamp using logRegex
>
> {noformat}
> $ tree data
> data
> └── 2021
> └── 01
> └── 20
> └── sample.log.gz
> {noformat}
> {code:java}
> {
> "type": "file",
> "connection": "file:///",
> "config": {},
> "workspaces": {
> "tmp": {
> "location": "/tmp",
> "writable": true,
> "defaultInputFormat": null,
> "allowAccessOutsideWorkspace": false
> },
> "root": {
> "location": "/data",
> "writable": false,
> "defaultInputFormat": null,
> "allowAccessOutsideWorkspace": false
> }
> },
> "formats": {
> "log": {
> "type": "logRegex",
> "regex": "([^ ]*) ([^ ]*) ([^ ]*) ([^ ]*):([0-9]*) ([^ ]*)[:-]([0-9]*)
> ([-.0-9]*) ([-.0-9]*) ([-.0-9]*) (|[-0-9]*) (-|[-0-9]*) ([-0-9]*) ([-0-9]*)
> \"([^ ]*) ([^ ]*) (- |[^ ]*)\" \"([^\"]*)\" ([A-Z0-9-]+) ([A-Za-z0-9.-]*) ([^
> ]*) \"([^\"]*)\" \"([^\"]*)\" \"([^\"]*)\" ([-.0-9]*) ([^ ]*) \"([^\"]*)\"($|
> \"[^ ]*\")(.*)",
> "extension": "gz",
> "maxErrors": 10,
> "schema": [
> {
> "fieldName": "type"
> },
> {
> "fieldName": "time",
> "fieldType": "TIMESTAMP",
> "format": "yyyy-MM-dd''T''HH:mm:ssZ"
> },
> {
> "fieldName": "elb"
> },
> {
> "fieldName": "client_ip"
> },
> {
> "fieldName": "client_port",
> "fieldType": "INT"
> },
> {
> "fieldName": "target_ip"
> },
> {
> "fieldName": "target_port",
> "fieldType": "INT"
> },
> {
> "fieldName": "request_processing_time",
> "fieldType": "FLOAT8"
> },
> {
> "fieldName": "target_processing_time",
> "fieldType": "FLOAT8"
> },
> {
> "fieldName": "response_processing_time",
> "fieldType": "FLOAT8"
> },
> {
> "fieldName": "elb_status_code"
> },
> {
> "fieldName": "target_status_code"
> },
> {
> "fieldName": "received_bytes",
> "fieldType": "BIGINT"
> },
> {
> "fieldName": "sent_bytes",
> "fieldType": "BIGINT"
> },
> {
> "fieldName": "request_verb"
> },
> {
> "fieldName": "request_url"
> },
> {
> "fieldName": "request_proto"
> },
> {
> "fieldName": "user_agent"
> },
> {
> "fieldName": "ssl_cipher"
> },
> {
> "fieldName": "ssl_protocol"
> },
> {
> "fieldName": "target_group_arn"
> },
> {
> "fieldName": "trace_id"
> },
> {
> "fieldName": "domain_name"
> },
> {
> "fieldName": "chosen_cert_arn"
> },
> {
> "fieldName": "matched_rule_priority"
> },
> {
> "fieldName": "request_creation_time"
> },
> {
> "fieldName": "actions_executed"
> },
> {
> "fieldName": "redirect_url"
> },
> {
> "fieldName": "new_field"
> }
> ]
> }
> },
> "enabled": true
> }
> {code}
> {noformat}
> apache drill> select * from dfs.root.`2021` limit 5;
> {noformat}
>
> {noformat}
> Caused by: java.lang.IllegalStateException: java.lang.NoSuchMethodException:
> org.apache.drill.exec.physical.impl.scan.convert.ConvertStringToTimeStamp.<init>(org.apache.drill.exec.vector.accessor.ScalarWriter)
>
> at
> org.apache.drill.exec.physical.impl.scan.convert.StandardConversions.newInstance(StandardConversions.java:197)
> at
> org.apache.drill.exec.physical.impl.scan.convert.StandardConversions.newInstance(StandardConversions.java:188)
>
>
> at
> org.apache.drill.exec.physical.impl.scan.convert.StandardConversions.converterFor(StandardConversions.java:429)
>
>
> at
> org.apache.drill.exec.physical.impl.scan.convert.StandardConversions.converterFor(StandardConversions.java:446)
>
>
> at
> org.apache.drill.exec.store.log.LogBatchReader$ScalarGroupWriter.<init>(LogBatchReader.java:93)
>
>
> at
> org.apache.drill.exec.store.log.LogBatchReader.bindColumns(LogBatchReader.java:184)
>
>
>
> at
> org.apache.drill.exec.store.log.LogBatchReader.open(LogBatchReader.java:148)
>
>
>
> at
> org.apache.drill.exec.store.log.LogBatchReader.open(LogBatchReader.java:44)
>
>
>
> at
> org.apache.drill.exec.physical.impl.scan.framework.ManagedScanFramework.open(ManagedScanFramework.java:208)
>
>
> at
> org.apache.drill.exec.physical.impl.scan.file.FileScanFramework.open(FileScanFramework.java:268)
>
>
> at
> org.apache.drill.exec.physical.impl.scan.framework.ShimBatchReader.open(ShimBatchReader.java:75)
>
>
> at
> org.apache.drill.exec.physical.impl.scan.ReaderState.open(ReaderState.java:229)
>
>
>
> at
> org.apache.drill.exec.physical.impl.scan.ScanOperatorExec.nextAction(ScanOperatorExec.java:273)
>
>
> at
> org.apache.drill.exec.physical.impl.scan.ScanOperatorExec.next(ScanOperatorExec.java:229)
>
>
> at
> org.apache.drill.exec.physical.impl.protocol.OperatorDriver.doNext(OperatorDriver.java:201)
> at
> org.apache.drill.exec.physical.impl.protocol.OperatorDriver.start(OperatorDriver.java:179)
>
>
> at
> org.apache.drill.exec.physical.impl.protocol.OperatorDriver.next(OperatorDriver.java:129)
>
>
> at
> org.apache.drill.exec.physical.impl.protocol.OperatorRecordBatch.next(OperatorRecordBatch.java:149)
>
>
> at
> org.apache.drill.exec.record.AbstractRecordBatch.next(AbstractRecordBatch.java:119)
> at
> org.apache.drill.exec.record.AbstractRecordBatch.next(AbstractRecordBatch.java:111)
> at
> org.apache.drill.exec.record.AbstractUnaryRecordBatch.innerNext(AbstractUnaryRecordBatch.java:59)
> at
> org.apache.drill.exec.physical.impl.limit.LimitRecordBatch.innerNext(LimitRecordBatch.java:93)
> at
> org.apache.drill.exec.record.AbstractRecordBatch.next(AbstractRecordBatch.java:170)
> at
> org.apache.drill.exec.record.AbstractRecordBatch.next(AbstractRecordBatch.java:119)
> at
> org.apache.drill.exec.record.AbstractRecordBatch.next(AbstractRecordBatch.java:111)
> at
> org.apache.drill.exec.record.AbstractUnaryRecordBatch.innerNext(AbstractUnaryRecordBatch.java:59)
> at
> org.apache.drill.exec.record.AbstractRecordBatch.next(AbstractRecordBatch.java:170)
> at
> org.apache.drill.exec.physical.impl.BaseRootExec.next(BaseRootExec.java:103)
> at
> org.apache.drill.exec.physical.impl.SingleSenderCreator$SingleSenderRootExec.innerNext(SingleSenderCreator.java:87)
> at
> org.apache.drill.exec.physical.impl.BaseRootExec.next(BaseRootExec.java:93)
> at
> org.apache.drill.exec.work.fragment.FragmentExecutor$1.run(FragmentExecutor.java:323)
> at
> org.apache.drill.exec.work.fragment.FragmentExecutor$1.run(FragmentExecutor.java:310)
> at .......(:0) at
> org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1730)
> at
> org.apache.drill.exec.work.fragment.FragmentExecutor.run(FragmentExecutor.java:310)
> at
> org.apache.drill.common.SelfCleaningRunnable.run(SelfCleaningRunnable.java:38)
> at .......(:0)Caused by: java.lang.NoSuchMethodException:
> org.apache.drill.exec.physical.impl.scan.convert.ConvertStringToTimeStamp.<init>(org.apache.drill.exec.vector.accessor.ScalarWriter)
> at .......(:0) at
> org.apache.drill.exec.physical.impl.scan.convert.StandardConversions.newInstance(StandardConversions.java:194)
> ... 36 common frames omitted{noformat}
--
This message was sent by Atlassian Jira
(v8.3.4#803005)