[
https://issues.apache.org/jira/browse/PHOENIX-2665?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=15138874#comment-15138874
]
Rajeshbabu Chintaguntla commented on PHOENIX-2665:
--------------------------------------------------
Here is the output from the logging I added while reproducing the issue.
{noformat}
+------------------------------------------+------------------------------------------+
| UNSIG_ID | ID
|
+------------------------------------------+------------------------------------------+
Scan :
{"timeRange":[0,1455020959272],"batch":-1,"startRow":"","stopRow":"\\xC2\\x1A\\x03\\x00\\x80\\x03\\xD1\\xA3","loadColumnFamiliesOnDemand":null,"totalColumns":1,"cacheBlocks":true,"families":{"0":["ALL"]},"maxResultSize":2097152,"maxVersions":1,"filter":"FirstKeyOnlyFilter","caching":100}
Scan in staleRegionBoundary:
{"timeRange":[0,1455020959272],"batch":-1,"startRow":"\\x80\\x00\\xC3O\\xC2\\x05d\\x00","stopRow":"\\xC2\\x1A\\x03\\x00\\x80\\x03\\xD1\\xA3","loadColumnFamiliesOnDemand":null,"totalColumns":1,"cacheBlocks":true,"families":{"0":["ALL"]},"maxResultSize":2097152,"maxVersions":1,"filter":"FirstKeyOnlyFilter","caching":100}
java.util.concurrent.ExecutionException:
org.apache.phoenix.schema.StaleRegionBoundaryCacheException: ERROR 1108
(XCL08): Cache of region boundaries are out of date.
at java.util.concurrent.FutureTask.report(FutureTask.java:122)
at java.util.concurrent.FutureTask.get(FutureTask.java:202)
at
org.apache.phoenix.iterate.BaseResultIterators.getIterators(BaseResultIterators.java:570)
at
org.apache.phoenix.iterate.BaseResultIterators.getIterators(BaseResultIterators.java:518)
at
org.apache.phoenix.iterate.BaseResultIterators.getIterators(BaseResultIterators.java:497)
at
org.apache.phoenix.iterate.MergeSortResultIterator.getIterators(MergeSortResultIterator.java:48)
at
org.apache.phoenix.iterate.MergeSortResultIterator.minIterator(MergeSortResultIterator.java:84)
at
org.apache.phoenix.iterate.MergeSortResultIterator.next(MergeSortResultIterator.java:111)
at
org.apache.phoenix.iterate.BaseGroupedAggregatingResultIterator.next(BaseGroupedAggregatingResultIterator.java:64)
at
org.apache.phoenix.jdbc.PhoenixResultSet.next(PhoenixResultSet.java:765)
at sqlline.IncrementalRows.hasNext(IncrementalRows.java:62)
at sqlline.TableOutputFormat.print(TableOutputFormat.java:33)
at sqlline.SqlLine.print(SqlLine.java:1653)
at sqlline.Commands.execute(Commands.java:833)
at sqlline.Commands.sql(Commands.java:732)
at sqlline.SqlLine.dispatch(SqlLine.java:808)
at sqlline.SqlLine.begin(SqlLine.java:681)
at sqlline.SqlLine.start(SqlLine.java:398)
at sqlline.SqlLine.main(SqlLine.java:292)
Caused by: org.apache.phoenix.schema.StaleRegionBoundaryCacheException: ERROR
1108 (XCL08): Cache of region boundaries are out of date.
at
org.apache.phoenix.exception.SQLExceptionCode$13.newException(SQLExceptionCode.java:311)
at
org.apache.phoenix.exception.SQLExceptionInfo.buildException(SQLExceptionInfo.java:145)
at
org.apache.phoenix.util.ServerUtil.parseRemoteException(ServerUtil.java:131)
at
org.apache.phoenix.util.ServerUtil.parseServerExceptionOrNull(ServerUtil.java:115)
at
org.apache.phoenix.util.ServerUtil.parseServerException(ServerUtil.java:104)
at
org.apache.phoenix.iterate.ScanningResultIterator.next(ScanningResultIterator.java:57)
at
org.apache.phoenix.iterate.TableResultIterator.next(TableResultIterator.java:122)
at
org.apache.phoenix.iterate.SpoolingResultIterator.<init>(SpoolingResultIterator.java:108)
at
org.apache.phoenix.iterate.SpoolingResultIterator.<init>(SpoolingResultIterator.java:75)
at
org.apache.phoenix.iterate.SpoolingResultIterator$SpoolingResultIteratorFactory.newIterator(SpoolingResultIterator.java:69)
at
org.apache.phoenix.iterate.ParallelIterators$1.call(ParallelIterators.java:99)
at
org.apache.phoenix.iterate.ParallelIterators$1.call(ParallelIterators.java:90)
at java.util.concurrent.FutureTask.run(FutureTask.java:262)
at
org.apache.phoenix.job.JobManager$InstrumentedJobFutureTask.run(JobManager.java:172)
at
java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1145)
at
java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:615)
at java.lang.Thread.run(Thread.java:745)
Scan :
{"timeRange":[0,1455020959272],"batch":-1,"startRow":"\\x80\\x00\\xC3O\\xC2\\x05d\\x00","stopRow":"\\xC2\\x0D5\\x00\\x80\\x01\\xE9o","loadColumnFamiliesOnDemand":null,"totalColumns":1,"cacheBlocks":true,"families":{"0":["ALL"]},"maxResultSize":2097152,"maxVersions":1,"filter":"FirstKeyOnlyFilter","caching":100}
Scan :
{"timeRange":[0,1455020959272],"batch":-1,"startRow":"\\xC2\\x0D5\\x00\\x80\\x01\\xE9o","stopRow":"\\xC2\\x1A\\x03\\x00\\x80\\x03\\xD1\\xA3","loadColumnFamiliesOnDemand":null,"totalColumns":1,"cacheBlocks":true,"families":{"0":["ALL"]},"maxResultSize":2097152,"maxVersions":1,"filter":"FirstKeyOnlyFilter","caching":100}
Scan :
{"timeRange":[0,1455020959272],"batch":-1,"startRow":"\\xC2\\x1A\\x03\\x00\\x80\\x03\\xD1\\xA3","stopRow":"","loadColumnFamiliesOnDemand":null,"totalColumns":1,"cacheBlocks":true,"families":{"0":["ALL"]},"maxResultSize":2097152,"maxVersions":1,"filter":"FirstKeyOnlyFilter","caching":100}
Scan :
{"timeRange":[0,1455020959272],"batch":-1,"startRow":"\\xC2\\x1A\\x03\\x00\\x80\\x03\\xD1\\xA3","stopRow":"","loadColumnFamiliesOnDemand":null,"totalColumns":1,"cacheBlocks":true,"families":{"0":["ALL"]},"maxResultSize":2097152,"maxVersions":1,"filter":"FirstKeyOnlyFilter","caching":100}
| 1 | 100
|
{noformat}
> index split while running group by query is returning duplicate results
> -----------------------------------------------------------------------
>
> Key: PHOENIX-2665
> URL: https://issues.apache.org/jira/browse/PHOENIX-2665
> Project: Phoenix
> Issue Type: Bug
> Reporter: Rajeshbabu Chintaguntla
> Assignee: Rajeshbabu Chintaguntla
> Priority: Blocker
> Fix For: 4.7.0
>
>
> When an index region splits while a group by query is running, the query
> returns duplicate results.
> Instead of returning 500,000 records it's returning 729,500 records.
> {noformat}
> +------------------------------------------+------------------------------------------+
> | 4999 | 499999
> |
> +------------------------------------------+------------------------------------------+
> 500,000 rows selected (11.996 seconds)
> {noformat}
> {noformat}
> +------------------------------------------+------------------------------------------+
> | 4999 | 499999
> |
> +------------------------------------------+------------------------------------------+
> 729,500 rows selected (15.291 seconds)
> {noformat}
--
This message was sent by Atlassian JIRA
(v6.3.4#6332)