[ 
https://issues.apache.org/jira/browse/PHOENIX-2665?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=15138874#comment-15138874
 ] 

Rajeshbabu Chintaguntla commented on PHOENIX-2665:
--------------------------------------------------

These are the logs I have added to reproduce it.
{noformat}
+------------------------------------------+------------------------------------------+
|                 UNSIG_ID                 |                    ID                    |
+------------------------------------------+------------------------------------------+
 Scan : 
{"timeRange":[0,1455020959272],"batch":-1,"startRow":"","stopRow":"\\xC2\\x1A\\x03\\x00\\x80\\x03\\xD1\\xA3","loadColumnFamiliesOnDemand":null,"totalColumns":1,"cacheBlocks":true,"families":{"0":["ALL"]},"maxResultSize":2097152,"maxVersions":1,"filter":"FirstKeyOnlyFilter","caching":100}
 Scan in staleRegionBoundary: 
{"timeRange":[0,1455020959272],"batch":-1,"startRow":"\\x80\\x00\\xC3O\\xC2\\x05d\\x00","stopRow":"\\xC2\\x1A\\x03\\x00\\x80\\x03\\xD1\\xA3","loadColumnFamiliesOnDemand":null,"totalColumns":1,"cacheBlocks":true,"families":{"0":["ALL"]},"maxResultSize":2097152,"maxVersions":1,"filter":"FirstKeyOnlyFilter","caching":100}
java.util.concurrent.ExecutionException: 
org.apache.phoenix.schema.StaleRegionBoundaryCacheException: ERROR 1108 
(XCL08): Cache of region boundaries are out of date.
        at java.util.concurrent.FutureTask.report(FutureTask.java:122)
        at java.util.concurrent.FutureTask.get(FutureTask.java:202)
        at 
org.apache.phoenix.iterate.BaseResultIterators.getIterators(BaseResultIterators.java:570)
        at 
org.apache.phoenix.iterate.BaseResultIterators.getIterators(BaseResultIterators.java:518)
        at 
org.apache.phoenix.iterate.BaseResultIterators.getIterators(BaseResultIterators.java:497)
        at 
org.apache.phoenix.iterate.MergeSortResultIterator.getIterators(MergeSortResultIterator.java:48)
        at 
org.apache.phoenix.iterate.MergeSortResultIterator.minIterator(MergeSortResultIterator.java:84)
        at 
org.apache.phoenix.iterate.MergeSortResultIterator.next(MergeSortResultIterator.java:111)
        at 
org.apache.phoenix.iterate.BaseGroupedAggregatingResultIterator.next(BaseGroupedAggregatingResultIterator.java:64)
        at 
org.apache.phoenix.jdbc.PhoenixResultSet.next(PhoenixResultSet.java:765)
        at sqlline.IncrementalRows.hasNext(IncrementalRows.java:62)
        at sqlline.TableOutputFormat.print(TableOutputFormat.java:33)
        at sqlline.SqlLine.print(SqlLine.java:1653)
        at sqlline.Commands.execute(Commands.java:833)
        at sqlline.Commands.sql(Commands.java:732)
        at sqlline.SqlLine.dispatch(SqlLine.java:808)
        at sqlline.SqlLine.begin(SqlLine.java:681)
        at sqlline.SqlLine.start(SqlLine.java:398)
        at sqlline.SqlLine.main(SqlLine.java:292)
Caused by: org.apache.phoenix.schema.StaleRegionBoundaryCacheException: ERROR 
1108 (XCL08): Cache of region boundaries are out of date.
        at 
org.apache.phoenix.exception.SQLExceptionCode$13.newException(SQLExceptionCode.java:311)
        at 
org.apache.phoenix.exception.SQLExceptionInfo.buildException(SQLExceptionInfo.java:145)
        at 
org.apache.phoenix.util.ServerUtil.parseRemoteException(ServerUtil.java:131)
        at 
org.apache.phoenix.util.ServerUtil.parseServerExceptionOrNull(ServerUtil.java:115)
        at 
org.apache.phoenix.util.ServerUtil.parseServerException(ServerUtil.java:104)
        at 
org.apache.phoenix.iterate.ScanningResultIterator.next(ScanningResultIterator.java:57)
        at 
org.apache.phoenix.iterate.TableResultIterator.next(TableResultIterator.java:122)
        at 
org.apache.phoenix.iterate.SpoolingResultIterator.<init>(SpoolingResultIterator.java:108)
        at 
org.apache.phoenix.iterate.SpoolingResultIterator.<init>(SpoolingResultIterator.java:75)
        at 
org.apache.phoenix.iterate.SpoolingResultIterator$SpoolingResultIteratorFactory.newIterator(SpoolingResultIterator.java:69)
        at 
org.apache.phoenix.iterate.ParallelIterators$1.call(ParallelIterators.java:99)
        at 
org.apache.phoenix.iterate.ParallelIterators$1.call(ParallelIterators.java:90)
        at java.util.concurrent.FutureTask.run(FutureTask.java:262)
        at 
org.apache.phoenix.job.JobManager$InstrumentedJobFutureTask.run(JobManager.java:172)
        at 
java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1145)
        at 
java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:615)
        at java.lang.Thread.run(Thread.java:745)
 Scan : 
{"timeRange":[0,1455020959272],"batch":-1,"startRow":"\\x80\\x00\\xC3O\\xC2\\x05d\\x00","stopRow":"\\xC2\\x0D5\\x00\\x80\\x01\\xE9o","loadColumnFamiliesOnDemand":null,"totalColumns":1,"cacheBlocks":true,"families":{"0":["ALL"]},"maxResultSize":2097152,"maxVersions":1,"filter":"FirstKeyOnlyFilter","caching":100}
 Scan : 
{"timeRange":[0,1455020959272],"batch":-1,"startRow":"\\xC2\\x0D5\\x00\\x80\\x01\\xE9o","stopRow":"\\xC2\\x1A\\x03\\x00\\x80\\x03\\xD1\\xA3","loadColumnFamiliesOnDemand":null,"totalColumns":1,"cacheBlocks":true,"families":{"0":["ALL"]},"maxResultSize":2097152,"maxVersions":1,"filter":"FirstKeyOnlyFilter","caching":100}
 Scan : 
{"timeRange":[0,1455020959272],"batch":-1,"startRow":"\\xC2\\x1A\\x03\\x00\\x80\\x03\\xD1\\xA3","stopRow":"","loadColumnFamiliesOnDemand":null,"totalColumns":1,"cacheBlocks":true,"families":{"0":["ALL"]},"maxResultSize":2097152,"maxVersions":1,"filter":"FirstKeyOnlyFilter","caching":100}
 Scan : 
{"timeRange":[0,1455020959272],"batch":-1,"startRow":"\\xC2\\x1A\\x03\\x00\\x80\\x03\\xD1\\xA3","stopRow":"","loadColumnFamiliesOnDemand":null,"totalColumns":1,"cacheBlocks":true,"families":{"0":["ALL"]},"maxResultSize":2097152,"maxVersions":1,"filter":"FirstKeyOnlyFilter","caching":100}
| 1                                        | 100                                      |
{noformat}

> index split while running group by query is returning duplicate results
> -----------------------------------------------------------------------
>
>                 Key: PHOENIX-2665
>                 URL: https://issues.apache.org/jira/browse/PHOENIX-2665
>             Project: Phoenix
>          Issue Type: Bug
>            Reporter: Rajeshbabu Chintaguntla
>            Assignee: Rajeshbabu Chintaguntla
>            Priority: Blocker
>             Fix For: 4.7.0
>
>
> When an index splits while a group by query is running, the query returns
> duplicate results.
> Instead of returning 500,000 records it's returning 729,500 records.
> {noformat}
> +------------------------------------------+------------------------------------------+
> | 4999                                     | 499999                                   |
> +------------------------------------------+------------------------------------------+
> 500,000 rows selected (11.996 seconds)
> {noformat}
> {noformat}
> +------------------------------------------+------------------------------------------+
> | 4999                                     | 499999                                   |
> +------------------------------------------+------------------------------------------+
> 729,500 rows selected (15.291 seconds)
> {noformat}



--
This message was sent by Atlassian JIRA
(v6.3.4#6332)

Reply via email to