[ 
https://issues.apache.org/jira/browse/ASTERIXDB-1208?page=com.atlassian.jira.plugin.system.issuetabpanels:all-tabpanel
 ]

Taewoo Kim closed ASTERIXDB-1208.
---------------------------------
    Resolution: Fixed

https://asterix-gerrit.ics.uci.edu/#/c/1448/

> ngram tokenizer failure with negative length
> --------------------------------------------
>
>                 Key: ASTERIXDB-1208
>                 URL: https://issues.apache.org/jira/browse/ASTERIXDB-1208
>             Project: Apache AsterixDB
>          Issue Type: Bug
>          Components: Hyracks Core
>            Reporter: Wenhai
>            Assignee: Taewoo Kim
>
> Schemas
> {noformat}
> drop dataverse test if exists;
> create dataverse test;
> use dataverse test;
> create type DBLPOpenType as open {
>   id: int64,
>   dblpid: string,
>   authors: string,
>   misc: string
> }
> create dataset DBLPOpen(DBLPOpenType) primary key id;
> insert into dataset DBLPOpen { "id": 93, "dblpid": 
> "journals/iandc/IbarraJCR91", "authors": "Some Classes of Languages in NC¹", 
> "misc": "2006-04-25 86-106 Inf. Comput. January 1991 90 1 
> db/journals/iandc/iandc90.html#IbarraJCR91" }
> {noformat}
> Query
> {noformat}
> use dataverse test;
> set import-private-functions 'true'
> for $d in dataset DBLPOpen
> where 
> similarity-jaccard(gram-tokens("",3,false),gram-tokens($d.title,3,false)) >= 
> 0.5
> return {"rec": $d}
> {noformat}



--
This message was sent by Atlassian JIRA
(v6.3.4#6332)

Reply via email to