[ 
https://issues.apache.org/jira/browse/ASTERIXDB-1208?page=com.atlassian.jira.plugin.system.issuetabpanels:all-tabpanel
 ]

Wenhai updated ASTERIXDB-1208:
------------------------------
    Description: 
Schemas
{noformat}
drop dataverse test if exists;
create dataverse test;
use dataverse test;
create type DBLPOpenType as open {
  id: int64,
  dblpid: string,
  authors: string,
  misc: string
}
create dataset DBLPOpen(DBLPOpenType) primary key id;
insert into dataset DBLPOpen { "id": 93, "dblpid": 
"journals/iandc/IbarraJCR91", "authors": "Some Classes of Languages in NC¹", 
"misc": "2006-04-25 86-106 Inf. Comput. January 1991 90 1 
db/journals/iandc/iandc90.html#IbarraJCR91" }
{noformat}
Query
{noformat}
use dataverse test;
set import-private-functions 'true'
for $d in dataset DBLPOpen
where similarity-jaccard(gram-tokens("",3,false),gram-tokens($d.title,3,false)) 
>= 0.5
return {"rec": $d}
{noformat}

  was:
drop dataverse test if exists;
create dataverse test;
use dataverse test;
create type DBLPOpenType as open {
  id: int64,
  dblpid: string,
  authors: string,
  misc: string
}
create dataset DBLPOpen(DBLPOpenType) primary key id;
insert into dataset DBLPOpen { "id": 93, "dblpid": 
"journals/iandc/IbarraJCR91", "authors": "Some Classes of Languages in NC¹", 
"misc": "2006-04-25 86-106 Inf. Comput. January 1991 90 1 
db/journals/iandc/iandc90.html#IbarraJCR91" }

use dataverse test;
set import-private-functions 'true'
for $d in dataset DBLPOpen
where similarity-jaccard(gram-tokens("",3,false),gram-tokens($d.title,3,false)) 
>= 0.5
return {"rec": $d}


> ngram tokenizer failure with negative length
> --------------------------------------------
>
>                 Key: ASTERIXDB-1208
>                 URL: https://issues.apache.org/jira/browse/ASTERIXDB-1208
>             Project: Apache AsterixDB
>          Issue Type: Bug
>          Components: Hyracks Core
>            Reporter: Wenhai
>            Assignee: Taewoo Kim
>
> Schemas
> {noformat}
> drop dataverse test if exists;
> create dataverse test;
> use dataverse test;
> create type DBLPOpenType as open {
>   id: int64,
>   dblpid: string,
>   authors: string,
>   misc: string
> }
> create dataset DBLPOpen(DBLPOpenType) primary key id;
> insert into dataset DBLPOpen { "id": 93, "dblpid": 
> "journals/iandc/IbarraJCR91", "authors": "Some Classes of Languages in NC¹", 
> "misc": "2006-04-25 86-106 Inf. Comput. January 1991 90 1 
> db/journals/iandc/iandc90.html#IbarraJCR91" }
> {noformat}
> Query
> {noformat}
> use dataverse test;
> set import-private-functions 'true'
> for $d in dataset DBLPOpen
> where similarity-jaccard(gram-tokens("",3,false),gram-tokens($d.title,3,false))
> >= 0.5
> return {"rec": $d}
> {noformat}



--
This message was sent by Atlassian JIRA
(v6.3.4#6332)

Reply via email to