http://git-wip-us.apache.org/repos/asf/asterixdb/blob/d906bd89/asterixdb/asterix-app/data/pub-small/csxauthors.adm
----------------------------------------------------------------------
diff --git a/asterixdb/asterix-app/data/pub-small/csxauthors.adm 
b/asterixdb/asterix-app/data/pub-small/csxauthors.adm
new file mode 100644
index 0000000..05064f7
--- /dev/null
+++ b/asterixdb/asterix-app/data/pub-small/csxauthors.adm
@@ -0,0 +1,196 @@
+{ "authors": "Annegret Weng" }
+{ "authors": "Antti Airola Sampo Pyysalo Jari Björne Tapio Pahikkala Filip 
Ginter Tapio Salakoski" }
+{ "authors": "Christian Poellabauer Karsten Schwan Richard West" }
+{ "authors": "Christina S. Leslie Eleazar Eskin Adiel Cohen Jason Weston 
William Stafford Noble" }
+{ "authors": "Christoph Heinz Bernhard Seeger" }
+{ "authors": "Chunhua Shen Michael J. Brooks Anton Van Den Hengel" }
+{ "authors": "Darrin P. Lewis Tony Jebara William Stafford Noble" }
+{ "authors": "Dawson Engler M. Frans Kaashoek James O'toole" }
+{ "authors": "Francis R. Bach" }
+{ "authors": "Francis R. Bach Michael I. Jordan" }
+{ "authors": "Guang Dai Dit-yan Yeung Hong Chang" }
+{ "authors": "Kenji Hisazumi Teruaki Kitasuka Tsuneo Nakanishi Akira Fukuda" }
+{ "authors": "Matthew Brand" }
+{ "authors": "Michael Engel Bernd Freisleben" }
+{ "authors": "Michael Hohmuth Hendrik Tews Shane G. Stephens" }
+{ "authors": "Robert Jenssen Torbjørn Eltoft" }
+{ "authors": "Sayantan Sur Hyun-wook Jin Dhabaleswar K. Panda" }
+{ "authors": "Songcan Chen Daoqiang Zhang" }
+{ "authors": "W. Chen" }
+{ "authors": "Zhe Wang Songcan Chen" }
+{ "authors": "Zhiwei Gu Tao Mei Jinhui Tang Xiuqing Wu Xian-sheng Hua" }
+{ "authors": "Ajith Abraham Swagatam Das Amit Konar" }
+{ "authors": "Alexei Pozdnoukhov Samy Bengio" }
+{ "authors": "Arvind Seshadri Mark Luk Ning Qu Adrian Perrig" }
+{ "authors": "Benjamin Schrauwen Jan Van Campenhout" }
+{ "authors": "Brian Kulis Mátyás A. Sustik Inderjit S. Dhillon" }
+{ "authors": "Brian N. Bershad Craig Chambers Susan Eggers Chris Maeda Dylan 
McNamee Przemyslaw Pardyak Stefan Savage Emin Gün Sirer Emin Gun Sirer" }
+{ "authors": "Bryan Ford Mike Hibler Jay Lepreau Patrick Tullmann Godmar Back 
Stephen Clawson" }
+{ "authors": "Charles Crowley" }
+{ "authors": "Cheng Soon Ong Er J. Smola Robert C. Williamson" }
+{ "authors": "Dan Tsafrir Yoav Etsion Dror G. Feitelson Scott Kirkpatrick" }
+{ "authors": "Gang Wang Tao Chen Dit-yan Yeung Frederick H. Lochovsky" }
+{ "authors": "Glenn Fung Murat Dundar Jinbo Bi Bharat Rao" }
+{ "authors": "Gregory E. Fasshauer Joseph W. Jerome" }
+{ "authors": "Jezekiel Ben-arie Zhiqian Wang" }
+{ "authors": "Jianjun Yu Shengmin Guo Hao Su Hui Zhang Ke Xu" }
+{ "authors": "Lamia Youseff Jack Dongarra Keith Seymour Rich Wolski Haihang 
You" }
+{ "authors": "Matthew Burnside Angelos D. Keromytis" }
+{ "authors": "Michel Neuhaus Horst Bunke" }
+{ "authors": "Nail Akar Khosrow Sohraby" }
+{ "authors": "Roland Opfer" }
+{ "authors": "Samuel G. Steckley Shane G. Henderson" }
+{ "authors": "Samy Bengio Johnny Mariéthoz" }
+{ "authors": "Subhransu Maji Alexander C. Berg Jitendra Malik" }
+{ "authors": "Tatsuo Nakajima Hideyuki Tokuda" }
+{ "authors": "Aharon Bar Hillel Tomer Hertz Daphna Weinshall" }
+{ "authors": "Andreas Argyriou Raphael Hauser Charles A. Micchelli 
Massimiliano Pontil" }
+{ "authors": "Bastian Blankenburg Rajdeep K. Dash Sarvapali D. Ramchurn 
Matthias Klusch Nicholas R. Jennings" }
+{ "authors": "Brian N. Bershad" }
+{ "authors": "Cheng Soon Ong Alexander J. Smola Robert C. Williamson" }
+{ "authors": "Dawei Liu Xihong Lin Debashis Ghosh" }
+{ "authors": "Erik H. W. Meijering Karel J. Zuiderveld Max A. Viergever" }
+{ "authors": "Ernest Artiaga Albert Serra Marisa Gil" }
+{ "authors": "Francis R. Bach Gert R. G. Lanckriet Michael I. Jordan" }
+{ "authors": "Hiren D. Patel Sandeep K. Shukla" }
+{ "authors": "Hujun Yin" }
+{ "authors": "Ingo Mierswa Katharina Morik" }
+{ "authors": "Jinbo Bi Glenn Fung Murat Dundar Bharat Rao" }
+{ "authors": "Michel Gien" }
+{ "authors": "Min Xu Ravi Sandhu Xuxian Jiang Xinwen Zhang" }
+{ "authors": "Qun Dai Songcan Chen" }
+{ "authors": "Yoshisato Yanagisawa Shigeru Chiba Kenichi Kourai" }
+{ "authors": "Carsten Ditze" }
+{ "authors": "Ding-xuan Zhou" }
+{ "authors": "Faisal N. Abu-khzam Michael A. Langston W. Henry Suters" }
+{ "authors": "Gernot Heiser Volkmar Uhlig Joshua Levasseur" }
+{ "authors": "Jean-charles Fabre" }
+{ "authors": "Jieping Ye Jianhui Chen Shuiwang Ji" }
+{ "authors": "Karsten M. Borgwardt Cheng Soon Ong Stefan Schönauer S. V. N. 
Vishwanathan Alex J. Smola Hans-peter Kriegel" }
+{ "authors": "Moonsang Kwon Yookun Cho" }
+{ "authors": "Pavel P. Kuksa Pai-hsi Huang Vladimir Pavlovic" }
+{ "authors": "Peter Druschel" }
+{ "authors": "Philippe Thévenaz Thierry Blu Michael Unser" }
+{ "authors": "Prasanth B. Nair Arindam Choudhury Andy J. Keane" }
+{ "authors": "R. Venkatesh Babu Patrick Pérez Patrick Bouthemy" }
+{ "authors": "Y. Jeon I.H. Sloan E. P. Stephan J. Elschner" }
+{ "authors": "Zheng Rong Yang" }
+{ "authors": "Carl G. Looney" }
+{ "authors": "Cheng Soon Ong Stéphane Canu Alexander J. Smola" }
+{ "authors": "Florent Lafarge Xavier Descombes Josiane Zerubia" }
+{ "authors": "Gregory D. Benson Ronald A. Olsson" }
+{ "authors": "Huzefa Rangwala George Karypis" }
+{ "authors": "Ingo Steinwart" }
+{ "authors": "Jezekiel Ben-Arie Zhiqian Wang" }
+{ "authors": "Johannes Aßfalg Karsten M. Borgwardt Hans-peter Kriegel" }
+{ "authors": "John Penix Willem Visser Eric Engstrom Aaron Larson Nicholas 
Weininger" }
+{ "authors": "John Penix Willem Visser Seungjoon Park Eric Engstrom Aaron 
Larson Nicholas Weininger" }
+{ "authors": "Jooseuk Kim Clayton D. Scott" }
+{ "authors": "Joseph Reisinger Peter Stone Risto Miikkulainen" }
+{ "authors": "Keith Sullivan Sean Luke" }
+{ "authors": "Majid M. Beigi Andreas Zell" }
+{ "authors": "Mark Baker Hong Ong" }
+{ "authors": "Matthias Daum Jan Dörrenbächer Sebastian Bogan" }
+{ "authors": "Sauro Menchetti Fabrizio Costa Paolo Frasconi" }
+{ "authors": "Shiliang Sun Changshui Zhang" }
+{ "authors": "Volker Roth Bernd Fischer" }
+{ "authors": "Andrea C. Arpaci-Dusseau Remzi H. Arpaci-Dusseau Nathan C. 
Burnett Timothy E. Denehy Thomas J. Engle Haryadi S. Gunawi James A. Nugent 
Florentina I. Popovici" }
+{ "authors": "Cyril Allauzen Mehryar Mohri Ameet Talwalkar" }
+{ "authors": "Daniel Lohmann Fabian Scheler Reinhard Tartler Olaf Spinczyk 
Wolfgang Schröder-preikschat" }
+{ "authors": "David J. Crisp Christopher J. C. Burges" }
+{ "authors": "Francis R. Bach Romain Thibaux Michael I. Jordan" }
+{ "authors": "Greg Kuperberg" }
+{ "authors": "Holger Fröhlich Jörg K. Wegner Florian Sieker Andreas Zell" }
+{ "authors": "Italo J. Dejter Abel A. Delgado" }
+{ "authors": "Kristin P. Bennett Michinari Momma Mark J. Embrechts" }
+{ "authors": "Maria-florina Balcan Avrim Blum Santosh Vempala" }
+{ "authors": "Roberto Manduchi Pietro Perona" }
+{ "authors": "Roger Butenuth" }
+{ "authors": "Sarit Shwartz Michael Zibulevsky Yoav Y. Schechner" }
+{ "authors": "Senjian An Wanquan Liu Svetha Venkatesh" }
+{ "authors": "Swagatam Das Ajith Abraham Amit Konar" }
+{ "authors": "Tony Van Gestel Johan A. K. Suykens Bart Baesens Stijn Viaene 
Jan Vanthienen Guido Dedene Bart De Moor Joos Vandewalle" }
+{ "authors": "Vladimir Vovk" }
+{ "authors": "Vojislav Kecman Te-Ming Huang Michael Vogt" }
+{ "authors": "Wim Van De Velde Johan Opsommer Erik H. D'Hollander" }
+{ "authors": "Yaniv Gurwicz Boaz Lerner" }
+{ "authors": "Zhang Dao-qiang Chen Song-can" }
+{ "authors": "Alexander Schrijver" }
+{ "authors": "Brian Kulis Mátyás Sustik Inderjit Dhillon" }
+{ "authors": "Charles Pecheur" }
+{ "authors": "Daniel Cremers Timo Kohlberger Christoph Schnörr" }
+{ "authors": "Dao-qiang Zhang Song-can Chen" }
+{ "authors": "Daoqiang Zhang Songcan Chen Zhi-hua Zhou" }
+{ "authors": "Daoqiang Zhang Zhi-hua Zhou Songcan Chen" }
+{ "authors": "Dawson R. Engler M. Frans Kaashoek James O'toole Jr." }
+{ "authors": "Dawson R. Engler M. Frans Kaashoek James O’Toole Jr." }
+{ "authors": "En Bedrijfskunde Gent Tony Van Gestel Bart Baesens Johan A. K. 
Suykens Dirk Van Den Poel Dirk-emma Baestaens Marleen Willekens" }
+{ "authors": "Gregory R. Ganger Dawson R. Engler M. Frans Kaashoek Héctor M. 
Briceño Russell Hunt Thomas Pinckney Vividon Inc" }
+{ "authors": "Olivier Chapelle S. Sathiya Keerthi Vikas Sindhwani" }
+{ "authors": "Pancham Shukla Pier Luigi Dragotti" }
+{ "authors": "Pavel B. Brazdil Carlos Soares" }
+{ "authors": "Richard West Karsten Schwan Christian Poellabauer" }
+{ "authors": "Ronald G. Minnich Matthew J. Sottile Sung-eun Choi Erik Hendriks 
Jim Mckie" }
+{ "authors": "Ryohei Fujimaki Takehisa Yairi Kazuo Machida" }
+{ "authors": "Satoshi Niijima Satoru Kuhara" }
+{ "authors": "Shibin Qiu Terran Lane" }
+{ "authors": "Shotaro Akaho" }
+{ "authors": "Si Wu Shun-ichi Amari" }
+{ "authors": "Songcan Chen Daoqiang Zhang Zhi-hua Zhou" }
+{ "authors": "Steven C. H. Hoi Rong Jin Jianke Zhu Michael R. Lyu" }
+{ "authors": "Thomas Gärtner" }
+{ "authors": "Vlad Olaru Walter F. Tichy" }
+{ "authors": "Alessandro Moschitti Fabio Massimo Zanzotto" }
+{ "authors": "Aurélie Bugeau Patrick Pérez" }
+{ "authors": "Brett Fleisch Mark Allan A. Co" }
+{ "authors": "Chang Wang Stephen D. Scott" }
+{ "authors": "Dawson R. Engler M. Frans Kaashoek James O’toole" }
+{ "authors": "Endre Boros Vladimir Gurvich" }
+{ "authors": "Experimental Design Xuanlong Nguyen Martin J. Wainwright Michael 
I. Jordan" }
+{ "authors": "Francis Bach Michael I. Jordan" }
+{ "authors": "Hideyuki Tokuda Tatsuo Nakajima" }
+{ "authors": "Ingo Mierswa" }
+{ "authors": "John Shawe-taylor Christopher K. I. Williams Nello Cristianini 
Jaz Kandola" }
+{ "authors": "Lavi Shpigelman Yoram Singer Rony Paz Eilon Vaadia" }
+{ "authors": "Luc Brun Walter Kropatsch" }
+{ "authors": "Manuel Díaz Sergio Romero Bartolomé Rubio Enrique Soler José 
M. Troya" }
+{ "authors": "Paul Mckenney Jack Slingwine Phil Krueger" }
+{ "authors": "Rafael Serrano-gotarredona Teresa Serrano-gotarredona Antonio 
Acosta-jiménez Bernabé Linares-barranco" }
+{ "authors": "Rafal Kolanski Gerwin Gerwin Klein" }
+{ "authors": "Sean Luke Keith Sullivan" }
+{ "authors": "Thierry Blu Philippe Thévenaz Michael Unser" }
+{ "authors": "Tiffany M. Mintz James P. Davis" }
+{ "authors": "Xuanlong Nguyen Xuanlong Martin J. Wainwright Michael I. Jordan" 
}
+{ "authors": "Alexei Vinokourov Andrei N. Soklakov Craig Saunders" }
+{ "authors": "Andrew Whitaker Marianne Shaw Steven D. Gribble" }
+{ "authors": "Bruno De Bus Dominique Chanet Ludo Van Put Bjorn De Sutter Koen 
De Bosschere" }
+{ "authors": "Carlo Drioli Davide Rocchesso" }
+{ "authors": "Christoph M. Kirsch Marco A. A. Sanvido Thomas A. Henzinger 
Wolfgang Pree" }
+{ "authors": "Fan Zhang Edwin R. Hancock" }
+{ "authors": "Francesca Odone Annalisa Barla Alessandro Verri" }
+{ "authors": "Hae Jong Seo Peyman Milanfar" }
+{ "authors": "Kiran B. Chilakamarri Peter Hamburger" }
+{ "authors": "Koji Tsuda Taishin Kin Kiyoshi Asai" }
+{ "authors": "Kristis Makris Kyung Dong Ryu" }
+{ "authors": "Lin Gu John A. Stankovic" }
+{ "authors": "M. Frans Kaashoek Dawson R. Engler Gregory R. Ganger Russell 
Hunt Thomas Pinckney" }
+{ "authors": "Bernard Haasdonk Hans Burkhardt" }
+{ "authors": "Brian Kulis Sugato Basu Inderjit Dhillon Raymond Mooney" }
+{ "authors": "Charles A. Micchelli Massimiliano Pontil" }
+{ "authors": "Chia-hui Chang Yu-chieh Wu" }
+{ "authors": "Chunhua Shen Anton Van Den Hengel Anthony Dick Michael J. 
Brooks" }
+{ "authors": "Daniel Lohmann Fabian Scheler Wolfgang Schröder-preikschat Olaf 
Spinczyk" }
+{ "authors": "Guang Dai Dit-yan Yeung" }
+{ "authors": "Ihor Kuz Yan Liu Ian Gorton Gernot Heiser" }
+{ "authors": "Jason Weston Christina Leslie Eugene Ie Dengyong Zhou Andre 
Elisseeff William Stafford Noble" }
+{ "authors": "Junbin Gao Daming Shi Xiaomao Liu" }
+{ "authors": "Khawar M. Zuberi Y Padmanabhan Pillai Kang G. Shin" }
+{ "authors": "Koji Tsuda" }
+{ "authors": "Ramani Duraiswami Vikas C. Raykar" }
+{ "authors": "Rudolf Berghammer Thorsten Hoffmann" }
+{ "authors": "Sayantan Sur Lei Chai Hyun-wook Jin Dhabaleswar K. Panda Sun 
Microsystems" }
+{ "authors": "Seung-jean Kim Alessandro Magnani Stephen Boyd" }
+{ "authors": "Stephen R. Schach Bo Jin David R. Wright Gillian Z. Heller A. 
Jefferson Offutt" }
+{ "authors": "Thomas Röblitz Oliver Bühn Frank Mueller" }
+{ "authors": "Xuanlong Nguyen Martin J. Wainwright Michael I. Jordan" }
+{ "authors": "Yongmin Li Shaogang Gong Heather Liddell" }
\ No newline at end of file

http://git-wip-us.apache.org/repos/asf/asterixdb/blob/d906bd89/asterixdb/asterix-app/data/pub-small/dblp-small-multi-id.txt
----------------------------------------------------------------------
diff --git a/asterixdb/asterix-app/data/pub-small/dblp-small-multi-id.txt 
b/asterixdb/asterix-app/data/pub-small/dblp-small-multi-id.txt
new file mode 100644
index 0000000..7ea80e7
--- /dev/null
+++ b/asterixdb/asterix-app/data/pub-small/dblp-small-multi-id.txt
@@ -0,0 +1,100 @@
+1:books/acm/kim95/AnnevelinkACFHK95:Object SQL - A Language for the Design and 
Implementation of Object Databases.:Jurgen Annevelink Rafiul Ahad Amelia 
Carlson Daniel H. Fishman Michael L. Heytens William Kent:2002-01-03 42-68 1995 
Modern Database Systems db/books/collections/kim95.html#AnnevelinkACFHK95
+2:books/acm/kim95/Blakeley95:OQL[C++]  Extending C++ with an Object Query 
Capability.:José A. Blakeley:2002-01-03 69-88 Modern Database Systems 
db/books/collections/kim95.html#Blakeley95 1995
+3:books/acm/kim95/BreitbartGS95:Transaction Management in Multidatabase 
Systems.:Yuri Breitbart Hector Garcia-Molina Abraham Silberschatz:2004-03-08 
573-591 Modern Database Systems books/acm/Kim95 
db/books/collections/kim95.html#BreitbartGS95 1995
+4:books/acm/kim95/ChristodoulakisK95:Multimedia Information Systems  Issues 
and Approaches.:Stavros Christodoulakis Leonidas Koveos:2002-01-03 318-337 1995 
Modern Database Systems db/books/collections/kim95.html#ChristodoulakisK95
+5:books/acm/kim95/DayalHW95:Active Database Systems.:Umeshwar Dayal Eric N. 
Hanson Jennifer Widom:2002-01-03 434-456 1995 Modern Database Systems 
db/books/collections/kim95.html#DayalHW95
+6:books/acm/kim95/DittrichD95:Where Object-Oriented DBMSs Should Do Better  A 
Critique Based on Early Experiences.:Angelika Kotz Dittrich Klaus R. 
Dittrich:2002-01-03 238-254 1995 Modern Database Systems 
db/books/collections/kim95.html#DittrichD95
+7:books/acm/kim95/Garcia-MolinaH95:Distributed Databases.:Hector Garcia-Molina 
Meichun Hsu:2002-01-03 477-493 1995 Modern Database Systems 
db/books/collections/kim95.html#Garcia-MolinaH95
+8:books/acm/kim95/Goodman95:An Object-Oriented DBMS War Story  Developing a 
Genome Mapping Database in C++.:Nathan Goodman:2002-01-03 216-237 1995 Modern 
Database Systems db/books/collections/kim95.html#Goodman95
+9:books/acm/kim95/Kaiser95:Cooperative Transactions for Multiuser 
Environments.:Gail E. Kaiser:2002-01-03 409-433 1995 Modern Database Systems 
db/books/collections/kim95.html#Kaiser95
+10:books/acm/kim95/KelleyGKRG95:Schema Architecture of the UniSQL/M 
Multidatabase System:William Kelley Sunit K. Gala Won Kim Tom C. Reyes Bruce 
Graham:2004-03-08 Modern Database Systems books/acm/Kim95 621-648 1995 
db/books/collections/kim95.html#KelleyGKRG95
+11:books/acm/kim95/KemperM95:Physical Object Management.:Alfons Kemper Guido 
Moerkotte:2002-01-03 175-202 1995 Modern Database Systems 
db/books/collections/kim95.html#KemperM95
+12:books/acm/kim95/Kim95:Introduction to Part 1  Next-Generation Database 
Technology.:Won Kim:2002-01-03 5-17 1995 Modern Database Systems 
db/books/collections/kim95.html#Kim95
+13:books/acm/kim95/Kim95a:Object-Oriented Database Systems  Promises, Reality, 
and Future.:Won Kim:2002-01-03 255-280 1995 Modern Database Systems 
db/books/collections/kim95.html#Kim95a
+14:books/acm/kim95/Kim95b:Introduction to Part 2  Technology for 
Interoperating Legacy Databases.:Won Kim:2002-01-03 515-520 1995 Modern 
Database Systems db/books/collections/kim95.html#Kim95b
+15:books/acm/kim95/KimCGS95:On Resolving Schematic Heterogeneity in 
Multidatabase Systems.:Won Kim Injun Choi Sunit K. Gala Mark 
Scheevel:2002-01-03 521-550 1995 Modern Database Systems 
db/books/collections/kim95.html#KimCGS95
+16:books/acm/kim95/KimG95:Requirements for a Performance Benchmark for 
Object-Oriented Database Systems.:Won Kim Jorge F. Garza:2002-01-03 203-215 
1995 Modern Database Systems db/books/collections/kim95.html#KimG95
+17:books/acm/kim95/KimK95:On View Support in Object-Oriented Databases 
Systems.:Won Kim William Kelley:2002-01-03 108-129 1995 Modern Database Systems 
db/books/collections/kim95.html#KimK95
+18:books/acm/kim95/Kowalski95:The POSC Solution to Managing E&P Data.:Vincent 
J. Kowalski:2002-01-03 281-301 1995 Modern Database Systems 
db/books/collections/kim95.html#Kowalski95
+19:books/acm/kim95/KriegerA95:C++ Bindings to an Object Database.:David 
Krieger Tim Andrews:2002-01-03 89-107 1995 Modern Database Systems 
db/books/collections/kim95.html#KriegerA95
+20:books/acm/kim95/Lunt95:Authorization in Object-Oriented Databases.:Teresa 
F. Lunt:2002-01-03 130-145 1995 Modern Database Systems 
db/books/collections/kim95.html#Lunt95
+21:books/acm/kim95/MengY95:Query Processing in Multidatabase Systems.:Weiyi 
Meng Clement T. Yu:2002-01-03 551-572 1995 Modern Database Systems 
db/books/collections/kim95.html#MengY95
+22:books/acm/kim95/Motro95:Management of Uncerainty in database 
Systems.:Amihai Motro:2002-01-03 457-476 1995 Modern Database Systems 
db/books/collections/kim95.html#Motro95
+23:books/acm/kim95/Omiecinski95:Parallel Relational Database Systems.:Edward 
Omiecinski:2002-01-03 494-512 1995 Modern Database Systems 
db/books/collections/kim95.html#Omiecinski95
+24:books/acm/kim95/OzsuB95:Query Processing in Object-Oriented Database 
Systems.:M. Tamer Özsu José A. Blakeley:2002-01-03 146-174 1995 Modern 
Database Systems db/books/collections/kim95.html#OzsuB95
+25:books/acm/kim95/RusinkiewiczS95:Specification and Execution of 
Transactional Workflows.:Marek Rusinkiewicz Amit P. Sheth:2004-03-08 592-620 
Modern Database Systems books/acm/Kim95 
db/books/collections/kim95.html#RusinkiewiczS95 1995
+26:books/acm/kim95/Samet95:Spatial Data Structures.:Hanan Samet:2004-03-08 
361-385 Modern Database Systems books/acm/Kim95 
db/books/collections/kim95.html#Samet95 1995
+27:books/acm/kim95/SametA95:Spatial Data Models and Query Processing.:Hanan 
Samet Walid G. Aref:2002-01-03 338-360 1995 Modern Database Systems 
db/books/collections/kim95.html#SametA95
+28:books/acm/kim95/ShanADDK95:Pegasus  A Heterogeneous Information Management 
System.:Ming-Chien Shan Rafi Ahmed Jim Davis Weimin Du William Kent:2004-03-08 
664-682 Modern Database Systems books/acm/Kim95 
db/books/collections/kim95.html#ShanADDK95 1995
+29:books/acm/kim95/Snodgrass95:Temporal Object-Oriented Databases  A Critical 
Comparison.:Richard T. Snodgrass:2002-01-03 386-408 1995 Modern Database 
Systems db/books/collections/kim95.html#Snodgrass95
+30:books/acm/kim95/SoleyK95:The OMG Object Model.:Richard Mark Soley William 
Kent:2002-01-03 18-41 1995 Modern Database Systems 
db/books/collections/kim95.html#SoleyK95
+31:books/acm/kim95/Stout95:EDA/SQL.:Ralph L. Stout:2004-03-08 649-663 Modern 
Database Systems books/acm/Kim95 db/books/collections/kim95.html#Stout95 1995
+32:books/acm/kim95/Thompson95:The Changing Database Standards Landscape.:Craig 
W. Thompson:2002-01-03 302-317 1995 Modern Database Systems 
db/books/collections/kim95.html#Thompson95
+33:books/acm/kim95/BreitbartR95:Overview of the ADDS System.:Yuri Breitbart 
Tom C. Reyes:2009-06-12 683-701 Modern Database Systems books/acm/Kim95 
db/books/collections/kim95.html#BreitbartR95 1995
+34:books/acm/Kim95:Modern Database Systems  The Object Model, 
Interoperability, and Beyond.::2004-03-08 Won Kim Modern Database Systems ACM 
Press and Addison-Wesley 1995 0-201-59098-0 db/books/collections/kim95.html
+35:books/ap/MarshallO79:Inequalities  Theory of Majorization and Its 
Application.:Albert W. Marshall Ingram Olkin:2002-01-03 Academic Press 1979 
0-12-473750-1
+36:books/aw/kimL89/BjornerstedtH89:Version Control in an Object-Oriented 
Architecture.:Anders Björnerstedt Christer Hulten:2006-02-24 451-485 
Object-Oriented Concepts, Databases, and Applications ACM Press and 
Addison-Wesley 1989 db/books/collections/kim89.html#BjornerstedtH89
+37:books/aw/kimL89/BretlMOPSSWW89:The GemStone Data Management System.:Robert 
Bretl David Maier Allen Otis D. Jason Penney Bruce Schuchardt Jacob Stein E. 
Harold Williams Monty Williams:2002-01-03 283-308 Object-Oriented Concepts, 
Databases, and Applications ACM Press and Addison-Wesley 1989 
db/books/collections/kim89.html#BretlMOPSSWW89
+38:books/aw/kimL89/CareyDRS89:Storage Management in EXODUS.:Michael J. Carey 
David J. DeWitt Joel E. Richardson Eugene J. Shekita:2002-01-03 341-369 
Object-Oriented Concepts, Databases, and Applications ACM Press and 
Addison-Wesley 1989 db/books/collections/kim89.html#CareyDRS89
+39:books/aw/kimL89/Decouchant89:A Distributed Object Manager for the 
Smalltalk-80 System.:Dominique Decouchant:2002-01-03 487-520 1989 
Object-Oriented Concepts, Databases, and Applications 
db/books/collections/kim89.html#Decouchant89
+40:books/aw/kimL89/DiederichM89:Objects, Messages, and Rules in Database 
Design.:Jim Diederich Jack Milton:2002-01-03 177-197 1989 Object-Oriented 
Concepts, Databases, and Applications 
db/books/collections/kim89.html#DiederichM89
+41:books/aw/kimL89/EllisG89:Active Objects  Ealities and 
Possibilities.:Clarence A. Ellis Simon J. Gibbs:2002-01-03 561-572 1989 
Object-Oriented Concepts, Databases, and Applications 
db/books/collections/kim89.html#EllisG89
+42:books/aw/kimL89/FishmanABCCDHHKLLMNRSW89:Overview of the Iris DBMS.:Daniel 
H. Fishman Jurgen Annevelink David Beech E. C. Chow Tim Connors J. W. Davis 
Waqar Hasan C. G. Hoch William Kent S. Leichner Peter Lyngbæk Brom Mahbod 
Marie-Anne Neimat Tore Risch Ming-Chien Shan W. Kevin Wilkinson:2002-01-03 
219-250 Object-Oriented Concepts, Databases, and Applications ACM Press and 
Addison-Wesley 1989 db/books/collections/kim89.html#FishmanABCCDHHKLLMNRSW89
+43:books/aw/kimL89/KimBCGW89:Features of the ORION Object-Oriented Database 
System.:Won Kim Nat Ballou Hong-Tai Chou Jorge F. Garza Darrell 
Woelk:2002-01-03 251-282 Object-Oriented Concepts, Databases, and Applications 
ACM Press and Addison-Wesley 1989 db/books/collections/kim89.html#KimBCGW89
+44:books/aw/kimL89/KimKD89:Indexing Techniques for Object-Oriented 
Databases.:Won Kim Kyung-Chang Kim Alfred G. Dale:2002-01-03 371-394 
Object-Oriented Concepts, Databases, and Applications ACM Press and 
Addison-Wesley 1989 db/books/collections/kim89.html#KimKD89
+45:books/aw/kimL89/King89:My Cat Is Object-Oriented.:Roger King:2002-01-03 
23-30 1989 Object-Oriented Concepts, Databases, and Applications 
db/books/collections/kim89.html#King89
+46:books/aw/kimL89/Maier89:Making Database Systems Fast Enough for CAD 
Applications.:David Maier:2002-01-03 573-582 1989 Object-Oriented Concepts, 
Databases, and Applications db/books/collections/kim89.html#Maier89
+47:books/aw/kimL89/MellenderRS89:Optimizing Smalltalk Message 
Performance.:Fred Mellender Steve Riegel Andrew Straw:2002-01-03 423-450 1989 
Object-Oriented Concepts, Databases, and Applications 
db/books/collections/kim89.html#MellenderRS89
+48:books/aw/kimL89/Moon89:The Common List Object-Oriented Programming Language 
Standard.:David A. Moon:2002-01-03 49-78 1989 Object-Oriented Concepts, 
Databases, and Applications db/books/collections/kim89.html#Moon89
+49:books/aw/kimL89/Moss89:Object Orientation as Catalyst for Language-Database 
Inegration.:J. Eliot B. Moss:2002-01-03 583-592 1989 Object-Oriented Concepts, 
Databases, and Applications db/books/collections/kim89.html#Moss89
+50:books/aw/kimL89/Nierstrasz89:A Survey of Object-Oriented Concepts.:Oscar 
Nierstrasz:2002-01-03 3-21 1989 Object-Oriented Concepts, Databases, and 
Applications db/books/collections/kim89.html#Nierstrasz89
+51:books/aw/kimL89/NierstraszT89:Integrated Office Systems.:Oscar Nierstrasz 
Dennis Tsichritzis:2002-01-03 199-215 1989 Object-Oriented Concepts, Databases, 
and Applications db/books/collections/kim89.html#NierstraszT89
+52:books/aw/kimL89/Russinoff89:Proteus  A Frame-Based Nonmonotonic Inference 
System.:David M. Russinoff:2002-01-03 127-150 Object-Oriented Concepts, 
Databases, and Applications ACM Press and Addison-Wesley 1989 
db/books/collections/kim89.html#Russinoff89
+53:books/aw/kimL89/SkarraZ89:Concurrency Control and Object-Oriented 
Databases.:Andrea H. Skarra Stanley B. Zdonik:2002-01-03 395-421 1989 
Object-Oriented Concepts, Databases, and Applications 
db/books/collections/kim89.html#SkarraZ89
+54:books/aw/kimL89/SteinLU89:A Shared View of Sharing  The Treaty of 
Orlando.:Lynn Andrea Stein Henry Lieberman David Ungar:2002-01-03 31-48 1989 
Object-Oriented Concepts, Databases, and Applications 
db/books/collections/kim89.html#SteinLU89
+55:books/aw/kimL89/TarltonT89:Pogo  A Declarative Representation System for 
Graphics.:Mark A. Tarlton P. Nong Tarlton:2002-01-03 151-176 1989 
Object-Oriented Concepts, Databases, and Applications 
db/books/collections/kim89.html#TarltonT89
+56:books/aw/kimL89/TomlinsonS89:Concurrent Object-Oriented Programming 
Languages.:Chris Tomlinson Mark Scheevel:2002-01-03 79-124 1989 Object-Oriented 
Concepts, Databases, and Applications 
db/books/collections/kim89.html#TomlinsonS89
+57:books/aw/kimL89/TsichritzisN89:Directions in Object-Oriented 
Research.:Dennis Tsichritzis Oscar Nierstrasz:2002-01-03 523-536 1989 
Object-Oriented Concepts, Databases, and Applications 
db/books/collections/kim89.html#TsichritzisN89
+58:books/aw/kimL89/Wand89:A Proposal for a Formal Model of Objects.:Yair 
Wand:2002-01-03 537-559 1989 Object-Oriented Concepts, Databases, and 
Applications db/books/collections/kim89.html#Wand89
+59:books/aw/kimL89/WeiserL89:OZ+  An Object-Oriented Database System.:Stephen 
P. Weiser Frederick H. Lochovsky:2002-01-03 309-337 1989 Object-Oriented 
Concepts, Databases, and Applications db/books/collections/kim89.html#WeiserL89
+60:books/aw/stonebraker86/RoweS86:The Commercial INGRES Epilogue.:Lawrence A. 
Rowe Michael Stonebraker:2002-01-03 63-82 1986 The INGRES Papers 
db/books/collections/Stonebraker86.html#RoweS86 
db/books/collections/Stonebraker86/RoweS86.html ingres/P063.pdf
+61:books/aw/stonebraker86/Stonebraker86:Design of Relational Systems 
(Introduction to Section 1).:Michael Stonebraker:2002-01-03 1-3 1986 The INGRES 
Papers db/books/collections/Stonebraker86.html#Stonebraker86 
db/books/collections/Stonebraker86/Stonebraker86.html ingres/P001.pdf
+62:books/aw/stonebraker86/Stonebraker86a:Supporting Studies on Relational 
Systems (Introduction to Section 2).:Michael Stonebraker:2002-01-03 83-85 1986 
The INGRES Papers db/books/collections/Stonebraker86.html#Stonebraker86a 
db/books/collections/Stonebraker86/Stonebraker86a.html ingres/P083.pdf
+63:books/aw/stonebraker86/Stonebraker86b:Distributed Database Systems 
(Introduction to Section 3).:Michael Stonebraker:2002-01-03 183-186 1986 The 
INGRES Papers db/books/collections/Stonebraker86.html#Stonebraker86b 
db/books/collections/Stonebraker86/Stonebraker86b.html ingres/P183.pdf
+64:books/aw/stonebraker86/Stonebraker86c:The Design and Implementation of 
Distributed INGRES.:Michael Stonebraker:2002-01-03 187-196 1986 The INGRES 
Papers db/books/collections/Stonebraker86.html#Stonebraker86c 
db/books/collections/Stonebraker86/Stonebraker86c.html ingres/P187.pdf
+65:books/aw/stonebraker86/Stonebraker86d:User Interfaces for Database Systems 
(Introduction to Section 4).:Michael Stonebraker:2002-01-03 243-245 1986 The 
INGRES Papers db/books/collections/Stonebraker86.html#Stonebraker86d 
db/books/collections/Stonebraker86/Stonebraker86d.html ingres/P243.pdf
+66:books/aw/stonebraker86/Stonebraker86e:Extended Semantics for the Relational 
Model (Introduction to Section 5).:Michael Stonebraker:2002-01-03 313-316 1986 
The INGRES Papers db/books/collections/Stonebraker86.html#Stonebraker86e 
db/books/collections/Stonebraker86/Stonebraker86e.html ingres/P313.pdf
+67:books/aw/stonebraker86/Stonebraker86f:Database Design (Introduction to 
Section 6).:Michael Stonebraker:2002-01-03 393-394 1986 The INGRES Papers 
db/books/collections/Stonebraker86.html#Stonebraker86f 
db/books/collections/Stonebraker86/Stonebraker86f.html ingres/P393.pdf
+68:books/aw/stonebraker86/X86:Title, Preface, Contents.::2002-01-03 1986 The 
INGRES Papers db/books/collections/Stonebraker86.html#X86 
db/books/collections/Stonebraker86/X86.html ingres/frontmatter.pdf
+69:books/aw/stonebraker86/X86a:References.::2002-01-03 429-444 1986 The INGRES 
Papers db/books/collections/Stonebraker86.html#X86a 
db/books/collections/Stonebraker86/X86a.html ingres/P429.pdf
+70:books/aw/Knuth86a:TeX  The Program:Donald E. Knuth:2002-01-03 
Addison-Wesley 1986 0-201-13437-3
+71:conf/appt/LiDCMY07:Design and Implementation of a High-Speed Reconfigurable 
Modular Arithmetic Unit.:Wei Li Zibin Dai Tao Chen Tao Meng Xuan 
Yang:2007-11-09 50-59 2007 conf/appt/2007 APPT http 
//dx.doi.org/10.1007/978-3-540-76837-1_9 db/conf/appt/appt2007.html#LiDCMY07
+72:books/aw/Lamport86:LaTeX  User's Guide & Reference Manual:Leslie 
Lamport:2002-01-03 Addison-Wesley 1986 0-201-15790-X
+73:books/aw/AhoHU74:The Design and Analysis of Computer Algorithms.:Alfred V. 
Aho John E. Hopcroft Jeffrey D. Ullman:2002-01-03 Addison-Wesley 1974 
0-201-00029-6
+74:books/aw/Lamport2002:Specifying Systems, The TLA+ Language and Tools for 
Hardware and Software Engineers:Leslie Lamport:2005-07-28 Addison-Wesley 2002 
0-3211-4306-X http //research.microsoft.com/users/lamport/tla/book.html
+75:books/aw/AhoHU83:Data Structures and Algorithms.:Alfred V. Aho John E. 
Hopcroft Jeffrey D. Ullman:2002-01-03 Addison-Wesley 1983 0-201-00023-7
+76:books/aw/LewisBK01:Databases and Transaction Processing  An 
Application-Oriented Approach:Philip M. Lewis Arthur J. Bernstein Michael 
Kifer:2002-01-03 Addison-Wesley 2001 0-201-70872-8
+77:books/aw/AhoKW88:The AWK Programming Language:Alfred V. Aho Brian W. 
Kernighan Peter J. Weinberger:2002-01-03 Addison-Wesley 1988
+78:books/aw/LindholmY97:The Java Virtual Machine Specification:Tim Lindholm 
Frank Yellin:2002-01-28 Addison-Wesley 1997 0-201-63452-X
+79:books/aw/AhoSU86:Compilers  Princiles, Techniques, and Tools.:Alfred V. Aho 
Ravi Sethi Jeffrey D. Ullman:2002-01-03 Addison-Wesley 1986 0-201-10088-6
+80:books/aw/Sedgewick83:Algorithms:Robert Sedgewick:2002-01-03 Addison-Wesley 
1983 0-201-06672-6
+81:journals/siamcomp/AspnesW96:Randomized Consensus in Expected O(n log² n) 
Operations Per Processor.:James Aspnes Orli Waarts:2002-01-03 1024-1044 1996 25 
SIAM J. Comput. 5 db/journals/siamcomp/siamcomp25.html#AspnesW96
+82:conf/focs/AspnesW92:Randomized Consensus in Expected O(n log ^2 n) 
Operations Per Processor:James Aspnes Orli Waarts:2006-04-25 137-146 
conf/focs/FOCS33 1992 FOCS db/conf/focs/focs92.html#AspnesW92
+83:journals/siamcomp/Bloniarz83:A Shortest-Path Algorithm with Expected Time 
O(n² log n log* n).:Peter A. Bloniarz:2002-01-03 588-600 1983 12 SIAM J. 
Comput. 3 db/journals/siamcomp/siamcomp12.html#Bloniarz83
+84:conf/stoc/Bloniarz80:A Shortest-Path Algorithm with Expected Time O(n^2 log 
n log ^* n):Peter A. Bloniarz:2006-04-25 378-384 conf/stoc/STOC12 1980 STOC 
db/conf/stoc/stoc80.html#Bloniarz80
+85:journals/siamcomp/Megiddo83a:Linear-Time Algorithms for Linear Programming 
in R³ and Related Problems.:Nimrod Megiddo:2002-01-03 759-776 1983 12 SIAM J. 
Comput. 4 db/journals/siamcomp/siamcomp12.html#Megiddo83a
+86:conf/focs/Megiddo82:Linear-Time Algorithms for Linear Programming in R^3 
and Related Problems:Nimrod Megiddo:2006-04-25 329-338 conf/focs/FOCS23 1982 
FOCS db/conf/focs/focs82.html#Megiddo82
+87:journals/siamcomp/MoffatT87:An All Pairs Shortest Path Algorithm with 
Expected Time O(n² log n).:Alistair Moffat Tadao Takaoka:2002-01-03 1023-1031 
1987 16 SIAM J. Comput. 6 db/journals/siamcomp/siamcomp16.html#MoffatT87
+88:conf/focs/MoffatT85:An All Pairs Shortest Path Algorithm with Expected 
Running Time O(n^2 log n):Alistair Moffat Tadao Takaoka:2006-04-25 101-105 
conf/focs/FOCS26 1985 FOCS db/conf/focs/focs85.html#MoffatT85
+89:conf/icip/SchonfeldL98:VORTEX  Video Retrieval and Tracking from Compressed 
Multimedia Databases.:Dan Schonfeld Dan Lelescu:2002-11-05 123-127 1998 ICIP 
(3) db/conf/icip/icip1998-3.html#SchonfeldL98
+90:conf/hicss/SchonfeldL99:VORTEX  Video Retrieval and Tracking from 
Compressed Multimedia Databases ¾ Visual Search Engine.:Dan Schonfeld Dan 
Lelescu:2002-01-03 1999 HICSS http 
//computer.org/proceedings/hicss/0001/00013/00013006abs.htm 
db/conf/hicss/hicss1999-3.html#SchonfeldL99
+91:journals/corr/abs-0802-2861:Geometric Set Cover and Hitting Sets for 
Polytopes in $R^3$:Sören Laue:2008-03-03 http //arxiv.org/abs/0802.2861 2008 
CoRR abs/0802.2861 db/journals/corr/corr0802.html#abs-0802-2861 informal 
publication
+92:conf/stacs/Laue08:Geometric Set Cover and Hitting Sets for Polytopes in 
R³.:Sören Laue:2008-03-04 2008 STACS 479-490 http 
//drops.dagstuhl.de/opus/volltexte/2008/1367 conf/stacs/2008 
db/conf/stacs/stacs2008.html#Laue08
+93:journals/iandc/IbarraJCR91:Some Classes of Languages in NC¹:Oscar H. 
Ibarra Tao Jiang Jik H. Chang Bala Ravikumar:2006-04-25 86-106 Inf. Comput. 
January 1991 90 1 db/journals/iandc/iandc90.html#IbarraJCR91
+94:conf/awoc/IbarraJRC88:On Some Languages in NC.:Oscar H. Ibarra Tao Jiang 
Bala Ravikumar Jik H. Chang:2002-08-06 64-73 1988 conf/awoc/1988 AWOC 
db/conf/awoc/awoc88.html#IbarraJRC88
+95:journals/jacm/GalilHLSW87:An O(n³log n) deterministic and an O(n³) Las 
Vegs isomorphism test for trivalent graphs.:Zvi Galil Christoph M. Hoffmann 
Eugene M. Luks Claus-Peter Schnorr Andreas Weber:2003-11-20 513-531 1987 34 J. 
ACM 3 http //doi.acm.org/10.1145/28869.28870 
db/journals/jacm/jacm34.html#GalilHLSW87
+96:conf/focs/GalilHLSW82:An O(n^3 log n) Deterministic and an O(n^3) 
Probabilistic Isomorphism Test for Trivalent Graphs:Zvi Galil Christoph M. 
Hoffmann Eugene M. Luks Claus-Peter Schnorr Andreas Weber:2006-04-25 118-125 
conf/focs/FOCS23 1982 FOCS db/conf/focs/focs82.html#GalilHLSW82
+97:journals/jacm/GalilT88:An O(n²(m + n log n)log n) min-cost flow 
algorithm.:Zvi Galil Éva Tardos:2003-11-20 374-386 1988 35 J. ACM 2 http 
//doi.acm.org/10.1145/42282.214090 db/journals/jacm/jacm35.html#GalilT88
+98:conf/focs/GalilT86:An O(n^2 (m + n log n) log n) Min-Cost Flow 
Algorithm:Zvi Galil Éva Tardos:2006-04-25 1-9 conf/focs/FOCS27 1986 FOCS 
db/conf/focs/focs86.html#GalilT86
+99:series/synthesis/2009Weintraub:Jordan Canonical Form  Theory and 
Practice:Steven H. Weintraub:2009-09-06 Jordan Canonical Form  Theory and 
Practice http //dx.doi.org/10.2200/S00218ED1V01Y200908MAS006 http 
//dx.doi.org/10.2200/S00218ED1V01Y200908MAS006 2009 Synthesis Lectures on 
Mathematics & Statistics Morgan & Claypool Publishers
+100:series/synthesis/2009Brozos:The Geometry of Walker Manifolds:Miguel 
Brozos-Vázquez Eduardo García-Río Peter Gilkey Stana Nikcevic Rámon 
Vázquez-Lorenzo:2009-09-06 The Geometry of Walker Manifolds http 
//dx.doi.org/10.2200/S00197ED1V01Y200906MAS005 http 
//dx.doi.org/10.2200/S00197ED1V01Y200906MAS005 2009 Synthesis Lectures on 
Mathematics & Statistics Morgan & Claypool Publishers

http://git-wip-us.apache.org/repos/asf/asterixdb/blob/d906bd89/asterixdb/asterix-app/data/pub-small/dblpauthors.adm
----------------------------------------------------------------------
diff --git a/asterixdb/asterix-app/data/pub-small/dblpauthors.adm 
b/asterixdb/asterix-app/data/pub-small/dblpauthors.adm
new file mode 100644
index 0000000..7e033ff
--- /dev/null
+++ b/asterixdb/asterix-app/data/pub-small/dblpauthors.adm
@@ -0,0 +1,194 @@
+{ "authors": "Aria Nosratinia" }
+{ "authors": "Cheng Soon Ong Xavier Mary Stéphane Canu Alexander J. Smola" }
+{ "authors": "Dominique Chanet Bjorn De Sutter Bruno De Bus Ludo Van Put Koen 
De Bosschere" }
+{ "authors": "Faisal N. Abu-Khzam Michael A. Langston W. Henry Suters" }
+{ "authors": "Haifeng Li Tao Jiang" }
+{ "authors": "Jean-Philippe Vert" }
+{ "authors": "Liguo Yu Srini Ramaswamy" }
+{ "authors": "Manuel Delgado" }
+{ "authors": "Min Xu Xuxian Jiang Ravi S. Sandhu Xinwen Zhang" }
+{ "authors": "Ping Wah Wong" }
+{ "authors": "Sang-Woon Kim B. John Oommen" }
+{ "authors": "William S. Frantz Charles R. Landau" }
+{ "authors": "Yoshisato Yanagisawa Kenichi Kourai Shigeru Chiba" }
+{ "authors": "Choon Hui Teo S. V. N. Vishwanathan" }
+{ "authors": "Dao-Qiang Zhang Song-Can Chen" }
+{ "authors": "Dario Colazzo Giorgio Ghelli" }
+{ "authors": "Gilles Blanchard Olivier Bousquet Laurent Zwald" }
+{ "authors": "Gregory Gutin Khee Meng Koh Eng Guan Tay Anders Yeo" }
+{ "authors": "Inderjit S. Dhillon Yuqiang Guan Brian Kulis" }
+{ "authors": "Mucuy-kak Guevara Hortensia Galeana-Sánchez" }
+{ "authors": "Ronald Minnich Matthew J. Sottile Sung-Eun Choi Erik A. Hendriks 
Jim McKie" }
+{ "authors": "Shuyuan Yang Min Wang Licheng Jiao" }
+{ "authors": "Stefan Klanke Helge Ritter" }
+{ "authors": "Tzanko Donchev Marc Quincampoix" }
+{ "authors": "Xiaohai Sun Dominik Janzing Bernhard Schölkopf" }
+{ "authors": "Yoav Etsion Dan Tsafrir Scott Kirkpatrick Dror G. Feitelson" }
+{ "authors": "Bastian Blankenburg Matthias Klusch Onn Shehory" }
+{ "authors": "Bodhisattwa Mukherjee Karsten Schwan" }
+{ "authors": "Brett D. Fleisch Mark Allan A. Co" }
+{ "authors": "Brian Kan-Wing Mak Roger Wend-Huu Hsiao Simon Ka-Lung Ho James 
T. Kwok" }
+{ "authors": "Gernot Heiser Kevin Elphinstone Ihor Kuz Gerwin Klein Stefan M. 
Petters" }
+{ "authors": "Hortensia Galeana-Sánchez Mucuy-kak Guevara" }
+{ "authors": "Khawar M. Zuberi Padmanabhan Pillai Kang G. Shin" }
+{ "authors": "Kåre J. Lauvset Dag Johansen Keith Marzullo" }
+{ "authors": "Majid Beigi Andreas Zell" }
+{ "authors": "Martin L. Hazelton" }
+{ "authors": "Masashi Sugiyama Hirotaka Hachiya Christopher Towell Sethu 
Vijayakumar" }
+{ "authors": "Meihe Xu Paul M. Thompson Arthur W. Toga" }
+{ "authors": "Nick L. Petroni Jr. Michael W. Hicks" }
+{ "authors": "Pavel P. Kuksa Pai-Hsi Huang Vladimir Pavlovic" }
+{ "authors": "Philip Derrin Kevin Elphinstone Gerwin Klein David Cock Manuel 
M. T. Chakravarty" }
+{ "authors": "Shigeo Abe" }
+{ "authors": "Stephen Plaza Valeria Bertacco" }
+{ "authors": "Amol Shukla Lily Li Anand Subramanian Paul A. S. Ward Tim 
Brecht" }
+{ "authors": "Benjamin Schrauwen Jan M. Van Campenhout" }
+{ "authors": "Christopher J. C. Burges David J. Crisp" }
+{ "authors": "Dima Kuzmin Manfred K. Warmuth" }
+{ "authors": "Gavin C. Cawley Nicola L. C. Talbot" }
+{ "authors": "Hyun-Wook Jin Sayantan Sur Lei Chai Dhabaleswar K. Panda" }
+{ "authors": "Ivor W. Tsang James T. Kwok" }
+{ "authors": "Kun-Yuan Hsieh Yung-Chia Lin Chien-Ching Huang Jenq Kuen Lee" }
+{ "authors": "Shannon R. Campbell Ronald M. Summers" }
+{ "authors": "Thanh N. Tran Ron Wehrens Lutgarde M. C. Buydens" }
+{ "authors": "Tobias Glasmachers" }
+{ "authors": "Zhiqian Wang Jezekiel Ben-Arie" }
+{ "authors": "Aviezri S. Fraenkel" }
+{ "authors": "Dhammika Elkaduwe Gerwin Klein Kevin Elphinstone" }
+{ "authors": "Eli Levin Doron S. Lubinsky" }
+{ "authors": "Jieping Ye Shuiwang Ji Jianhui Chen" }
+{ "authors": "Johnny Mariéthoz Samy Bengio" }
+{ "authors": "Martin O'Connor Brendan Tangney Vinny Cahill Neville Harris" }
+{ "authors": "Min Hu Ken Jackson Jan Janssen Stefan Vandewalle" }
+{ "authors": "Patrick Haffner" }
+{ "authors": "Shun-ichi Amari Si Wu" }
+{ "authors": "Sourangshu Bhattacharya Chiranjib Bhattacharyya Nagasuma 
Chandra" }
+{ "authors": "Thomas Röblitz Frank Mueller Oliver Bühn" }
+{ "authors": "Tony Jebara" }
+{ "authors": "Volkmar Uhlig" }
+{ "authors": "Xiaohai Sun Dominik Janzing" }
+{ "authors": "XuanLong Nguyen Martin J. Wainwright Michael I. Jordan" }
+{ "authors": "Yu-Chieh Wu Chia-Hui Chang" }
+{ "authors": "Annalisa Barla Francesca Odone Alessandro Verri" }
+{ "authors": "Cheong Hee Park Haesun Park" }
+{ "authors": "Kenji Hisazumi Tsuneo Nakanishi Teruaki Kitasuka Akira Fukuda" }
+{ "authors": "Khawar M. Zuberi Kang G. Shin" }
+{ "authors": "Marc M. Van Hulle" }
+{ "authors": "Paul E. McKenney Jack Slingwine Phil Krueger" }
+{ "authors": "Saad Ali Mubarak Shah" }
+{ "authors": "Seung-Jean Kim Alessandro Magnani Stephen P. Boyd" }
+{ "authors": "Shuichi Oikawa Ragunathan Rajkumar" }
+{ "authors": "Susan Hert Michael Hoffmann Lutz Kettner Sylvain Pion Michael 
Seel" }
+{ "authors": "Dell Zhang Robert Mao" }
+{ "authors": "Jiong Guo" }
+{ "authors": "Jiong Guo Rolf Niedermeier" }
+{ "authors": "Jun Suzuki Yutaka Sasaki Eisaku Maeda" }
+{ "authors": "Maria-Florina Balcan Avrim Blum Santosh Vempala" }
+{ "authors": "Mark Heckman Cui Zhang Brian R. Becker Dave Peticolas Karl N. 
Levitt Ronald A. Olsson" }
+{ "authors": "Norman C. Hutchinson Larry L. Peterson" }
+{ "authors": "Thomas C. M. Lee" }
+{ "authors": "Vojislav Kecman Michael Vogt Te Ming Huang" }
+{ "authors": "Weichuan Yu Gerald Sommer Kostas Daniilidis" }
+{ "authors": "Weiming Gu" }
+{ "authors": "Zhihua Zhang James T. Kwok Dit-Yan Yeung" }
+{ "authors": "Alessio Ceroni Fabrizio Costa Paolo Frasconi" }
+{ "authors": "Andrea Vedaldi Stefano Soatto" }
+{ "authors": "Corinna Cortes Mehryar Mohri" }
+{ "authors": "Diomidis Spinellis" }
+{ "authors": "Jianguo Lee Jingdong Wang Changshui Zhang Zhaoqi Bian" }
+{ "authors": "Kai Zhang James T. Kwok" }
+{ "authors": "Kazuhiro Hotta" }
+{ "authors": "Steven C. H. Hoi Rong Jin Michael R. Lyu" }
+{ "authors": "Temujin Gautama Marc M. Van Hulle" }
+{ "authors": "Vikas Sindhwani S. Sathiya Keerthi Olivier Chapelle" }
+{ "authors": "André Elisseeff Jason Weston" }
+{ "authors": "Annegret Weng" }
+{ "authors": "Antti Airola Sampo Pyysalo Jari Björne Tapio Pahikkala Filip 
Ginter Tapio Salakoski" }
+{ "authors": "Christian Poellabauer Karsten Schwan Richard West" }
+{ "authors": "Christina S. Leslie Eleazar Eskin Adiel Cohen Jason Weston 
William Stafford Noble" }
+{ "authors": "Christoph Heinz Bernhard Seeger" }
+{ "authors": "Darrin P. Lewis Tony Jebara William Stafford Noble" }
+{ "authors": "Ding-Xuan Zhou" }
+{ "authors": "Francis R. Bach" }
+{ "authors": "Francis R. Bach Michael I. Jordan" }
+{ "authors": "Francisco J. Ballesteros Christopher K. Hess Fabio Kon Sergio 
Arévalo Roy H. Campbell" }
+{ "authors": "Matthew Brand" }
+{ "authors": "Michael Engel Bernd Freisleben" }
+{ "authors": "Michael Hohmuth Hendrik Tews Shane G. Stephens" }
+{ "authors": "Rafael Serrano-Gotarredona Teresa Serrano-Gotarredona Antonio 
Acosta-Jimenez Bernabé Linares-Barranco" }
+{ "authors": "Robert Jenssen Torbjørn Eltoft" }
+{ "authors": "Songcan Chen Daoqiang Zhang" }
+{ "authors": "W. Chen" }
+{ "authors": "XuanLong Nguyen Michael I. Jordan Bruno Sinopoli" }
+{ "authors": "Zhe Wang Songcan Chen" }
+{ "authors": "Alexei Pozdnoukhov Samy Bengio" }
+{ "authors": "Arvind Seshadri Mark Luk Ning Qu Adrian Perrig" }
+{ "authors": "Benjamin Schrauwen Jan Van Campenhout" }
+{ "authors": "Bryan Ford Mike Hibler Jay Lepreau Patrick Tullmann Godmar Back 
Stephen Clawson" }
+{ "authors": "Carlos Soares Pavel Brazdil" }
+{ "authors": "Charles Crowley" }
+{ "authors": "Constance L. Heitmeyer Myla Archer Elizabeth I. Leonard John D. 
McLean" }
+{ "authors": "Gregory E. Fasshauer Joseph W. Jerome" }
+{ "authors": "Matthew Burnside Angelos D. Keromytis" }
+{ "authors": "Michel Neuhaus Horst Bunke" }
+{ "authors": "Nail Akar Khosrow Sohraby" }
+{ "authors": "Robert D. Russell Philip J. Hatcher" }
+{ "authors": "Roland Opfer" }
+{ "authors": "Samuel G. Steckley Shane G. Henderson" }
+{ "authors": "Subhransu Maji Alexander C. Berg Jitendra Malik" }
+{ "authors": "Tatsuo Nakajima Hideyuki Tokuda" }
+{ "authors": "Wim Van de Velde Johan Opsommer Erik H. D'Hollander" }
+{ "authors": "Andreas Argyriou Raphael Hauser Charles A. Micchelli 
Massimiliano Pontil" }
+{ "authors": "Arindam Choudhury Prasanth B. Nair Andy J. Keane" }
+{ "authors": "Bart Baesens Stijn Viaene Tony Van Gestel Johan A. K. Suykens 
Guido Dedene Bart De Moor Jan Vanthienen" }
+{ "authors": "Bastian Blankenburg Rajdeep K. Dash Sarvapali D. Ramchurn 
Matthias Klusch Nicholas R. Jennings" }
+{ "authors": "Brian N. Bershad" }
+{ "authors": "Cheng Soon Ong Alexander J. Smola Robert C. Williamson" }
+{ "authors": "Dit-Yan Yeung Hong Chang Guang Dai" }
+{ "authors": "Erik H. W. Meijering Karel J. Zuiderveld Max A. Viergever" }
+{ "authors": "Ernest Artiaga Albert Serra Marisa Gil" }
+{ "authors": "Francis R. Bach Gert R. G. Lanckriet Michael I. Jordan" }
+{ "authors": "Gavin C. Cawley Nicola L. C. Talbot Robert J. Foxall Stephen R. 
Dorling Danilo P. Mandic" }
+{ "authors": "Hiren D. Patel Sandeep K. Shukla" }
+{ "authors": "Hua-Yan Wang Qiang Yang Hongbin Zha" }
+{ "authors": "Hujun Yin" }
+{ "authors": "Ingo Mierswa Katharina Morik" }
+{ "authors": "Michel Gien" }
+{ "authors": "Qun Dai Songcan Chen" }
+{ "authors": "Simon Fowler Andy J. Wellings" }
+{ "authors": "Carsten Ditze" }
+{ "authors": "Jieping Ye Jianhui Chen Shuiwang Ji" }
+{ "authors": "Le-Jeng Shiue Ian Jones Jörg Peters" }
+{ "authors": "MoonSang Kwon Yookun Cho" }
+{ "authors": "Peter Druschel" }
+{ "authors": "R. Venkatesh Babu Patrick Pérez Patrick Bouthemy" }
+{ "authors": "Zheng Rong Yang" }
+{ "authors": "Bin Cao Dou Shen Jian-Tao Sun Qiang Yang Zheng Chen" }
+{ "authors": "Carl G. Looney" }
+{ "authors": "Chris H. Q. Ding Rong Jin Tao Li Horst D. Simon" }
+{ "authors": "Florent Lafarge Xavier Descombes Josiane Zerubia" }
+{ "authors": "Gregory D. Benson Ronald A. Olsson" }
+{ "authors": "Huzefa Rangwala George Karypis" }
+{ "authors": "Ingo Steinwart" }
+{ "authors": "Jason Weston Christina S. Leslie Eugene Ie Dengyong Zhou André 
Elisseeff William Stafford Noble" }
+{ "authors": "Johannes Aßfalg Karsten M. Borgwardt Hans-Peter Kriegel" }
+{ "authors": "John Penix Willem Visser Eric Engstrom Aaron Larson Nicholas 
Weininger" }
+{ "authors": "Joseph Reisinger Peter Stone Risto Miikkulainen" }
+{ "authors": "Keith Sullivan Sean Luke" }
+{ "authors": "Mark Baker Hong Ong" }
+{ "authors": "Matthias Daum Jan Dörrenbächer Sebastian Bogan" }
+{ "authors": "Sauro Menchetti Fabrizio Costa Paolo Frasconi" }
+{ "authors": "Shiliang Sun Changshui Zhang" }
+{ "authors": "Tony Van Gestel Bart Baesens Johan A. K. Suykens Dirk Van den 
Poel Dirk-Emma Baestaens Marleen Willekens" }
+{ "authors": "Volker Roth Bernd Fischer" }
+{ "authors": "YongHong Tian Tiejun Huang Wen Gao" }
+{ "authors": "Brian Kulis Sugato Basu Inderjit S. Dhillon Raymond J. Mooney" }
+{ "authors": "Chunhua Shen Anton van den Hengel Michael J. Brooks" }
+{ "authors": "Cyril Allauzen Mehryar Mohri Ameet Talwalkar" }
+{ "authors": "Francis R. Bach Romain Thibaux Michael I. Jordan" }
+{ "authors": "Greg Kuperberg" }
+{ "authors": "Guang Dai Dit-Yan Yeung" }
+{ "authors": "Guo-Jun Qi Xian-Sheng Hua Yong Rui Jinhui Tang Tao Mei Meng Wang 
Hong-Jiang Zhang" }
+{ "authors": "Holger Fröhlich Jörg K. Wegner Florian Sieker Andreas Zell" }
+{ "authors": "Italo J. Dejter Abel A. Delgado" }
+{ "authors": "Karsten M. Borgwardt Cheng Soon Ong Stefan Schönauer S. V. N. 
Vishwanathan Alexander J. Smola Hans-Peter Kriegel" }
\ No newline at end of file

http://git-wip-us.apache.org/repos/asf/asterixdb/blob/d906bd89/asterixdb/asterix-app/src/test/resources/optimizerts/ignore.txt
----------------------------------------------------------------------
diff --git a/asterixdb/asterix-app/src/test/resources/optimizerts/ignore.txt 
b/asterixdb/asterix-app/src/test/resources/optimizerts/ignore.txt
index e43a821..da02111 100644
--- a/asterixdb/asterix-app/src/test/resources/optimizerts/ignore.txt
+++ b/asterixdb/asterix-app/src/test/resources/optimizerts/ignore.txt
@@ -19,4 +19,3 @@
 distinct_aggregate.aql
 unnest_list_in_subplan.aql
 fj-phase2-with-hints.aql
-fj-dblp-csx.aql

http://git-wip-us.apache.org/repos/asf/asterixdb/blob/d906bd89/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx-hybrid.aql
----------------------------------------------------------------------
diff --git 
a/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx-hybrid.aql
 
b/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx-hybrid.aql
new file mode 100644
index 0000000..a753907
--- /dev/null
+++ 
b/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx-hybrid.aql
@@ -0,0 +1,69 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+/*
+ * Description    : Multi-way fuzzy join over three datasets (DBLP, CSX, DBLPOpen) that mixes
+ *                  star and linked conditions: $p joins $p1 and $p3 directly, and each branch
+ *                  is extended by a linked condition ($p1 ~= $p2 and $p3 ~= $p4).
+ * Success        : Yes
+ */
+drop dataverse test if exists;
+create dataverse test;
+use dataverse test;
+
+create type DBLPNestedType as closed {
+  id: int64,
+  dblpid: string,
+  title: string,
+  authors: string,
+  misc: string
+}
+
+create type DBLPType as closed {
+  nested: DBLPNestedType
+}
+
+create type CSXNestedType as closed {
+  id: int64,
+  csxid: string,
+  title: string,
+  authors: string,
+  misc: string
+}
+
+create type CSXType as closed {
+  nested: CSXNestedType
+}
+
+create dataset DBLPOpen(DBLPNestedType) primary key id;
+
+create dataset DBLP(DBLPType) primary key nested.id;
+create dataset CSX(CSXType) primary key nested.id;
+
+set import-private-functions 'true';
+set simthreshold "0.5f";
+for $p in dataset DBLP
+for $p1 in dataset CSX
+for $p2 in dataset DBLPOpen
+for $p3 in dataset CSX
+for $p4 in dataset DBLPOpen
+where gram-tokens($p.nested.title, 3, false) ~= gram-tokens($p1.nested.title, 
3, false)
+and word-tokens($p1.nested.title) ~= word-tokens($p2.title)
+and word-tokens($p.authors) ~= word-tokens($p3.nested.authors) // NOTE(review): DBLPType declares only "nested"; $p.nested.authors may be intended - confirm
+and gram-tokens($p3.nested.misc, 3, false) ~= gram-tokens($p4.misc, 3, false)
+return { "pid": $p.nested.id, "p1id": $p1.nested.id, "p2id": $p2.id, "p3id": 
$p3.nested.id, "p4id": $p4.id }

http://git-wip-us.apache.org/repos/asf/asterixdb/blob/d906bd89/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx-selflink.aql
----------------------------------------------------------------------
diff --git 
a/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx-selflink.aql
 
b/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx-selflink.aql
new file mode 100644
index 0000000..1b3f930
--- /dev/null
+++ 
b/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx-selflink.aql
@@ -0,0 +1,66 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+/*
+ * Description    : Fuzzy join on two datasets (DBLP, CSX) with a chain of linked join conditions.
+ *                  DBLP is fuzzy-joined with CSX ($p ~= $p1) and the result is propagated through
+ *                  CSX self-joins ($p1 ~= $p2, $p2 ~= $p3, $p3 ~= $p4).
+ * Success        : Yes
+ */
+drop dataverse test if exists;
+
+create dataverse test;
+
+use dataverse test;
+
+create type DBLPType as open {
+  id: int32,
+  dblpid: string,
+  title: string,
+  authors: string,
+  misc: string
+}
+
+create type CSXType as open {
+  id: int32,
+  csxid: string,
+  title: string,
+  authors: string,
+  misc: string
+}
+
+create nodegroup group1 if not exists on asterix_nc1, asterix_nc2;
+
+create dataset DBLP(DBLPType) primary key id on group1;
+create dataset CSX(CSXType) primary key id on group1;
+
+write output to asterix_nc1:'rttest/test.adm';
+
+use dataverse test; // NOTE(review): repeats the earlier "use dataverse test" - looks redundant, confirm
+set import-private-functions 'true';
+set simthreshold "0.5f";
+for $p in dataset DBLP
+for $p1 in dataset CSX
+for $p2 in dataset CSX
+for $p3 in dataset CSX
+for $p4 in dataset CSX
+where word-tokens($p.title) ~= word-tokens($p1.title)
+and word-tokens($p2.title) ~= word-tokens($p3.title)
+and gram-tokens($p1.authors, 3, false) ~= gram-tokens($p2.authors, 2, false) // NOTE(review): gram lengths differ (3 vs 2) - confirm this is intentional
+and gram-tokens($p3.misc, 3, false) ~= gram-tokens($p4.misc, 3, false)
+return { "pid":$p.id, "p1id":$p1.id, "p2id": $p2.id, "p3id": $p3.id, "p4id": 
$p4.id }

http://git-wip-us.apache.org/repos/asf/asterixdb/blob/d906bd89/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx-simple.aql
----------------------------------------------------------------------
diff --git 
a/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx-simple.aql
 
b/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx-simple.aql
new file mode 100644
index 0000000..b0beb4d
--- /dev/null
+++ 
b/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx-simple.aql
@@ -0,0 +1,54 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+ /*
+  * Description    : Two-way fuzzy join of DBLP and CSX using ~= on the word tokens of their titles; returns the matching id pairs as sid/tid. No simthreshold is set in this script.
+  * Success        : Yes
+  */
+drop dataverse fj-dblp-csx if exists;
+
+create dataverse fj-dblp-csx;
+
+use dataverse fj-dblp-csx;
+
+create type DBLPType as open {
+  id: int32,
+  dblpid: string,
+  title: string,
+  authors: string,
+  misc: string
+}
+
+create type CSXType as open {
+  id: int32,
+  csxid: string,
+  title: string,
+  authors: string,
+  misc: string
+}
+
+create nodegroup group1 if not exists on asterix_nc1, asterix_nc2;
+
+create dataset DBLP(DBLPType) primary key id on group1;
+create dataset CSX(CSXType) primary key id on group1;
+
+write output to asterix_nc1:'rttest/fj-dblp-csx.adm';
+for $s in dataset('DBLP')
+for $t in dataset('CSX')
+where word-tokens($s.title) ~= word-tokens($t.title)
+return {"sid": $s.id, "tid": $t.id}

http://git-wip-us.apache.org/repos/asf/asterixdb/blob/d906bd89/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx-star.aql
----------------------------------------------------------------------
diff --git 
a/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx-star.aql
 
b/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx-star.aql
new file mode 100644
index 0000000..df0cb86
--- /dev/null
+++ 
b/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx-star.aql
@@ -0,0 +1,69 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+/*
+ * Description    : Fuzzy join on three datasets (DBLP, CSX, DBLPOpen) where every join condition is anchored on $p from DBLP (star join).
+ *                  CSX and DBLPOpen are each used twice; the ids of all five variables are propagated onto the output.
+ * Success        : Yes
+ */
+
+drop dataverse test if exists;
+create dataverse test;
+use dataverse test;
+
+create type DBLPNestedType as closed {
+  id: int64,
+  dblpid: string,
+  title: string,
+  authors: string,
+  misc: string
+}
+
+create type DBLPType as closed {
+  nested: DBLPNestedType
+}
+
+create type CSXNestedType as closed {
+  id: int64,
+  csxid: string,
+  title: string,
+  authors: string,
+  misc: string
+}
+
+create type CSXType as closed {
+  nested: CSXNestedType
+}
+
+create dataset DBLPOpen(DBLPNestedType) primary key id;
+
+create dataset DBLP(DBLPType) primary key nested.id;
+create dataset CSX(CSXType) primary key nested.id;
+
+set import-private-functions 'true';
+set simthreshold "0.5f";
+for $p in dataset DBLP
+for $p1 in dataset CSX
+for $p2 in dataset DBLPOpen
+for $p3 in dataset CSX
+for $p4 in dataset DBLPOpen
+where word-tokens($p.nested.title) ~= word-tokens($p1.nested.title)
+and word-tokens($p.nested.authors) ~= word-tokens($p3.nested.authors)
+and word-tokens($p.nested.title) ~= word-tokens($p2.title)
+and gram-tokens($p.nested.title, 3, false) ~= gram-tokens($p4.title, 3, false)
+return { "pid": $p.nested.id, "p1id": $p1.nested.id, "p2id": $p2.id, "p3id": 
$p3.nested.id, "p4id": $p4.id }

http://git-wip-us.apache.org/repos/asf/asterixdb/blob/d906bd89/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx.aql
----------------------------------------------------------------------
diff --git 
a/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx.aql 
b/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx.aql
index 966d0b6..a79afdb 100644
--- 
a/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx.aql
+++ 
b/asterixdb/asterix-app/src/test/resources/optimizerts/queries/fj-dblp-csx.aql
@@ -45,50 +45,59 @@ create dataset CSX(CSXType) primary key id on group1;
 
 write output to asterix_nc1:'rttest/fj-dblp-csx.adm';
 
-    for $paperDBLP in dataset('DBLP')
-    let $idDBLP := $paperDBLP.id
-    let $unrankedTokensDBLP := counthashed-word-tokens($paperDBLP.title)
-    let $tokensDBLP :=
-        for $token in $unrankedTokensDBLP
-        for $tokenRanked at $i in
-            //
-            // -- - Stage 1 - --
-            //
-            // for $paper in dataset('DBLP')
-            // for $token in counthashed-word-tokens($paper.title) 
-            // group by $tokenGroupped := $token with $paper
-            // order by count($paper), $tokenGroupped
-            // return $tokenGroupped
-            for $paper in dataset('DBLP')
-            return $paper.title            
-        where $token = $tokenRanked
-        order by $i
-        return $i
-   
-    for $prefixTokenDBLP in $tokensDBLP 
+set import-private-functions 'true'
 
-    for $paperCSX in dataset('CSX')
-    let $idCSX := $paperCSX.id
-    let $unrankedTokensCSX := counthashed-word-tokens($paperCSX.title)
-    let $tokensCSX :=        
-        for $token in $unrankedTokensCSX
-        for $tokenRanked at $i in
-            //
-            // -- - Stage 1 - --
-            //
-            // for $paper in dataset('DBLP')
-            // for $token in counthashed-word-tokens($paper.title) 
-            // group by $tokenGroupped := $token with $paper
-            // order by count($paper), $tokenGroupped
-            // return $tokenGroupped
-            for $paper in dataset('DBLP')
-            return $paper.title
-        where $token = $tokenRanked
-        order by $i
-        return $i
-        
-    for $prefixTokenCSX in $tokensCSX    
-    where $prefixTokenDBLP = $prefixTokenCSX
-    group by $idDBLP := $idDBLP, $idCSX := $idCSX with $paperDBLP 
-    order by $idDBLP, $idCSX
-    return {'idDBLP': $idDBLP, 'idCSX': $idCSX}
+for $paperDBLP in dataset('DBLP')
+let $idDBLP := $paperDBLP.id
+let $unrankedTokensDBLP := counthashed-word-tokens($paperDBLP.title)
+let $lenDBLP := len($unrankedTokensDBLP)
+let $tokensDBLP :=
+    for $token in $unrankedTokensDBLP
+    for $tokenRanked at $i in
+        //
+        // -- - Stage 1 - --
+        //
+        for $paper in dataset('DBLP')
+        let $id := $paper.id
+        for $token in counthashed-word-tokens($paper.title)
+        /*+ hash */
+        group by $tokenGroupped := $token with $id
+        /*+ inmem 16 16384 */
+        order by count($id), $tokenGroupped
+        return $tokenGroupped
+    where $token = /*+ bcast */ $tokenRanked
+    order by $i
+    return $i
+for $prefixTokenDBLP in subset-collection($tokensDBLP, 0, 
prefix-len-jaccard(len($tokensDBLP), .8f))
+
+for $paperCSX in dataset('CSX')
+let $idCSX := $paperCSX.id
+let $unrankedTokensCSX := counthashed-word-tokens($paperCSX.title)
+let $lenCSX := len($unrankedTokensCSX)
+let $tokensCSX :=
+    for $token in $unrankedTokensCSX
+    for $tokenRanked at $i in
+        //
+        // -- - Stage 1 - --
+        //
+        for $paper in dataset('DBLP')
+        let $id := $paper.id
+        for $token in counthashed-word-tokens($paper.title)
+        /*+ hash */
+        group by $tokenGroupped := $token with $id
+        /*+ inmem 16 16384 */
+        order by count($id), $tokenGroupped
+        return $tokenGroupped
+    where $token = /*+ bcast */ $tokenRanked
+    order by $i
+    return $i
+let $actualPrefixLen := prefix-len-jaccard(len($unrankedTokensCSX), .8f) - 
len($unrankedTokensCSX) + len($tokensCSX)
+for $prefixTokenCSX in subset-collection($tokensCSX, 0, $actualPrefixLen)
+
+where $prefixTokenDBLP = $prefixTokenCSX
+
+/*+ hash */
+group by $idDBLP := $idDBLP, $idCSX := $idCSX with $unrankedTokensDBLP, 
$unrankedTokensCSX
+let $sim := similarity-jaccard-check($unrankedTokensDBLP[0], 
$unrankedTokensCSX[0], .8f)
+where $sim[1] >= .8f
+return {'idDBLP': $idDBLP, 'idCSX': $idCSX}

http://git-wip-us.apache.org/repos/asf/asterixdb/blob/d906bd89/asterixdb/asterix-app/src/test/resources/optimizerts/queries/similarity/jaccard-similarity-join-dual-order.aql
----------------------------------------------------------------------
diff --git 
a/asterixdb/asterix-app/src/test/resources/optimizerts/queries/similarity/jaccard-similarity-join-dual-order.aql
 
b/asterixdb/asterix-app/src/test/resources/optimizerts/queries/similarity/jaccard-similarity-join-dual-order.aql
new file mode 100644
index 0000000..d3da872
--- /dev/null
+++ 
b/asterixdb/asterix-app/src/test/resources/optimizerts/queries/similarity/jaccard-similarity-join-dual-order.aql
@@ -0,0 +1,109 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+/*
+ * Description    : Tests the plan of runtimes/fuzzyjoin/basic_1_3_1/6
+ * Success        : Yes
+ */
+
+drop dataverse fuzzyjoin_basic if exists; // start from a clean dataverse
+
+create dataverse fuzzyjoin_basic;
+
+use dataverse fuzzyjoin_basic;
+
+create type BasicType as closed { // closed type declaring exactly the two fields below
+    id: uuid,
+    authors: string
+}
+// Both join inputs share BasicType and use an autogenerated uuid primary key.
+create dataset left(BasicType) primary key id autogenerated;
+create dataset right(BasicType) primary key id autogenerated;
+// Output file is named after this test so it does not collide with the right-ahead test.
+write output to asterix_nc1:"rttest/jaccard-similarity-join-dual-order.adm";
+
+set import-private-functions 'true'
+
+for $right in dataset('right')
+let $idRight := $right.id
+let $tokensUnrankedRight := word-tokens($right.authors)
+let $lenRight := len($tokensUnrankedRight)
+let $tokensRight := // positions ($i) of this record's tokens in the Stage 1 ordering, ascending
+    for $tokenUnranked in $tokensUnrankedRight
+    for $tokenRanked at $i in
+        // Token ordering used to rank this record's tokens:
+        // -- - Stage 1 - --
+        // tokens found in both 'right' and 'left', ordered by $r.rc * $l.lc.
+        for $r in
+            for $orderRight in dataset('right')
+            let $rightId := $orderRight.id
+            for $orderTokenRight in word-tokens($orderRight.authors)
+                /*+ hash */ group by $tokenRightGrouped := $orderTokenRight 
with $rightId
+            return {"rt": $tokenRightGrouped, "rc": count($rightId)} // token and its group count in 'right'
+        for $l in
+            for $orderLeft in dataset('left')
+            let $leftId := $orderLeft.id
+            for $orderTokenLeft in word-tokens($orderLeft.authors)
+                /*+ hash */ group by $tokenLeftGrouped := $orderTokenLeft with 
$leftId
+            return {"lt": $tokenLeftGrouped, "lc": count($leftId)} // token and its group count in 'left'
+        where $r.rt = $l.lt
+        /*+ inmem 1 302 */ order by $r.rc * $l.lc
+        return $r.rt
+
+    where $tokenUnranked = /*+ bcast */ $tokenRanked
+    order by $i
+    return $i
+for $prefixTokenRight in subset-collection($tokensRight, 0, 
prefix-len-jaccard(len($tokensRight), .8f))
+// NOTE(review): the prefix length above uses len($tokensRight) (ranked), whereas the left side adjusts from the unranked length - confirm this asymmetry is intended.
+for $left in dataset('left')
+let $idLeft := $left.id
+let $tokensUnrankedLeft := word-tokens($left.authors)
+let $lenLeft := len($tokensUnrankedLeft)
+let $tokensLeft := // positions ($i) of this record's tokens in the same Stage 1 ordering, ascending
+    for $tokenUnranked in $tokensUnrankedLeft
+    for $tokenRanked at $i in
+        // Same token-ordering subquery as on the right side:
+        // -- - Stage 1 - --
+        // tokens found in both 'right' and 'left', ordered by $r.rc * $l.lc.
+        for $r in
+            for $orderRight in dataset('right')
+            let $rightId := $orderRight.id
+            for $orderTokenRight in word-tokens($orderRight.authors)
+                /*+ hash */ group by $tokenRightGrouped := $orderTokenRight 
with $rightId
+            return {"rt": $tokenRightGrouped, "rc": count($rightId)} // token and its group count in 'right'
+        for $l in
+            for $orderLeft in dataset('left')
+            let $leftId := $orderLeft.id
+            for $orderTokenLeft in word-tokens($orderLeft.authors)
+                /*+ hash */ group by $tokenLeftGrouped := $orderTokenLeft with 
$leftId
+            return {"lt": $tokenLeftGrouped, "lc": count($leftId)} // token and its group count in 'left'
+        where $r.rt = $l.lt
+        /*+ inmem 1 302 */ order by $r.rc * $l.lc
+        return $r.rt
+
+    where $tokenUnranked = /*+ bcast */ $tokenRanked
+    order by $i
+    return $i
+let $actualPrefixLen := prefix-len-jaccard(len($tokensUnrankedLeft), .8f) - 
len($tokensUnrankedLeft) + len($tokensLeft) // prefix length for the unranked count, reduced by the tokens that got no rank
+for $prefixTokenLeft in subset-collection($tokensLeft, 0, $actualPrefixLen)
+// Candidate pairs are records that share at least one prefix token; each candidate is then checked via $sim.
+where $prefixTokenRight = $prefixTokenLeft
+let $sim := similarity-jaccard-prefix($lenRight, $tokensRight, $lenLeft, 
$tokensLeft, $prefixTokenLeft, .8f)
+where $sim >= .8f
+/*+ hash*/ group by $idRight := $idRight, $idLeft := $idLeft with $sim
+return {'idDBLP': $idRight, 'idCSX': $idLeft, "sim": $sim[0]} // one row per (idRight, idLeft); $sim[0] is the first grouped value

http://git-wip-us.apache.org/repos/asf/asterixdb/blob/d906bd89/asterixdb/asterix-app/src/test/resources/optimizerts/queries/similarity/jaccard-similarity-join-right-ahead.aql
----------------------------------------------------------------------
diff --git 
a/asterixdb/asterix-app/src/test/resources/optimizerts/queries/similarity/jaccard-similarity-join-right-ahead.aql
 
b/asterixdb/asterix-app/src/test/resources/optimizerts/queries/similarity/jaccard-similarity-join-right-ahead.aql
new file mode 100644
index 0000000..661ce00
--- /dev/null
+++ 
b/asterixdb/asterix-app/src/test/resources/optimizerts/queries/similarity/jaccard-similarity-join-right-ahead.aql
@@ -0,0 +1,89 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+/*
+ * Description    : Tests the plan of runtimes/fuzzyjoin/basic_1_3_1/5
+ * Success        : Yes
+ */
+
+drop dataverse fuzzyjoin_basic if exists; // start from a clean dataverse
+
+create dataverse fuzzyjoin_basic;
+
+use dataverse fuzzyjoin_basic;
+
+create type BasicType as closed { // closed type declaring exactly the two fields below
+    id: uuid,
+    authors: string
+}
+// Both join inputs share BasicType and use an autogenerated uuid primary key.
+create dataset left(BasicType) primary key id autogenerated;
+create dataset right(BasicType) primary key id autogenerated;
+// Output file is named after this test.
+write output to asterix_nc1:"rttest/jaccard-similarity-join-right-ahead.adm";
+
+set import-private-functions 'true'
+
+for $right in dataset('right')
+let $idRight := $right.id
+let $tokensUnrankedRight := word-tokens($right.authors)
+let $lenRight := len($tokensUnrankedRight)
+let $tokensRight := // positions ($i) of this record's tokens in the Stage 1 ordering, ascending
+    for $tokenUnranked in $tokensUnrankedRight
+    for $tokenRanked at $i in
+        // Token ordering built from dataset 'right' only:
+        // -- - Stage 1 - --
+        // tokens grouped across all 'right' records, ordered by count($rightId).
+        for $orderRight in dataset('right')
+        let $rightId := $orderRight.id
+        for $orderTokenRight in word-tokens($orderRight.authors)
+            /*+ hash */ group by $tokenRightGrouped := $orderTokenRight with 
$rightId
+        /*+ inmem 1 302 */ order by count($rightId)
+        return $tokenRightGrouped
+    where $tokenUnranked = /*+ bcast */ $tokenRanked
+    order by $i
+    return $i
+for $prefixTokenRight in subset-collection($tokensRight, 0, 
prefix-len-jaccard(len($tokensRight), .8f))
+// Left side: tokens of 'left' records are ranked against the same ordering, which is built from 'right'.
+for $left in dataset('left')
+let $idLeft := $left.id
+let $tokensUnrankedLeft := word-tokens($left.authors)
+let $lenLeft := len($tokensUnrankedLeft)
+let $tokensLeft := // positions ($i) of this record's tokens in the 'right'-based ordering, ascending
+    for $tokenUnranked in $tokensUnrankedLeft
+    for $tokenRanked at $i in
+        // Same token-ordering subquery as on the right side (it reads 'right', not 'left'):
+        // -- - Stage 1 - --
+        // tokens grouped across all 'right' records, ordered by count($rightId).
+        for $orderRight in dataset('right')
+        let $rightId := $orderRight.id
+        for $orderTokenRight in word-tokens($orderRight.authors)
+            /*+ hash */ group by $tokenRightGrouped := $orderTokenRight with 
$rightId
+        /*+ inmem 1 302 */ order by count($rightId)
+        return $tokenRightGrouped
+    where $tokenUnranked = /*+ bcast */ $tokenRanked
+    order by $i
+    return $i
+let $actualPrefixLen := prefix-len-jaccard(len($tokensUnrankedLeft), .8f) - 
len($tokensUnrankedLeft) + len($tokensLeft) // prefix length for the unranked count, reduced by the tokens that got no rank
+for $prefixTokenLeft in subset-collection($tokensLeft, 0, $actualPrefixLen)
+// Candidate pairs are records that share at least one prefix token; each candidate is then checked via $sim.
+where $prefixTokenRight = $prefixTokenLeft
+let $sim := similarity-jaccard-prefix($lenRight, $tokensRight, $lenLeft, 
$tokensLeft, $prefixTokenLeft, .8f)
+where $sim >= .8f
+/*+ hash*/ group by $idRight := $idRight, $idLeft := $idLeft with $sim
+return {'idDBLP': $idRight, 'idCSX': $idLeft, "sim": $sim[0]} // one row per (idRight, idLeft); $sim[0] is the first grouped value

Reply via email to