Wenhai Li has uploaded a new change for review. https://asterix-gerrit.ics.uci.edu/3008
Change subject: Test the comparablity of fuzzyjoin. ...................................................................... Test the comparablity of fuzzyjoin. The following commits from your working branch will be included: commit a924f718b2537c856bfd470f622d8fb8879f1e07 Merge: f6aeca5 2a42da45 Author: Michael <lwhay...@gmail.com> Date: Fri Oct 26 13:36:12 2018 -0700 Merge branch 'master' into fuzzy commit f6aeca5f21dfc91497b2f718815353149cd4ff03 Merge: e237045 80225e2 Author: Michael <lwhay...@gmail.com> Date: Fri Oct 26 13:35:08 2018 -0700 Merge branch 'master' into fuzzy commit e237045dbcbd17bc6344d298027152b9da4ec982 Merge: 9a1a68b 1aeb8b6 Author: Michael <lwhay...@gmail.com> Date: Fri Sep 28 10:02:08 2018 -0700 Merge branch 'master' into fuzzy commit 9a1a68b560c9abd30fc3c44a67c3f578a8ab9227 Merge: aa39e75 b71d9ff Author: Michael <lwhay...@gmail.com> Date: Fri Sep 21 09:56:39 2018 -0700 Merge branch 'master' into fuzzy commit aa39e75a89bda84a3ff63545b166a0611c299def Merge: 5d5afc1 42f17d2 Author: Michael <lwhay...@gmail.com> Date: Fri Sep 7 10:13:50 2018 -0700 Merge branch 'master' into fuzzy commit 5d5afc19067e3909a887cc86c7917b79be885467 Merge: 8fbe7cc 8bf93fa Author: Michael <lwhay...@gmail.com> Date: Fri Aug 31 09:16:55 2018 -0700 Merge branch 'master' into fuzzy commit 8fbe7cc54e570c71306f95040cd015482981011c Merge: b11a785 90114df Author: Michael <lwhay...@gmail.com> Date: Fri Aug 24 10:55:16 2018 -0700 Merge branch 'master' into fuzzy commit b11a785df47fc4a7ea69611f54bf32d7151ae606 Merge: f252acc 13860fb Author: Michael <lwhay...@gmail.com> Date: Mon Aug 13 09:48:42 2018 -0700 Merge branch 'master' into fuzzy commit f252acc3eec2546bfc403c3fb2e2fa26f3383e20 Merge: aa57719 31d03f0 Author: Michael <lwhay...@gmail.com> Date: Fri Aug 10 09:38:53 2018 -0700 Merge branch 'master' into fuzzy commit aa57719117ee94162a5aba521c8657ae136bce5b Merge: 4d7c16c 0a2fb11 Author: Michael <lwhay...@gmail.com> Date: Wed Aug 8 02:45:56 2018 -0700 Merge branch 'master' into 
fuzzy commit 4d7c16c702325aee6aa871bedb92aa128107a409 Merge: 7f4f7ac 5de12d0 Author: Michael <lwhay...@gmail.com> Date: Fri Aug 3 09:37:03 2018 -0700 Merge branch 'master' into fuzzy commit 7f4f7ac2b4d54f2ef2492b248c1184e200bbbf9c Merge: db30fa8 6b1b52c Author: Michael <lwhay...@gmail.com> Date: Sat Jul 28 09:14:26 2018 -0700 Merge branch 'master' into fuzzy commit db30fa8f10b007d44ea03321ccacc63d1ed95fc8 Merge: 4c3af5f 428a5ee Author: Michael <lwhay...@gmail.com> Date: Fri Jul 27 10:53:56 2018 -0700 Merge branch 'master' into fuzzy commit 4c3af5f0347b361b92bf1a8871cfc46652e81095 Merge: a919ce3 072da02 Author: Michael <lwhay...@gmail.com> Date: Tue Jul 24 09:12:07 2018 -0700 Merge branch 'master' into fuzzy commit a919ce354053cbd90b3019bbe7f62f092388169d Merge: 0f867e3 9a98768 Author: Michael <lwhay...@gmail.com> Date: Fri Jul 20 14:20:58 2018 -0700 Merge branch 'master' into fuzzy commit 0f867e32b070b9b2dfa77bf0aadbe18d628c9f26 Merge: 57785ff 0f6df16 Author: Michael <lwhay...@gmail.com> Date: Sun Jul 15 02:51:10 2018 -0700 Merge branch 'master' into fuzzy commit 57785ff1614ec2177fbd053f4d630b50f5a14127 Merge: 0974fd7 0d7974f Author: Michael <lwhay...@gmail.com> Date: Fri Jul 13 03:26:41 2018 -0700 Merge branch 'master' into fuzzy commit 0974fd783d4fdd928b6fae7f153a714d350b8c1a Merge: c3f8654 aae5753 Author: Michael <lwhay...@gmail.com> Date: Fri Jul 6 10:15:40 2018 -0700 Merge branch 'master' into fuzzy commit c3f86546bedcf8bb09abf23c5f8e68ed699938f0 Merge: 173dd2a 9087e0b Author: Michael <lwhay...@gmail.com> Date: Fri Jun 29 09:59:21 2018 -0700 Merge branch 'master' into fuzzy commit 173dd2aa1a855b4d1bc252926ef57b71f1b89948 Merge: bc6ab30 4ba23de Author: Michael <lwhay...@gmail.com> Date: Fri Jun 22 10:06:01 2018 -0700 Merge branch 'master' into fuzzy commit bc6ab3084c26ab169e3803e31365a5689848ff33 Merge: c8ddc9c 8d04d7d Author: Michael <lwhay...@gmail.com> Date: Wed Jun 20 11:29:47 2018 -0700 Merge branch 'master' into fuzzy commit 
c8ddc9c76841e3b9c5730e9c0ec1d29ee2a6d1ff Merge: a9a6167 1bdf808 Author: Michael <lwhay...@gmail.com> Date: Fri Jun 15 10:07:45 2018 -0700 Merge branch 'master' into fuzzy commit a9a61673ed1eb33c82e361ce6f784b951f98cf8d Merge: 4ea5cb3 e7422b0 Author: Michael <lwhay...@gmail.com> Date: Fri Jun 8 09:56:42 2018 -0700 Merge branch 'master' into fuzzy commit 4ea5cb340f4ce82d2991bc5a193aabab2ea8a1dc Merge: eb1af35 13632a7 Author: Michael <lwhay...@gmail.com> Date: Fri Jun 1 10:18:22 2018 -0700 Merge branch 'master' into fuzzy commit eb1af35a8a99d80de9e3b7fed03085fd481381be Merge: d165d95 af17baa Author: Michael <lwhay...@gmail.com> Date: Sat May 26 10:16:23 2018 -0700 Merge branch 'master' into fuzzy commit d165d95715463a54ec9042351c2ae63fc2923e88 Merge: a7732c7 c7eb0c5 Author: Michael <lwhay...@gmail.com> Date: Fri May 25 10:13:24 2018 -0700 Merge branch 'master' into fuzzy commit a7732c78b7d783603cdc6f2784c974bcadf91c9d Merge: 3d1781b 1a6de0b Author: Michael <lwhay...@gmail.com> Date: Fri May 18 01:01:04 2018 +0800 Merge branch 'master' into fuzzy commit 3d1781b1b7a7148858caba896e56bd36de2bab85 Merge: 159dbcb 1b0bbad Author: Michael <lwhay...@gmail.com> Date: Fri May 11 22:51:08 2018 +0800 Merge branch 'master' into fuzzy commit 159dbcb2ce81cca49ea4688c9261df898c8c130c Author: Michael <lwhay...@gmail.com> Date: Mon Apr 30 09:45:47 2018 -0700 Add results for counthashed-word-tokens. commit 94deadf295d9bfcbb1e6e4b3031378e218f7d761 Author: Michael <lwhay...@gmail.com> Date: Mon Apr 30 09:43:59 2018 -0700 Add function test for counthashed-word-tokens. commit faf7a5224e1563c3b42f8a62ae1e02cde92e50c9 Merge: a930ded 9410ddd Author: Michael <lwhay...@gmail.com> Date: Sat Apr 28 08:14:24 2018 -0700 Merge branch 'master' into fuzzy commit a930dedc45a7e7427850e8bd57b01acec0662041 Merge: 363601b 6f75f05 Author: Michael <lwhay...@gmail.com> Date: Fri Apr 20 11:29:11 2018 -0700 Fired the replicate case in high level. 
commit 363601b480bb935c5695835e95568428bef540e1 Merge: 5079fd4 aac1e93 Author: Michael <lwhay...@gmail.com> Date: Fri Apr 13 09:48:17 2018 -0700 Merge branch 'master' into fuzzy commit 5079fd4ba0ee423cd3d80c9287e902d8822282db Merge: 5059c3a c1f39fe Author: Michael <lwhay...@gmail.com> Date: Thu Apr 12 06:44:00 2018 -0700 Merge branch 'master' into fuzzy commit 5059c3a176f0c0d98aaf4172c075fdb84c055418 Merge: 433c9ad b001400 Author: Michael <lwhay...@gmail.com> Date: Fri Apr 6 10:19:14 2018 -0700 Merge branch 'master' into fuzzy commit 433c9add04de3992fa29b9e89b5b588633b113e6 Author: Michael <lwhay...@gmail.com> Date: Fri Mar 30 10:51:34 2018 -0700 Wrong plan for self join. commit 8d619ad24b2eab272b1bd59f176ce1fa0a82421b Merge: 3ab2554 3036c98 Author: Michael <lwhay...@gmail.com> Date: Fri Mar 30 09:19:17 2018 -0700 Merge branch 'master' into fuzzy commit 3ab2554225a6cba4c5ce3af46061f8145c594fe9 Merge: 8f4b087 8aa13ca Author: Michael <lwhay...@gmail.com> Date: Fri Mar 23 10:51:01 2018 -0700 Merge branch 'master' into fuzzy commit 8f4b08744dfabb46df1f197426ca0726503b7f0f Merge: 2193ab8 e455287 Author: Michael <lwhay...@gmail.com> Date: Fri Mar 23 10:50:36 2018 -0700 Merge branch 'master' into fuzzy commit 2193ab82e700b5ff811fadbf44c09956339c966b Merge: fc185cb d8d4eef Author: Michael <lwhay...@gmail.com> Date: Fri Jan 19 04:16:48 2018 -0800 Merge branch 'master' into fuzzy commit fc185cb7cfc2ff71e81c236d51cf45fd7461f30f Merge: 1ff8967 94aa28c Author: Michael <lwhay...@gmail.com> Date: Fri Jan 19 04:16:16 2018 -0800 Merge branch 'master' into fuzzy commit 1ff896717124a897ac17568f93887d1a7ddfff65 Merge: 36e0cc6 6a58866 Author: Michael <lwhay...@gmail.com> Date: Fri Jan 12 08:08:21 2018 -0800 Merge branch 'master' into fuzzy commit 36e0cc64b89c13158ac160586ba245f544e85c90 Author: Michael <lwhay...@gmail.com> Date: Fri Jan 12 07:24:50 2018 -0800 Split the fuzzy query test cases. 
commit ba0be5b9719671cf074f9c1fb7a4f3546239b17a Merge: 2825b97 b4d166b Author: Michael <lwhay...@gmail.com> Date: Mon Dec 18 06:19:02 2017 -0800 Merge branch 'master' into fuzzy commit 2825b977f4b39b557d04f3e651df4a59b5a6a546 Author: Michael <lwhay...@gmail.com> Date: Sat Dec 16 05:29:52 2017 -0800 Remove the white space. commit f1f704a23c6f086c7b546690063dc8e6acc12d0a Merge: b79e9f7 ed50308 Author: Michael <lwhay...@gmail.com> Date: Fri Dec 15 23:58:28 2017 -0800 Merge branch 'master' into fuzzy commit b79e9f7c2d7b15f3a4219050332acb7eb68bf571 Merge: 62fe029 62b4a02 Author: Michael <lwhay...@gmail.com> Date: Fri Dec 15 10:54:17 2017 -0800 Merge branch 'master' into fuzzy commit 62fe0293994fceacf45ca965978d4023557728b1 Merge: 8569f77 204b295 Author: Michael <lwhay...@gmail.com> Date: Fri Dec 8 07:48:58 2017 -0800 Merge branch 'master' into fuzzy commit 8569f77278f56800f73cc9a21a9066d2c23ef700 Merge: d420379 3180d87 Author: Michael <lwhay...@gmail.com> Date: Tue Dec 5 21:32:51 2017 -0800 Merge branch 'master' into fuzzy commit d42037953babcd03b766c6a308c35617b40f2a9e Merge: a34df16 f3aa19f Author: Michael <lwhay...@gmail.com> Date: Sat Dec 2 03:50:58 2017 -0800 Merge branch 'master' into fuzzy commit a34df16680ef392c7ad50a7f86fd8ae240d7ba8c Merge: f8825cf 50de666 Author: Michael <lwhay...@gmail.com> Date: Fri Dec 1 10:24:25 2017 -0800 Merge branch 'master' into fuzzy commit f8825cfb6ec8cf82a200e8576655138b0de4cace Merge: ff106dc 6b765f3 Author: Michael <lwhay...@gmail.com> Date: Wed Nov 29 20:40:17 2017 -0800 Merge branch 'master' into fuzzy commit ff106dcda941d9fd9a8a08995106168a160a5761 Merge: 07d86b7 98b9d60 Author: Michael <lwhay...@gmail.com> Date: Sat Nov 25 22:06:19 2017 -0800 Merge branch 'master' into fuzzy commit 07d86b767a09e16ea3f86f85b040c9e2cbe4d6ea Merge: 5aebf42 4dad5df Author: Michael <lwhay...@gmail.com> Date: Wed Nov 22 23:46:25 2017 -0800 Merge branch 'master' into fuzzy commit 5aebf42f4dc95104e2eac8326518b4db00568fb0 Author: Michael 
<lwhay...@gmail.com> Date: Fri Nov 10 08:50:51 2017 -0800 Remove the multiple simjoin for memory checking. commit d81e42f4f3c5aee5d24ff9c93589cd9f4b6d4b51 Merge: 63dc211 23761dd Author: Michael <lwhay...@gmail.com> Date: Fri Nov 10 02:47:09 2017 -0800 Merge branch 'master' into fuzzy commit 63dc21125cd67860db27697b648496d920309a85 Merge: 7889d1d eadeaf5 Author: Michael <lwhay...@gmail.com> Date: Tue Nov 7 05:25:15 2017 -0800 Merge branch 'master' into fuzzy commit 7889d1da1507ee33eddd78157c45e240b47bdb9f Merge: 3bf34fb 52e5134 Author: Michael <lwhay...@gmail.com> Date: Fri Nov 3 10:48:23 2017 -0700 Merge branch 'master' into fuzzy commit 3bf34fb1b81097b05a491d3bd7830e9a51a98f0e Merge: 23282d4 fbf3c0a Author: Michael <lwhay...@gmail.com> Date: Fri Nov 3 10:01:21 2017 -0700 Merge branch 'master' into fuzzy commit 23282d4c7086c51f10e30f75851ac4d7967406a9 Merge: f4010f4 9782f8a Author: Michael <lwhay...@gmail.com> Date: Fri Oct 20 23:55:28 2017 -0700 Merge branch 'master' into fuzzy commit f4010f49a57d14b3452a55ddd650d46aa319f91f Merge: c407c07 a5b37d6 Author: Michael <lwhay...@gmail.com> Date: Fri Oct 20 23:04:18 2017 -0700 Merge branch 'master' into fuzzy commit c407c0799f2c7f295da1c239c1920d6673ff1830 Merge: 2689238 a14cebb Author: Michael <lwhay...@gmail.com> Date: Sun Aug 6 10:31:20 2017 -0700 Merge branch 'master' into fuzzy commit 26892380596ac793e3835284f484f0d7012cfbbe Merge: 2464015 3c07fe5 Author: Michael <lwhay...@gmail.com> Date: Sat Jun 10 08:04:03 2017 -0700 Merge branch 'master' into fuzzy commit 24640150c92ea09bf0bd230fe8ab7e410b1deff0 Merge: fdd32ff 1bba5bc Author: Michael <lwhay...@gmail.com> Date: Fri Jun 9 06:11:41 2017 -0700 Merge branch 'master' into fuzzy commit fdd32fff6772123589f6aede45cea7e1e73cbefb Merge: 70b7858 1be612a Author: Michael <lwhay...@gmail.com> Date: Fri Jun 2 00:24:15 2017 -0700 Merge branch 'master' into fuzzy commit 70b7858467041044c841b94fa9e9f523b2c6d482 Merge: 4490903 bacf0c5 Author: Michael <lwhay...@gmail.com> Date: Thu 
May 11 21:12:29 2017 -0700 Merge branch 'master' into fuzzy commit 44909030562677f48556456d8aff1fc5a129dda1 Author: Michael <lwhay...@gmail.com> Date: Thu May 11 18:31:24 2017 -0700 Remove the inmem hint in sj. commit 4e00f7ec38ddacd9212fb435c0feac268a5795e1 Author: Michael <lwhay...@gmail.com> Date: Sun May 7 00:55:44 2017 -0700 Add the optimized order cases in opttest. commit e5c7006d05b05ced98b365025f0b24b2a167cced Author: Michael <lwhay...@gmail.com> Date: Sat May 6 23:07:15 2017 -0700 Add the Optimzed global token order test case. commit 291a41537ce7002cfe5c206231d345af013aadec Author: Michael <lwhay...@gmail.com> Date: Sat May 6 02:38:36 2017 -0700 Remove the exception finder cases of suffix filter. commit c3d3b4ff7d513ab42ca1badeeac991a75a939966 Merge: 47edf1f f086893 Author: Michael <lwhay...@gmail.com> Date: Fri May 5 21:22:30 2017 -0700 Merge branch 'master' into fuzzy commit 47edf1f996c32a6e8f7511a022d0f9cbcb9954ee Author: Michael <lwhay...@gmail.com> Date: Fri May 5 21:21:42 2017 -0700 Fix the suffix filter. commit e5c4335a7e37dfb96680c2fd385465927fcc6c96 Merge: 6534e3d 01a55f8 Author: Michael <lwhay...@gmail.com> Date: Fri May 5 09:18:50 2017 -0700 Merge branch 'master' into fuzzy commit 6534e3d7baa9d170c93f2303740e777201927cd5 Author: Michael <lwhay...@gmail.com> Date: Fri May 5 09:18:04 2017 -0700 Reduce the threshold to reproduce the consistency. commit 86a9b4e1e5f582a09e16ac2c50f9cd5856eff37d Author: Michael <lwhay...@gmail.com> Date: Thu May 4 11:37:55 2017 -0700 Fix the suffix filter. 
commit 8b3e903097515593970b3d5149dc8744a00f6f67 Merge: 2d16a15 b58572a Author: Michael <lwhay...@gmail.com> Date: Wed Apr 26 11:17:32 2017 -0700 Merge branch 'master' into fuzzy commit 2d16a15c2d25fc42b06f4f427715314be5703ea3 Merge: d0c7ff2 d0baeed Author: Michael <lwhay...@gmail.com> Date: Thu Apr 20 00:09:36 2017 -0700 Merge branch 'master' into fuzzy commit d0c7ff2faca2addf7e9f701a10f148bd83a36ca5 Merge: c2f32d8 f2c6c7a Author: Michael <lwhay...@gmail.com> Date: Fri Apr 14 09:01:04 2017 -0700 Merge branch 'master' into fuzzy commit c2f32d8d5127d8827b9a1589df4f30c216e781e3 Merge: 0716d5f 5e9e92b Author: Michael <lwhay...@gmail.com> Date: Wed Apr 12 20:57:31 2017 -0700 Merge branch 'master' into fuzzy commit 0716d5f164b58a6e7cf082d880a0196b6121866f Author: Michael <lwhay...@gmail.com> Date: Wed Apr 12 09:17:47 2017 -0700 Remove QS problems. commit 955557e424daf35bae1250f1174de731a64c98e4 Author: Michael <lwhay...@gmail.com> Date: Wed Apr 12 03:31:06 2017 -0700 Use right side as probe. commit 66e117f9a34c9600756d96cdfe57d54217947db5 Merge: b480d77 ed15d46 Author: Michael <lwhay...@gmail.com> Date: Wed Apr 12 02:15:00 2017 -0700 Merge branch 'master' into fuzzy commit b480d77d7b06ca80e644e6dbfbebac62788e7eda Author: Michael <lwhay...@gmail.com> Date: Wed Apr 12 02:13:12 2017 -0700 use similarity-jaccard-prefix instead of similarity-jaccard-check. 
commit 0c66cdd2537584402e095be63a8649af1015c592 Merge: 6727ca3 96fd402 Author: Michael <lwhay...@gmail.com> Date: Tue Apr 11 08:17:56 2017 -0700 Merge branch 'master' into fuzzy commit 6727ca3681fd23f75c2033c0ff8963ae91c74da8 Merge: 33f49d1 5ad0f73 Author: Michael <lwhay...@gmail.com> Date: Sun Apr 9 10:09:13 2017 -0700 Merge branch 'master' into fuzzy commit 33f49d1481653bb5f6ce26005e557bc4bae2adc3 Merge: 11eea52 246fbde Author: Michael <lwhay...@gmail.com> Date: Fri Apr 7 07:17:38 2017 -0700 Merge branch 'master' into fuzzy commit 11eea52c7fa57d3fdb668e00185b106a9323b104 Author: Michael <lwhay...@gmail.com> Date: Fri Apr 7 07:16:59 2017 -0700 Change the threshold. commit 69807be8db71fc0aeb1e40ff59f5d29944ed9916 Merge: 149fb75 05e4256 Author: Michael <lwhay...@gmail.com> Date: Wed Apr 5 07:48:22 2017 -0700 Merge branch 'master' into fuzzy commit 149fb7583313d60f8eff04c3133b25ca1cc48ac9 Merge: 3345aad 4d3cec7 Author: Michael <lwhay...@gmail.com> Date: Sat Apr 1 02:26:28 2017 -0700 Merge branch 'master' into fuzzy commit 3345aadaac8d0a89f3d61974c9b0e464ba20d9c9 Author: Michael <lwhay...@gmail.com> Date: Sat Apr 1 02:22:28 2017 -0700 Add testcase for similarity-jaccard-check issue. 
commit a7f60f272bace393dac570559236a8e62370c9d7 Merge: a63c52a 8e94744 Author: Michael <lwhay...@gmail.com> Date: Mon Mar 27 08:02:47 2017 -0700 Merge branch 'master' into fuzzy commit a63c52a26d64b4ee872024ea47c39b9d8a8ef134 Merge: 754a040 7d554fc Author: Michael <lwhay...@gmail.com> Date: Thu Mar 23 01:10:39 2017 -0700 Merge branch 'master' into fuzzy commit 754a0406639c9e2619344312826dc9abf92941b3 Merge: e0a9276 653386a Author: Michael <lwhay...@gmail.com> Date: Wed Mar 22 09:30:29 2017 -0700 Merge branch 'master' into fuzzy commit e0a9276cf03a5f430caf45eecd419ea3fbf265ba Merge: e0d33bd 58e0184 Author: Michael <lwhay...@gmail.com> Date: Fri Mar 17 02:34:45 2017 -0700 Merge branch 'master' into fuzzy commit e0d33bdcb37fe7d26b59d6b9079612fac4cbc14b Merge: 57f3f7f 050f509 Author: Michael <lwhay...@gmail.com> Date: Wed Mar 15 09:04:04 2017 -0700 Merge branch 'master' into fuzzy commit 57f3f7f81de884c9c15947678b7ad1665d257700 Merge: 86308aa 89328a8 Author: Michael <lwhay...@gmail.com> Date: Tue Mar 14 10:13:46 2017 -0700 Merge branch 'master' into fuzzy commit 86308aab0d5860c1048037213173e74ce157e3fd Merge: d53040e 61401f9 Author: Michael <lwhay...@gmail.com> Date: Sun Mar 12 23:57:09 2017 -0700 Merge branch 'master' into fuzzy commit d53040ebc61f48bc6a3ca8055e7d6ff14a08487d Merge: f9896b8 a7fad19 Author: Michael <lwhay...@gmail.com> Date: Fri Mar 10 11:25:00 2017 -0800 Merge branch 'master' into fuzzy commit f9896b891bd14b5c5b7437cd543bde4fc99b3b46 Merge: 4995c9c 953eb96 Author: Michael <lwhay...@gmail.com> Date: Fri Mar 10 07:16:02 2017 -0800 Merge branch 'master' into fuzzy commit 4995c9cd3b9e185e938843154ee7fee1cc27d872 Merge: 9033233 2fe1d18 Author: Michael <lwhay...@gmail.com> Date: Thu Mar 9 05:26:28 2017 -0800 Merge branch 'master' into fuzzy commit 90332332181018bb67d50b0ae6b6a136c498377d Merge: aebd2bb 31d8102 Author: Michael <lwhay...@gmail.com> Date: Wed Mar 8 00:34:10 2017 -0800 Merge branch 'master' into fuzzy commit 
aebd2bb00bf8a3617682b0408af234ad859d9b0a Merge: 27625b4 4d7a17d Author: Michael <lwhay...@gmail.com> Date: Tue Mar 7 07:32:28 2017 -0800 Merge branch 'master' into fuzzy commit 27625b46a095430f106be6ccd717f0ad674d86b3 Merge: df28903 6c7aad2 Author: Michael <lwhay...@gmail.com> Date: Tue Mar 7 07:31:52 2017 -0800 Merge branch 'master' into fuzzy commit df28903d2689e2d533b2a4879465d6b2749247e7 Merge: 131b48d 983dd18 Author: Michael <lwhay...@gmail.com> Date: Sun Mar 5 10:03:51 2017 -0800 Merge branch 'master' into fuzzy commit 131b48d5a82a59bd943d53d4ad4cea075a92910c Author: Michael <lwhay...@gmail.com> Date: Sun Mar 5 10:03:01 2017 -0800 Add a pre-compression before verification. commit 6a5f9f99f7319006895eef8bff7c652523ae4232 Author: Michael <lwhay...@gmail.com> Date: Sat Mar 4 11:23:40 2017 -0800 Slight change on sequences of basic tests-1.2.1 commit 4ae0b00f5c41d12a1b26ca70efbbf158b36c3859 Merge: a281d4f 88b5769 Author: Michael <lwhaym...@yahoo.com> Date: Sat Mar 4 10:02:42 2017 -0800 Merge branch 'master' into fuzzy commit a281d4fa2b654a52e16d4f371be3fb1d5525e252 Author: Michael <lwhaym...@yahoo.com> Date: Sat Mar 4 09:55:34 2017 -0800 Resolved the inconsistent issues derived from partial ordered tokens in RS similarity join. commit 13653bb2c41f97243c5c968dc7765d00aba6f757 Merge: 2a33659 7152182 Author: Michael <lwhaym...@yahoo.com> Date: Wed Mar 1 22:42:41 2017 -0800 Merge branch 'master' into fuzzy commit 2a336592b29a870b21ae64df94e937f84cc25aac Author: Michael <lwhaym...@yahoo.com> Date: Wed Mar 1 22:41:26 2017 -0800 Format Jaccard check. 
commit 6af8d066f865a385d167f2f2db54cbd3eeae8f00 Author: Michael <lwhaym...@yahoo.com> Date: Wed Mar 1 22:40:55 2017 -0800 add testcase for fj inconsistency commit bc27ab57172c208c7e13449da4776cecd4abd54f Merge: f37d11c 3c764a4 Author: Michael <lwhaym...@yahoo.com> Date: Tue Feb 28 06:55:52 2017 -0800 Merge branch 'master' into fuzzy commit f37d11c6eeb6b2e31c8c4f3a6a8d7afe2946e0b3 Author: Michael <lwhaym...@yahoo.com> Date: Sun Feb 26 08:41:50 2017 -0800 Change the nc.java.opts to 6144m. commit 80f21afdfb51bc4996fc8dd8be98896e8a113f4b Author: Michael <lwhaym...@yahoo.com> Date: Sat Feb 25 23:23:15 2017 -0800 Add datasource for the inconsistent issue. commit ec9a82908007e56be194ef2726932068cf60dc40 Merge: 3ade0fb e85902b Author: Michael <lwhaym...@yahoo.com> Date: Sat Feb 25 08:02:49 2017 -0800 Merge branch 'master' into fuzzy commit 3ade0fbbde8dd757f5aa413aaaff6ccd6986fa26 Author: Michael <lwhaym...@yahoo.com> Date: Sat Feb 25 07:51:29 2017 -0800 Add four categories of similarity join templates. commit f8aeec2123fdc7c5cf1cc091b8f1db8bf7c5e168 Author: Michael <lwhaym...@yahoo.com> Date: Fri Feb 24 07:18:27 2017 -0800 Change prefix-based fuzzy joins onto in-memory groupby/orderby. commit 18763328df2632e351e074ceb0e25c51877ae6ae Author: Michael <lwhaym...@yahoo.com> Date: Fri Feb 24 06:50:00 2017 -0800 Improve the memory configuration of ManagixExecutionIT. 
commit ecc657318faf1ccf189c115a87e06833b59131c1 Merge: b049f09 34f2384 Author: Michael <lwhaym...@yahoo.com> Date: Thu Feb 23 23:08:07 2017 -0800 Merge branch 'master' into fuzzy commit b049f09a4b5a454a47df399f19801fc7c8c148e1 Merge: 9084dde ea666c9 Author: Michael <lwhaym...@yahoo.com> Date: Thu Feb 23 09:19:44 2017 -0800 Merge branch 'master' into fuzzy commit 9084dded9e357494098c5886fce152c0a4c992ee Merge: c335b99 6fc1f7b Author: Michael <lwhaym...@yahoo.com> Date: Tue Feb 21 23:19:12 2017 -0800 Merge branch 'master' into fuzzy commit c335b99a43f5b224605f3a5db0b93c780b1a0352 Author: Michael <lwhaym...@yahoo.com> Date: Sat Feb 18 22:34:29 2017 -0800 Change the optplans w.r.t metavars in fuzzyjoinrule. commit a928bc902a0277e2290e078d76d4146e3474e8c4 Merge: 91fab7c 692b8a8 Author: Michael <lwhaym...@yahoo.com> Date: Sat Feb 18 22:31:37 2017 -0800 Merge branch 'master' into fuzzy commit 91fab7c64402835f28c8365475b0c281cb7ec5e6 Merge: 487a9c9 e48c24e Author: Michael <lwhaym...@yahoo.com> Date: Sat Feb 18 22:29:40 2017 -0800 Remove the dependency of FuzzyJoinRule on AQL metavars. 
commit 487a9c94a6b6370a56a162568a54189c8836e6f9 Merge: 07cfe47 e835d5e Author: Michael <lwhaym...@yahoo.com> Date: Wed Feb 15 22:10:44 2017 -0800 Merge branch 'master' of https://github.com/apache/asterixdb commit 07cfe47b252de66b599cfa909e27c7114750473d Merge: 2dee74f 3379669 Author: Michael <lwhaym...@yahoo.com> Date: Sun Feb 12 09:01:11 2017 -0800 Merge branch 'master' of https://github.com/apache/asterixdb commit 2dee74fc334fa97ef9bb4b292680234b94bc45c9 Merge: 19e0c22 3163461 Author: Michael <lwhaym...@yahoo.com> Date: Fri Feb 10 04:43:52 2017 -0800 Merge branch 'fuzzy' commit 31634612f0520ba15ba36a2385fb70c0c5a9b8d8 Merge: ef05c40 2343e1c Author: Michael <lwhaym...@yahoo.com> Date: Sat Feb 4 09:09:29 2017 -0800 Merge branch 'master' into fuzzy commit ef05c40b0955e5fda24ff634ce7a23b2f4cbb996 Merge: a3d4ef9 38553c0 Author: Michael <lwhaym...@yahoo.com> Date: Fri Feb 3 09:18:27 2017 -0800 Merge branch 'master' into fuzzy commit a3d4ef9da4b2f00b0ff490458a48688516cf7fd1 Merge: c3480d3 c7a8fa5 Author: Michael <lwhaym...@yahoo.com> Date: Tue Jan 31 09:08:28 2017 -0800 Merge branch 'master' into fuzzy commit c3480d33ba1df9e0fcc76546eca17b083a758587 Author: Michael <lwhaym...@yahoo.com> Date: Mon Jan 30 07:00:55 2017 -0800 Remove hashgroupby to save memory. commit 83126b2753a076ce480c7db0e25043753f4f645f Author: Michael <lwhaym...@yahoo.com> Date: Mon Jan 30 02:26:59 2017 -0800 Adjust the inmem size. 
commit 2b8933211e4fc1e2562399a2317e8f3aeb9fcc85 Merge: 09890ee 0f3bf37 Author: Michael <lwhaym...@yahoo.com> Date: Mon Jan 30 01:25:11 2017 -0800 Merge branch 'master' into fuzzy commit 09890ee304762855b9e8dfcd847069af7d11d4bc Merge: b2c1d1d 60e7f12 Author: Michael <lwhaym...@yahoo.com> Date: Fri Jan 27 23:58:35 2017 -0800 Merge branch 'master' into fuzzy commit b2c1d1d51d38e0f9761fc131cf241b97d1ba4332 Merge: 98b7fa0 9d30640 Author: Michael <lwhaym...@yahoo.com> Date: Thu Jan 26 07:20:57 2017 -0800 Merge branch 'master' into fuzzy commit 98b7fa078896f23260b98bc8fa710dc76e32e08f Author: Michael <lwhaym...@yahoo.com> Date: Wed Jan 25 07:33:52 2017 -0800 Revisit the improper variable name and comments. commit 5fc075977451011c7f27009b5834062e295b1ee4 Merge: 727343c e0c232d Author: Michael <lwhaym...@yahoo.com> Date: Wed Jan 25 07:10:31 2017 -0800 Merge branch 'master' into fuzzy commit 727343cecf1e926adac7e8b51ad4ad05419443fe Merge: 50678fe 6e6a80c Author: Michael <lwhaym...@yahoo.com> Date: Sun Jan 22 21:08:54 2017 -0800 Merge branch 'master' into fuzzy commit 50678fe585519609506fdaaaaf19095981ef5231 Author: Michael <lwhaym...@yahoo.com> Date: Sat Jan 21 02:44:53 2017 -0800 Another two formatter issues. commit ca4a6f4d1a1b2e31bf7392af546c47f2c79314d8 Author: Michael <lwhaym...@yahoo.com> Date: Sat Jan 21 02:05:24 2017 -0800 Fixed some comments. commit 0f79da88487faed5bc05dc11cb83d4fcd52c72e6 Author: Michael <lwhaym...@yahoo.com> Date: Fri Jan 20 11:07:12 2017 -0800 Change Fuzzyjoin rule onto firstDFS controller. commit 40e1b192834f0ae02b07919d7ad8f346881106c8 Merge: c10ab65 d5118b0 Author: Michael <lwhaym...@yahoo.com> Date: Fri Jan 20 10:38:27 2017 -0800 Merge branch 'master' into fuzzy commit c10ab658e538f1dffc190427cd18f7f9e1a06f73 Author: Michael <lwhaym...@yahoo.com> Date: Wed Jan 18 22:07:43 2017 -0800 Change the exception name. 
commit 23a7596d6d7a474b1b977e6cb59c71aaad3040e5 Merge: c88c1f1 7ff91d0 Author: Michael <lwhaym...@yahoo.com> Date: Wed Jan 18 22:04:39 2017 -0800 Merge branch 'master' into fuzzy commit c88c1f12becb9875dedb779f53be7c3323679e07 Author: Michael <lwhaym...@yahoo.com> Date: Tue Jan 17 22:42:21 2017 -0800 Keep the ngram of the current master. commit 65063c30b0a738999eb2eec89d91670e0df1094c Merge: bc895f6 908ae63 Author: Michael <lwhaym...@yahoo.com> Date: Tue Jan 17 22:34:18 2017 -0800 Merge branch 'master' into fuzzy commit bc895f62a46375ad57be3e1bbb68f1743b9d3dc5 Author: Michael <lwhaym...@yahoo.com> Date: Tue Jan 17 22:32:05 2017 -0800 Fix some Exception related issues. commit e90ec826e101a3f825babce04fa72b4d0ad7052f Author: Michael <lwhaym...@yahoo.com> Date: Mon Jan 16 20:53:45 2017 -0800 Revisied for some grammatical issues. commit c3c989b93503018dda9647e1575e465626315eea Merge: 4710c53 c8ea9d6 Author: Michael <lwhaym...@yahoo.com> Date: Mon Jan 16 19:12:23 2017 -0800 Merge branch 'master' into fuzzy commit 4710c53d7119500b2511235ed663b4f41247bc7e Author: Michael <lwhaym...@yahoo.com> Date: Sun Jan 15 22:05:35 2017 -0800 Revisited the function name. commit c80b6898408aaf1ad34c79acde6f138ccc1ca7b6 Author: Michael <lwhaym...@yahoo.com> Date: Sun Jan 15 22:01:36 2017 -0800 Abstract codes outside opPost. commit ac41d08cdcc860c5860c1858620eab000b9b44f9 Author: Michael <lwhaym...@yahoo.com> Date: Sun Jan 15 05:57:39 2017 -0800 Reviewed some grammatic details and vars names. commit 060e76bb27dacfcc119fd98ecb0d6e6761e5b157 Merge: ba7dbc6 66fbbd1 Author: Michael <lwhaym...@yahoo.com> Date: Sun Jan 15 05:17:11 2017 -0800 Merge branch 'master' into fuzzy commit ba7dbc6db0f2ff4d1e01e78ce623717e271c15a0 Author: Michael <lwhaym...@yahoo.com> Date: Thu Jan 12 21:41:16 2017 -0800 Formatted the variable definitions. 
commit 3e48e356573394f94911dd34d43a7431e6d6674a Merge: 729ebe1 74271c0 Author: Michael <lwhaym...@yahoo.com> Date: Thu Jan 12 21:32:50 2017 -0800 Merge branch 'master' into fuzzy commit 729ebe1693b458fe2917535b6fef18d1fb97f458 Merge: c3c47e7 c49405a Author: Michael <lwhaym...@yahoo.com> Date: Fri Jan 6 10:45:07 2017 -0800 Merge branch 'master' into fuzzy commit c3c47e72855ed573e1602829a7804573f48f515b Merge: 2d5df70 0aeebae Author: Michael <lwhaym...@yahoo.com> Date: Thu Jan 5 22:49:08 2017 -0800 Merge branch 'master' into fuzzy commit 2d5df70420ad2926f5719505dc81814416b8d5d5 Merge: 9935670 8a29c5f Author: Michael <lwhaym...@yahoo.com> Date: Wed Jan 4 21:44:22 2017 -0800 Merge branch 'master' into fuzzy commit 993567029a6c79e95479b1b65a67195a41c5e3f7 Merge: a5365a7 0294b31 Author: Michael <lwhaym...@yahoo.com> Date: Sat Dec 24 05:58:29 2016 -0800 Merge branch 'master' into fuzzy commit a5365a7130239efb842b582b5c451df22bc7107d Merge: 79cb453 eb199d3 Author: Michael <lwhaym...@yahoo.com> Date: Thu Dec 22 05:15:58 2016 -0800 Merge branch 'master' into fuzzy commit 79cb45331c387e7691ad69e782a81c560fd5929c Merge: 739d7e2 aa00bf6 Author: Michael <lwhaym...@yahoo.com> Date: Mon Dec 19 09:24:29 2016 -0800 Merge branch 'master' into fuzzy commit 739d7e2972bdd251e9b32d6599b5fed02acd2954 Merge: a82116d bc3d1b0 Author: Michael <lwhaym...@yahoo.com> Date: Fri Dec 16 01:15:24 2016 -0800 Merge branch 'master' into fuzzy commit a82116d1e7dd300af726c6fd9df6b9018fae4ef4 Merge: dfc2009 9267168 Author: Michael <lwhaym...@yahoo.com> Date: Wed Dec 14 05:09:19 2016 -0800 Merge branch 'master' into fuzzy commit dfc20098be8adabdfa3cba9346a13776539db95e Merge: 90e9a29 44cef24 Author: Michael <lwhaym...@yahoo.com> Date: Sat Dec 10 23:51:52 2016 -0800 Merge branch 'master' into fuzzy commit 90e9a291efd20b4223b8ef68ba700bc26ceecb50 Merge: 1ec33c6 fce8e29 Author: Michael <lwhaym...@yahoo.com> Date: Fri Dec 9 11:06:02 2016 -0800 Merge branch 'master' into fuzzy commit 
1ec33c6ce1a229f7de1b2b9238303262185bc7ef Merge: b3f4e70 d810df7 Author: Michael <lwhaym...@yahoo.com> Date: Fri Dec 9 04:59:55 2016 -0800 Merge branch 'master' into fuzzy commit b3f4e709f62a15c29c5237f36a484e53d48f534a Merge: 4341aa3 1170755 Author: Michael <lwhaym...@yahoo.com> Date: Tue Dec 6 21:06:38 2016 -0800 Merge branch 'master' into fuzzy commit 4341aa3cdef7efbc3921440b7229d527ed815ec0 Merge: e274df8 11db8e3 Author: Michael <lwhaym...@yahoo.com> Date: Fri Dec 2 23:28:02 2016 -0800 Merge branch 'master' into fuzzy commit e274df8a4eb0bbae94a5b4f230811f2e26fb3846 Author: Michael <lwhaym...@yahoo.com> Date: Fri Dec 2 23:25:43 2016 -0800 Add function for step1-2. commit 0a2907561882e93d307cae97b2bbec24dc48312b Author: Michael <lwhaym...@yahoo.com> Date: Fri Dec 2 23:14:54 2016 -0800 Polish the steps3-4. commit 7838e24fd3643391235d8cd189c676e54c7e0732 Author: Michael <lwhaym...@yahoo.com> Date: Fri Dec 2 22:58:45 2016 -0800 Remove the incrementedCounter temp var in fuzzyjoinrule. commit 5f540a7d3c7b8324052f288ea563b7381d1b7211 Merge: 3cc518d 2772f12 Author: Michael <lwhaym...@yahoo.com> Date: Thu Dec 1 21:21:04 2016 -0800 Merge branch 'master' into fuzzy commit 3cc518d8d467822328069433fc82a4a09e5aafb6 Merge: 9738fa1 4c958b2 Author: Michael <lwhaym...@yahoo.com> Date: Wed Nov 30 22:09:32 2016 -0800 Merge branch 'master' into fuzzy commit 9738fa1661b297540b73976b4184d56322e6869b Merge: 482b961 8a742fd Author: Michael <lwhaym...@yahoo.com> Date: Wed Nov 30 06:36:47 2016 -0800 Merge branch 'master' into fuzzy commit 482b961a65dd5dc986ef58ec62d8e264f56594dc Merge: 7777c4b 2da225b Author: Michael <lwhaym...@yahoo.com> Date: Wed Nov 30 06:33:15 2016 -0800 Merge branch 'master' into fuzzy commit 7777c4b1c61612221991d441b75496a24088b875 Merge: 7a6e790 3584bdd Author: Michael <lwhaym...@yahoo.com> Date: Sat Nov 26 23:48:35 2016 -0800 Merge branch 'master' into fuzzy commit 7a6e7902ce0f14839ce2563de245ed1e74d986fa Merge: 82c340e 12a502b Author: Michael <lwhaym...@yahoo.com> 
Date: Sat Nov 26 06:10:42 2016 -0800 Merge branch 'master' into fuzzy commit 82c340e09a8cf62fce63687cafcb677b5eb8538c Author: Michael <lwhaym...@yahoo.com> Date: Thu Nov 24 04:37:15 2016 -0800 Remove the redundant import. commit 378e8caaa8e62e7d8b6244e4bc5e25fc852e4314 Merge: 20d3e82 42620f6 Author: Michael <lwhaym...@yahoo.com> Date: Wed Nov 23 23:34:05 2016 -0800 Merge branch 'master' into fuzzy commit 20d3e82dd86d2f2983b30f8afadb0ae948dcda9f Merge: af50a31 42467cb Author: Michael <lwhaym...@yahoo.com> Date: Wed Nov 16 23:06:13 2016 -0800 Merge branch 'master' into fuzzy commit af50a314014f25486c9b520de17610b63a51c794 Author: Michael <lwhaym...@yahoo.com> Date: Wed Nov 16 09:13:13 2016 -0800 VarReference of TPCH12 changed under fuzzyjoin rule ingestion. commit a6d6c1752f7ebc621ee8382e9973ef97b4c232bc Merge: 2934d2f d7b3ddf Author: Michael <lwhaym...@yahoo.com> Date: Wed Nov 16 06:58:54 2016 -0800 Merge branch 'master' into fuzzy commit 2934d2fde22c53f5577cf4c68af0afee7edafaaa Merge: 1639faf 35a376a Author: Michael <lwhaym...@yahoo.com> Date: Fri Nov 11 19:33:04 2016 -0800 Merge branch 'master' into fuzzy commit 1639faf6a1db5086a5269003f3ea85ed5e46fec4 Merge: a0a279c 38845d5 Author: Michael <lwhaym...@yahoo.com> Date: Wed Nov 9 01:44:51 2016 -0800 Merge branch 'master' into fuzzy commit a0a279cbd073c2f41b75d4a644e1e3e8f9e2eee7 Merge: c6393ab 314c0df Author: Michael <lwhaym...@yahoo.com> Date: Sun Nov 6 01:14:41 2016 -0700 Merge branch 'master' into fuzzy commit c6393abfb25f2281d2eb59022e6d510ea9327e03 Merge: 9815c7e d1f6121 Author: Michael <lwhaym...@yahoo.com> Date: Thu Nov 3 02:24:06 2016 -0700 Merge branch 'master' into fuzzy commit 9815c7e187a92c82985c8fffbd063cd9e8bb85a3 Merge: f1fac3d c02cf81 Author: Michael <lwhaym...@yahoo.com> Date: Wed Nov 2 11:25:04 2016 -0700 Merge branch 'master' into fuzzy commit f1fac3d6007164194abc36bea3a480a1c0636712 Author: Michael <lwhaym...@yahoo.com> Date: Tue Nov 1 23:02:01 2016 -0700 Change the mismatching type exception of 
fj. commit 4d8abbc1777601a25beeed7caa48c59a6c2f0e54 Merge: 5b8d29e e2e3ab5 Author: Michael <lwhaym...@yahoo.com> Date: Tue Nov 1 22:35:18 2016 -0700 Merge branch 'master' into fuzzy commit 5b8d29e08c1a06887957496419f63da5718875f4 Merge: fcf7d22 7b14477 Author: Michael <lwhaym...@yahoo.com> Date: Mon Oct 31 21:21:54 2016 -0700 Merge branch 'master' into fuzzy commit fcf7d2215e13d6bb4bb504c5938533b21daed8be Merge: 35cded8 9fbff01 Author: Michael <lwhaym...@yahoo.com> Date: Sun Oct 30 22:01:17 2016 -0700 Merge branch 'master' into fuzzy commit 35cded8833dab3d38112269d62d3e4af37ba481b Merge: 676adc6 af85e25 Author: Michael <lwhaym...@yahoo.com> Date: Fri Oct 28 22:38:24 2016 -0700 Merge branch 'master' into fuzzy commit 676adc6b8cd98da09f1fe92b66c9f4c8fa042948 Merge: 513d52c fec04f0 Author: Michael <lwhaym...@yahoo.com> Date: Fri Oct 28 09:13:13 2016 -0700 Merge branch 'master' into fuzzy commit 513d52c4d08cadde19cab52863d6ddc55bef878b Merge: f39bc44 109e485 Author: Michael <lwhaym...@yahoo.com> Date: Wed Oct 26 01:40:36 2016 -0700 Merge branch 'master' into fuzzy commit f39bc44d3741cd74f6849f14cf23d5371d9d8d34 Author: Michael <lwhaym...@yahoo.com> Date: Sun Oct 23 11:52:12 2016 -0700 Remove the redundant expression computation in prefix-based fuzzyjoin. commit e3e45d5db11f5d73715daf5cefdaec2a4e8a137c Author: Michael <lwhaym...@yahoo.com> Date: Sun Oct 23 09:04:58 2016 -0700 A slight change. 
commit 68548b0e63a8d1087914e6597ca3b25a4bd73578 Merge: 26f03bf 452c5d0 Author: Michael <lwhaym...@yahoo.com> Date: Sun Oct 23 01:07:51 2016 -0700 Merge branch 'master' into fuzzy commit 26f03bf870b8b6f6d69d8379e29f96990810f1e0 Merge: 1c0da45 e17454a Author: Michael <lwhaym...@yahoo.com> Date: Tue Oct 18 05:33:59 2016 -0700 Merge branch 'master' into fuzzy commit 1c0da457751332b7a2dd73f66f49f79f3efa7121 Merge: c9ec9b5 9ddf5e0 Author: Michael <lwhaym...@yahoo.com> Date: Sat Oct 15 10:27:17 2016 -0700 Merge branch 'master' into fuzzy commit c9ec9b53ad880707e8af0e93a3805c636377b924 Merge: 7b59665 6f1c559 Author: Michael <lwhaym...@yahoo.com> Date: Wed Oct 12 08:37:25 2016 -0700 Merge branch 'master' into fuzzy commit 7b59665b8ef0cd7d3120b7103e8d34d0fb144b64 Merge: b0aab9a db1c115 Author: Michael <lwhaym...@yahoo.com> Date: Tue Oct 11 02:17:38 2016 -0700 Merge branch 'master' into fuzzy commit b0aab9a4a2a730b4789864c014cd5c340459bdc8 Author: Michael <lwhaym...@yahoo.com> Date: Sun Oct 9 22:43:09 2016 -0700 Add the simplest nested fuzzyjoin testcase. commit 1e4acd4dc83dea8f21de062f1b16464f581dbd81 Merge: 653971f 8fa8b7a Author: Michael <lwhaym...@yahoo.com> Date: Sat Oct 8 06:29:15 2016 -0700 Merge branch 'master' into fuzzy commit 653971f8bba9763162f3d6488a48b7ec8a5e03ef Author: Michael <lwhaym...@yahoo.com> Date: Sat Oct 8 06:26:09 2016 -0700 Inlined the flattening rules into fuzzycollection commit d8b37358b75765ef41344ec054409c0b15b212fc Author: Michael <lwhaym...@yahoo.com> Date: Thu Oct 6 10:44:09 2016 -0700 Add a simple fj testcase. 
commit a54472cda375fd0689dd87d0efdbdda05abec05e Merge: cdd58fe ecba52e Author: Michael <lwhaym...@yahoo.com> Date: Thu Oct 6 06:17:38 2016 -0700 Merge branch 'master' into fuzzy commit cdd58fead662fa615664bb3f6287be3802ae6602 Merge: 6098ca8 d97fa75 Author: Michael <lwhaym...@yahoo.com> Date: Wed Oct 5 09:45:45 2016 -0700 Merge branch 'master' into fuzzy commit 6098ca84531dad7cf5068428ea90e305bad41d70 Merge: c98e0dc 6f7c531 Author: Michael <lwhaym...@yahoo.com> Date: Sat Oct 1 07:20:16 2016 -0700 Merge branch 'master' into fuzzy commit c98e0dc5efd01d7580c65a9c9d14d705854f7112 Merge: f86f996 2685b60 Author: Michael <lwhaym...@yahoo.com> Date: Fri Sep 30 07:29:00 2016 -0700 Merge branch 'master' into fuzzy commit f86f9963f339a1ca01c4c3a297705ef345d9ff88 Author: Michael <lwhaym...@yahoo.com> Date: Fri Sep 30 07:27:48 2016 -0700 Polished the comments of aqls commit 33023078a08276e1cbee11902e59a8c4e4b69c52 Author: Michael <lwhaym...@yahoo.com> Date: Wed Sep 28 07:38:39 2016 -0700 Add comments for the Isomorphic and the testCases. commit 43b8d16782788a6cbc82a59fcab8f6a0ea65a0dc Author: Michael <lwhaym...@yahoo.com> Date: Wed Sep 28 06:22:15 2016 -0700 Change the SPLIT onto REPLICATE in the plans. 
commit 67dc7d42f78d97042c7f8886353b37fc8ca7d349 Merge: 74e541c a79db2a Author: Michael <lwhaym...@yahoo.com> Date: Wed Sep 28 02:33:00 2016 -0700 Merge branch 'master' into fuzzy Conflicts: asterixdb/asterix-app/src/test/resources/optimizerts/results/inverted-index-join/leftouterjoin-probe-pidx-with-join-jaccard-check-idx_01.plan asterixdb/asterix-app/src/test/resources/optimizerts/results/inverted-index-join/word-jaccard-check-after-btree-access.plan asterixdb/asterix-app/src/test/resources/optimizerts/results/nested-index/inverted-index-join/leftouterjoin-probe-pidx-with-join-jaccard-check-idx_01.plan asterixdb/asterix-app/src/test/resources/optimizerts/results/nested-index/inverted-index-join/word-jaccard-check-after-btree-access.plan asterixdb/asterix-app/src/test/resources/optimizerts/results/nested-open-index/inverted-index-join/word-jaccard-check-after-btree-access.plan asterixdb/asterix-app/src/test/resources/optimizerts/results/open-index-enforced/inverted-index-join/word-jaccard-check-after-btree-access.plan commit 74e541c92e68b8f6c012e49c9c1ec5f5f77a2d11 Author: Michael <lwhaym...@yahoo.com> Date: Wed Sep 28 02:27:46 2016 -0700 Remove the grammatic error. commit 84493ddfdad2afbedb2a186bd1f5127b4474a52c Author: Michael <lwhaym...@yahoo.com> Date: Sun Sep 25 08:20:08 2016 -0700 Remove the branch counter. commit be57431c35783d8d8f7e1d4de1932d36d1e101e8 Merge: f2e5013 0ff3d09 Author: Michael <lwhaym...@yahoo.com> Date: Sun Sep 25 07:44:00 2016 -0700 Merge branch 'master' into fuzzy Conflicts: asterixdb/asterix-app/src/test/resources/optimizerts/results/inverted-index-join/issue741.plan commit f2e50135a8649f76e15acab2f4706458d583e7e9 Author: Michael <lwhaym...@yahoo.com> Date: Fri Sep 23 03:56:21 2016 -0700 Change the optimized plan results according to the select-related improvement of master. 
commit 1d9cd36cf5563b5c38aa798c740a8380269e99c7 Merge: afdd936 473fc18 Author: Michael <lwhaym...@yahoo.com> Date: Thu Sep 22 22:19:26 2016 -0700 Merge branch 'master' into fuzzy commit afdd9364eb979518767ae1f965841ea05e543eb0 Merge: f829f5a e6bb4aa Author: Michael <lwhaym...@yahoo.com> Date: Tue Sep 20 05:53:19 2016 -0700 Merge branch 'master' into fuzzy commit f829f5a96f9f60cccbd632a61b6b6ec149dec183 Merge: 547b3f2 4b30d79 Author: Michael <lwhaym...@yahoo.com> Date: Mon Sep 19 09:58:17 2016 -0700 Merge branch 'master' into fuzzy commit 547b3f2945ea0c32a5a7c8484e082abdceacc2c1 Merge: 24ae6b8 be706d5 Author: Michael <lwhaym...@yahoo.com> Date: Thu Sep 15 01:58:58 2016 -0700 Merge branch 'master' into fuzzy commit 24ae6b8b9ac993ec43edf353c40093a7735fa75f Merge: f8b71bf dd36605 Author: Michael <lwhaym...@yahoo.com> Date: Mon Sep 12 01:11:05 2016 -0700 Merge branch 'master' into fuzzy commit f8b71bf08f499e0db78929c540459c0c808ddbf7 Author: Michael <lwhaym...@yahoo.com> Date: Sun Sep 11 10:37:49 2016 -0700 Remove the SQs and add verification on fuzzyjoin plan. commit acf38556029bc28bd559fa28af59d463ec35c552 Merge: 4e0fb96 7477a58 Author: Michael <lwhaym...@yahoo.com> Date: Sun Sep 11 01:28:16 2016 -0700 Merge branch 'master' into fuzzy Conflicts: asterixdb/asterix-app/src/test/resources/optimizerts/results/inverted-index-join/issue741.plan commit 4e0fb96f8fcf1a51f59fc1cf25ea88ed88ced41f Author: Michael <lwhaym...@yahoo.com> Date: Sun Sep 11 01:25:01 2016 -0700 Add the multiway fuzzyjoin testCases in the optimizer. commit da28fe841b9cc6c3cf00caace0fa91e917198ce8 Merge: dee3107 b4a9a89 Author: Michael <lwhaym...@yahoo.com> Date: Sat Sep 10 06:42:22 2016 -0700 Merge branch 'master' into fuzzy commit dee31076fad7f53593642b292457387bc76d69d2 Author: Michael <lwhaym...@yahoo.com> Date: Sat Sep 10 06:37:51 2016 -0700 Add Optimizer testCases for multiway fuzzyjoins. 
commit 568f0f1806418666f8b5abdcf67af2c8d1f9c740 Author: Michael <lwhaym...@yahoo.com> Date: Sat Sep 10 06:36:26 2016 -0700 Replace the ComplexInferenceRule onto NestedSubplanToJoinRule. commit 6f68c87cc0e60338ef3d04f7598edf276500b2b7 Author: Michael <lwhaym...@yahoo.com> Date: Thu Sep 8 21:45:50 2016 -0700 Remove the SQs and inproper comments. commit fa6980acf7398cba1f1dfda5e63dcbc2a5bc0b8d Merge: c589e79 f902d66 Author: Michael <lwhaym...@yahoo.com> Date: Thu Sep 8 21:13:10 2016 -0700 Merge branch 'master' into fuzzy commit c589e79ecaea8c0b2bc9efb9d402e53c9f5400e8 Author: Michael <lwhaym...@yahoo.com> Date: Thu Sep 8 21:12:34 2016 -0700 Removed the SQs. commit 6457af804cbe532b567da8ea8e6dfe57b5705a9e Merge: 38a11dd 78c6115 Author: Michael <lwhaym...@yahoo.com> Date: Thu Sep 8 18:57:59 2016 -0700 Merge branch 'master' into fuzzy commit 38a11dd1cb6fb9ad3382d33cb8917cb6a2a35820 Merge: 2af458e c89d668 Author: Michael <lwhaym...@yahoo.com> Date: Thu Sep 8 18:51:32 2016 -0700 Merge branch 'master' into fuzzy and remove the binaryHomogeneous method. Conflicts: asterixdb/asterix-algebra/src/main/java/org/apache/asterix/optimizer/rules/subplan/InlineSubplanInputForNestedTupleSourceRule.java commit 2af458eca76b7a7fe523598f63463252d1adb7f7 Author: Michael <lwhaym...@yahoo.com> Date: Fri Sep 2 08:12:48 2016 -0700 Add comments for the reviewers. 
commit b2d826a8e941b6f0747dc85c9a71b4bf0c86ba3a Merge: c82d0b0 a9ac670 Author: Michael <lwhaym...@yahoo.com> Date: Thu Sep 1 20:56:57 2016 -0700 Merge branch 'master' into fuzzy commit c82d0b0b2366e99fffde93896e2a49b32c3ef7aa Merge: 871db18 52a9d99 Author: Michael <lwhaym...@yahoo.com> Date: Fri Aug 26 02:26:21 2016 -0700 Merge branch 'master' into fuzzy Conflicts: asterixdb/asterix-app/src/main/java/org/apache/asterix/api/common/APIFramework.java commit 871db186ac1435283a91070877c47a9b298c7450 Merge: 0408d57 7a180bc Author: Michael <lwhaym...@yahoo.com> Date: Fri Aug 19 01:25:45 2016 -0700 Merge branch 'master' into fuzzy commit 0408d575fafa3c1f07b4959c80c0dc9abe9567b5 Author: Michael <lwhaym...@yahoo.com> Date: Fri Aug 12 11:34:21 2016 -0700 Initial fuzzy join framework with multiple split and temporary ngram fix. Change-Id: If5cbb4a133e7d62f9c9aaa05852d3b20c9aa50c3 --- M asterixdb/asterix-algebra/src/main/java/org/apache/asterix/optimizer/rules/subplan/InlineSubplanInputForNestedTupleSourceRule.java M asterixdb/asterix-app/src/test/resources/optimizerts/results/ASTERIXDB-2402.plan M asterixdb/asterix-app/src/test/resources/optimizerts/results/split-materialization-above-join.plan M asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_1_1/basic-1_1_1.3.query.aql A asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_1_1/basic-1_1_1.4.query.aql A asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_2_1/basic-1_2_1.10.query.aql M asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_2_1/basic-1_2_1.3.query.aql A asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_2_1/basic-1_2_1.8.query.aql A asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_2_1/basic-1_2_1.9.query.aql M asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_1_1/basic-1_1_1.1.adm A 
asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_1_1/basic-1_1_1.3.adm A asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_1_1/basic-1_1_1.4.adm A asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_2_1/basic-1_2_1.10.adm M asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_2_1/basic-1_2_1.3.adm A asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_2_1/basic-1_2_1.8.adm A asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_2_1/basic-1_2_1.9.adm M asterixdb/asterix-server/src/test/resources/NCServiceExecutionIT/cc.conf 17 files changed, 301 insertions(+), 73 deletions(-) git pull ssh://asterix-gerrit.ics.uci.edu:29418/asterixdb refs/changes/08/3008/1 diff --git a/asterixdb/asterix-algebra/src/main/java/org/apache/asterix/optimizer/rules/subplan/InlineSubplanInputForNestedTupleSourceRule.java b/asterixdb/asterix-algebra/src/main/java/org/apache/asterix/optimizer/rules/subplan/InlineSubplanInputForNestedTupleSourceRule.java index 62f89f1..1c5865f 100644 --- a/asterixdb/asterix-algebra/src/main/java/org/apache/asterix/optimizer/rules/subplan/InlineSubplanInputForNestedTupleSourceRule.java +++ b/asterixdb/asterix-algebra/src/main/java/org/apache/asterix/optimizer/rules/subplan/InlineSubplanInputForNestedTupleSourceRule.java @@ -265,20 +265,13 @@ */ public class InlineSubplanInputForNestedTupleSourceRule implements IAlgebraicRewriteRule { - // To make sure the rule only runs once. 
- private boolean hasRun = false; - @Override public boolean rewritePre(Mutable<ILogicalOperator> opRef, IOptimizationContext context) throws AlgebricksException { - if (hasRun) { - return false; - } if (context.checkIfInDontApplySet(this, opRef.getValue())) { return false; } Pair<Boolean, LinkedHashMap<LogicalVariable, LogicalVariable>> result = rewriteSubplanOperator(opRef, context); - hasRun = true; return result.first; } diff --git a/asterixdb/asterix-app/src/test/resources/optimizerts/results/ASTERIXDB-2402.plan b/asterixdb/asterix-app/src/test/resources/optimizerts/results/ASTERIXDB-2402.plan index 18ec417..8818d06 100644 --- a/asterixdb/asterix-app/src/test/resources/optimizerts/results/ASTERIXDB-2402.plan +++ b/asterixdb/asterix-app/src/test/resources/optimizerts/results/ASTERIXDB-2402.plan @@ -48,17 +48,17 @@ -- HASH_PARTITION_EXCHANGE [$$222] |PARTITIONED| -- STREAM_PROJECT |PARTITIONED| -- ONE_TO_ONE_EXCHANGE |PARTITIONED| - -- HYBRID_HASH_JOIN [$$268][$$191] |PARTITIONED| - -- HASH_PARTITION_EXCHANGE [$$268] |PARTITIONED| + -- HYBRID_HASH_JOIN [$$273][$$191] |PARTITIONED| + -- HASH_PARTITION_EXCHANGE [$$273] |PARTITIONED| -- ASSIGN |PARTITIONED| -- STREAM_PROJECT |PARTITIONED| -- UNNEST |PARTITIONED| -- STREAM_PROJECT |PARTITIONED| -- ONE_TO_ONE_EXCHANGE |PARTITIONED| - -- PRE_CLUSTERED_GROUP_BY[$$276] |PARTITIONED| + -- PRE_CLUSTERED_GROUP_BY[$$281] |PARTITIONED| { -- AGGREGATE |LOCAL| - -- MICRO_PRE_CLUSTERED_GROUP_BY[$$278, $$280] |LOCAL| + -- MICRO_PRE_CLUSTERED_GROUP_BY[$$283, $$285] |LOCAL| { -- AGGREGATE |LOCAL| -- STREAM_SELECT |LOCAL| @@ -68,8 +68,8 @@ -- NESTED_TUPLE_SOURCE |LOCAL| } -- ONE_TO_ONE_EXCHANGE |PARTITIONED| - -- STABLE_SORT [$$276(ASC), $$278(ASC), $$280(ASC)] |PARTITIONED| - -- HASH_PARTITION_EXCHANGE [$$276] |PARTITIONED| + -- STABLE_SORT [$$281(ASC), $$283(ASC), $$285(ASC)] |PARTITIONED| + -- HASH_PARTITION_EXCHANGE [$$281] |PARTITIONED| -- UNION_ALL |PARTITIONED| -- ONE_TO_ONE_EXCHANGE |PARTITIONED| -- STREAM_PROJECT 
|PARTITIONED| @@ -94,7 +94,7 @@ -- ONE_TO_ONE_EXCHANGE |PARTITIONED| -- BTREE_SEARCH |PARTITIONED| -- ONE_TO_ONE_EXCHANGE |PARTITIONED| - -- STABLE_SORT [$$290(ASC)] |PARTITIONED| + -- STABLE_SORT [$$295(ASC)] |PARTITIONED| -- ONE_TO_ONE_EXCHANGE |PARTITIONED| -- STREAM_PROJECT |PARTITIONED| -- ONE_TO_ONE_EXCHANGE |PARTITIONED| @@ -117,7 +117,7 @@ -- ONE_TO_ONE_EXCHANGE |PARTITIONED| -- BTREE_SEARCH |PARTITIONED| -- ONE_TO_ONE_EXCHANGE |PARTITIONED| - -- STABLE_SORT [$$229(ASC)] |PARTITIONED| + -- STABLE_SORT [$$234(ASC)] |PARTITIONED| -- ONE_TO_ONE_EXCHANGE |PARTITIONED| -- STREAM_PROJECT |PARTITIONED| -- ONE_TO_ONE_EXCHANGE |PARTITIONED| @@ -145,7 +145,7 @@ -- ONE_TO_ONE_EXCHANGE |PARTITIONED| -- BTREE_SEARCH |PARTITIONED| -- ONE_TO_ONE_EXCHANGE |PARTITIONED| - -- STABLE_SORT [$$290(ASC)] |PARTITIONED| + -- STABLE_SORT [$$295(ASC)] |PARTITIONED| -- ONE_TO_ONE_EXCHANGE |PARTITIONED| -- STREAM_PROJECT |PARTITIONED| -- ONE_TO_ONE_EXCHANGE |PARTITIONED| @@ -168,7 +168,7 @@ -- ONE_TO_ONE_EXCHANGE |PARTITIONED| -- BTREE_SEARCH |PARTITIONED| -- ONE_TO_ONE_EXCHANGE |PARTITIONED| - -- STABLE_SORT [$$229(ASC)] |PARTITIONED| + -- STABLE_SORT [$$234(ASC)] |PARTITIONED| -- ONE_TO_ONE_EXCHANGE |PARTITIONED| -- STREAM_PROJECT |PARTITIONED| -- ONE_TO_ONE_EXCHANGE |PARTITIONED| @@ -194,4 +194,4 @@ -- ONE_TO_ONE_EXCHANGE |PARTITIONED| -- DATASOURCE_SCAN |PARTITIONED| -- ONE_TO_ONE_EXCHANGE |PARTITIONED| - -- EMPTY_TUPLE_SOURCE |PARTITIONED| \ No newline at end of file + -- EMPTY_TUPLE_SOURCE |PARTITIONED| diff --git a/asterixdb/asterix-app/src/test/resources/optimizerts/results/split-materialization-above-join.plan b/asterixdb/asterix-app/src/test/resources/optimizerts/results/split-materialization-above-join.plan index a81a142..ad71134 100644 --- a/asterixdb/asterix-app/src/test/resources/optimizerts/results/split-materialization-above-join.plan +++ b/asterixdb/asterix-app/src/test/resources/optimizerts/results/split-materialization-above-join.plan @@ -157,4 +157,4 @@ -- 
ONE_TO_ONE_EXCHANGE |PARTITIONED| -- DATASOURCE_SCAN |PARTITIONED| -- ONE_TO_ONE_EXCHANGE |PARTITIONED| - -- EMPTY_TUPLE_SOURCE |PARTITIONED| + -- EMPTY_TUPLE_SOURCE |PARTITIONED| \ No newline at end of file diff --git a/asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_1_1/basic-1_1_1.3.query.aql b/asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_1_1/basic-1_1_1.3.query.aql index c00681b..0395100 100644 --- a/asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_1_1/basic-1_1_1.3.query.aql +++ b/asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_1_1/basic-1_1_1.3.query.aql @@ -20,42 +20,35 @@ set import-private-functions 'true' -let $hash := ( - for $r in dataset left - let $c := ( - for $t in counthashed-word-tokens($r.authors) - order by $t - distinct by $t - return $t - ) - order by $r.id - return {"id": $r.id, "authors": $r.authors, "nondup": $c} +let $r := "Tony Van Gestel Bart Baesens Johan A. K. 
Suykens Dirk Van den Poel Dirk-Emma Baestaens Marleen Willekens" +let $t := ( + for $token in word-tokens($r) + order by $token + distinct by $token + return $token ) - -let $word := ( - for $r in dataset left - let $c := ( - for $t in word-tokens($r.authors) - order by $t - distinct by $t - return $t - ) - order by $r.id - return {"id": $r.id, "authors": $r.authors, "nondup": $c} +let $h := ( + for $token in hashed-word-tokens($r) + order by $token + distinct by $token + return $token ) - -for $s in $hash -for $t in $word -where $s.id = $t.id and count($s.nondup) != count($t.nondup) -order by $s.authors -return { - "authors": $s.authors, - "hdistinct": $s.nondup, - "hcount": count($s.nondup), - "hash": counthashed-word-tokens($s.authors), - "vhcount": count(counthashed-word-tokens($s.authors)), - "wdistinct": $t.nondup, - "wcount": count($t.nondup), - "word": word-tokens($t.authors), - "vwcount": count(word-tokens($t.authors)) - } \ No newline at end of file +let $c := ( + for $token in counthashed-word-tokens($r) + order by $token + distinct by $token + return $token +) +return {"raw string" : $r, + "word-tokens" : word-tokens($r), + "word-tokens-len" : count(word-tokens($r)), + "hashed-word-tokens" : hashed-word-tokens($r), + "hashed-word-tokens-len" : count(hashed-word-tokens($r)), + "counthashed-word-tokens" : counthashed-word-tokens($r), + "counthashed-word-tokens-len" : count(counthashed-word-tokens($r)), + "pre-word-tokens" : $t, + "pre-word-tokens-len" : count($t), + "pre-hashed-word-tokens" : $h, + "pre-hashed-word-tokens-len" : count($h), + "pre-counthashed-word-tokens" : $c, + "pre-counthashed-word-tokens-len" : count($c)} diff --git a/asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_1_1/basic-1_1_1.4.query.aql b/asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_1_1/basic-1_1_1.4.query.aql new file mode 100644 index 0000000..c00681b --- /dev/null +++ 
b/asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_1_1/basic-1_1_1.4.query.aql @@ -0,0 +1,61 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ +use dataverse fuzzyjoin_basic; + +set import-private-functions 'true' + +let $hash := ( + for $r in dataset left + let $c := ( + for $t in counthashed-word-tokens($r.authors) + order by $t + distinct by $t + return $t + ) + order by $r.id + return {"id": $r.id, "authors": $r.authors, "nondup": $c} +) + +let $word := ( + for $r in dataset left + let $c := ( + for $t in word-tokens($r.authors) + order by $t + distinct by $t + return $t + ) + order by $r.id + return {"id": $r.id, "authors": $r.authors, "nondup": $c} +) + +for $s in $hash +for $t in $word +where $s.id = $t.id and count($s.nondup) != count($t.nondup) +order by $s.authors +return { + "authors": $s.authors, + "hdistinct": $s.nondup, + "hcount": count($s.nondup), + "hash": counthashed-word-tokens($s.authors), + "vhcount": count(counthashed-word-tokens($s.authors)), + "wdistinct": $t.nondup, + "wcount": count($t.nondup), + "word": word-tokens($t.authors), + "vwcount": count(word-tokens($t.authors)) + } \ No newline at end of file diff --git 
a/asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_2_1/basic-1_2_1.10.query.aql b/asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_2_1/basic-1_2_1.10.query.aql new file mode 100644 index 0000000..af8844f --- /dev/null +++ b/asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_2_1/basic-1_2_1.10.query.aql @@ -0,0 +1,35 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. 
+ */ +use dataverse fuzzyjoin_basic; + +set import-private-functions 'true' + +let $left := [1, 5, 6, 7] +let $right := [4, 5, 6] +let $leftnull := [null, null, 5, 6, 7] +let $rightnull := [4, 5, 6] +let $nullstring := [null, null, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10] + +let $prefix1 := subset-collection($nullstring, 0, prefix-len-jaccard(len($nullstring), 0.1f)) +let $prefix4 := subset-collection($nullstring, 0, prefix-len-jaccard(len($nullstring), 0.4f)) + +for $s in $prefix4 +for $r in $prefix1 +where $s = $r +return $s \ No newline at end of file diff --git a/asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_2_1/basic-1_2_1.3.query.aql b/asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_2_1/basic-1_2_1.3.query.aql index 5d9ab27..c7a63b6 100644 --- a/asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_2_1/basic-1_2_1.3.query.aql +++ b/asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_2_1/basic-1_2_1.3.query.aql @@ -120,4 +120,4 @@ let $cleanup := [$clearnull, $nullstring] return [$prefix, $sim1, $sim2, $sim3, $sim4, $sim5, $bound, $trybound, $checkbound, $negativesub1, $negativesub2, -[$prefix1, $prefix2, $prefix3, $prefix4, $prefix5, $prefix6, $prefix7, $prefix8, $prefix9], $joinpair, $cleanup] \ No newline at end of file +[$prefix1, $prefix2, $prefix3, $prefix4, $prefix5, $prefix6, $prefix7, $prefix8, $prefix9], $joinpair, $cleanup] diff --git a/asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_2_1/basic-1_2_1.8.query.aql b/asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_2_1/basic-1_2_1.8.query.aql new file mode 100644 index 0000000..56717bd --- /dev/null +++ b/asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_2_1/basic-1_2_1.8.query.aql @@ -0,0 +1,88 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. 
See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ +use dataverse fuzzyjoin_basic; + +set import-private-functions 'true' + +let $left := [1, 5, 6, 7] +let $right := [4, 5, 6] +let $leftnull := [null, null, 5, 6, 7] +let $rightnull := [4, 5, 6] +let $nullstring := [null, null, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10] + +let $bound := +for $l in [1] +return [ + [ + similarity-jaccard-prefix(3, [1, 2, 3], 3, [1, 2, 3], 1, 1f), + similarity-jaccard-prefix(3, [1, 2, 3], 3, [1, 2, 4], 1, .5f), + similarity-jaccard-prefix(3, [1, 2, 3], 3, [1, 2, 4], 1, .6f), + similarity-jaccard-prefix(3, [1, 2, 3], 9, [1, 2, 3], 1, .5f), + similarity-jaccard-prefix(4, [1, 2, 3, 4], 2, [1, 2], 1, .5f), + similarity-jaccard-prefix(4, [1, 2, 3, 4], 4, [1, 2], 1, .33f) + ],[ + similarity-jaccard-prefix(3, [1, 2, 3], 3, [1, 2, 3], 2, 1f), + similarity-jaccard-prefix(3, [1, 2, 3], 3, [1, 2, 4], 2, .5f), + similarity-jaccard-prefix(3, [1, 2, 3], 3, [1, 2, 4], 2, .6f), + similarity-jaccard-prefix(3, [1, 2, 3], 9, [1, 2, 3], 2, .5f), + similarity-jaccard-prefix(4, [1, 2, 3, 4], 2, [1, 2], 2, .5f), + similarity-jaccard-prefix(4, [1, 2, 3, 4], 4, [1, 2], 2, .33f) + ],[ + similarity-jaccard-prefix(3, [1, 2, 3], 3, [1, 2, 3], 3, 1f), + similarity-jaccard-prefix(3, [1, 2, 3], 3, [1, 2, 4], 3, .5f), + similarity-jaccard-prefix(3, [1, 2, 3], 3, [1, 2, 4], 3, .6f), + 
similarity-jaccard-prefix(3, [1, 2, 3], 9, [1, 2, 3], 3, .5f), + similarity-jaccard-prefix(4, [1, 2, 3, 4], 2, [1, 2], 3, .5f), + similarity-jaccard-prefix(4, [1, 2, 3, 4], 4, [1, 2], 3, .33f) + ] +] + +let $trybound := +for $l in [1] +return [ +similarity-jaccard-prefix(8, [3, 4, 5, 6, 7, 8], 10, [0, 0, 3, 4, 5, 6, 7, 8, 9, 10], -1, 0.5f), +similarity-jaccard-prefix(8, [1, 2, 3, 4, 5, 6, 7, 8], 10, [3, 4, 5, 6, 7, 8, 9, 10], 0, 0.5f), +similarity-jaccard-prefix(8, [3, 4, 5, 6, 7, 8], 10, [0, 0, 3, 4, 5, 6, 7, 8, 9, 10], 1, 0.5f), +similarity-jaccard-prefix(8, [1, 2, 3, 4, 5, 6, 7, 8], 10, [3, 4, 5, 6, 7, 8, 9, 10], 2, 0.5f), +similarity-jaccard-prefix(8, [3, 4, 5, 6, 7, 8], 10, [0, 0, 3, 4, 5, 6, 7, 8, 9, 10], 3, 0.5f), +similarity-jaccard-prefix(8, [1, 2, 3, 4, 5, 6, 7, 8], 10, [3, 4, 5, 6, 7, 8, 9, 10], 4, 0.5f), +similarity-jaccard-prefix(8, [3, 4, 5, 6, 7, 8], 10, [0, 0, 3, 4, 5, 6, 7, 8, 9, 10], 5, 0.5f), +similarity-jaccard-prefix(8, [1, 2, 3, 4, 5, 6, 7, 8], 10, [3, 4, 5, 6, 7, 8, 9, 10], 6, 0.5f), +similarity-jaccard-prefix(8, [3, 4, 5, 6, 7, 8], 10, [0, 0, 3, 4, 5, 6, 7, 8, 9, 10], 7, 0.5f), +similarity-jaccard-prefix(8, [1, 2, 3, 4, 5, 6, 7, 8], 10, [0, 0, 3, 4, 5, 6, 7, 8, 9, 10], 8, 0.5f), +similarity-jaccard-prefix(8, [1, 2, 3, 4, 5, 6, 7, 8], 10, [0, 0, 3, 4, 5, 6, 7, 8, 9, 10], 9, 0.5f), +similarity-jaccard-prefix(8, [1, 2, 3, 4, 5, 6, 7, 8], 10, [0, 0, 3, 4, 5, 6, 7, 8, 9, 10], 10, 0.5f), +similarity-jaccard-prefix(8, [1, 2, 5, 6, 7, 3, 4, 8], 10, [4, 5, 0, 0, 3, 6, 7, 8, 9, 10], 11, 0.5f) +] + +let $checkbound := +for $l in [1] +return [ +similarity-jaccard-check([1, 2, 3, 4, 5, 6, 7, 8], [null, 0, 3, 4, 5, 6, 7, 8, 9, 10], 0.1f), +similarity-jaccard-check([null, 2, 3, 4, 5, 6, 7, 8], [null, 0, 3, 4, 5, 6, 7, 8, 9, 10], 0.2f), +similarity-jaccard-check([null, 2, 3, 4, 5, 6, 7, 8], [null, null, 3, 4, 5, 6, 7, 8, 9, 10], 0.3f), +similarity-jaccard-check([null, null, 3, 4, 5, 6, 7, 8], [null, null, 3, 4, 5, 6, 7, 8, 9, 10], 0.4f), 
+similarity-jaccard-check([1, 2, 3, 4, 5, 6, 7, 8], [null, null, 3, 4, 5, 6, 7, 8, 9, 10], 0.5f), +similarity-jaccard-check([1, 2, 3, 4, 5, 6, 7, 8], [0, 2, 3, 4, 5, 6, 7, 8, 9, 10], 0.6f), +similarity-jaccard-check([1, 2, 3, 4, 5, 6, 7, 8], [null, null, 3, 4, 5, 6, 7, 8, 2], 0.7f), +similarity-jaccard-check([1, 2, 3, 4, 5, 6, 7, 8], [null, null, 3, 4, 5, 6, 7, 8, 1, 2], 0.8f), +similarity-jaccard-check([1, 2, 3, 4, 5, 6, 7, 8, 9], [null, 2, 3, 4, 5, 6, 7, 8, 9, 1], 0.9f) +] + +return [$bound, $trybound, $checkbound] \ No newline at end of file diff --git a/asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_2_1/basic-1_2_1.9.query.aql b/asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_2_1/basic-1_2_1.9.query.aql new file mode 100644 index 0000000..fa76621 --- /dev/null +++ b/asterixdb/asterix-app/src/test/resources/runtimets/queries/fuzzyjoin/basic-1_2_1/basic-1_2_1.9.query.aql @@ -0,0 +1,36 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. 
+ */ +use dataverse fuzzyjoin_basic; + +set import-private-functions 'true' + +let $left := [1, 5, 6, 7] +let $right := [4, 5, 6] +let $leftnull := [null, null, 5, 6, 7] +let $rightnull := [4, 5, 6] +let $nullstring := [null, null, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10] + +let $clearnull := +for $index at $i in $nullstring +where $nullstring[$i] <= null +return int16(string($nullstring[$i])) + 64 + +let $cleanup := [$clearnull, $nullstring] + +return [$cleanup] \ No newline at end of file diff --git a/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_1_1/basic-1_1_1.1.adm b/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_1_1/basic-1_1_1.1.adm index b72e004..d9b32e5 100644 --- a/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_1_1/basic-1_1_1.1.adm +++ b/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_1_1/basic-1_1_1.1.adm @@ -1,13 +1 @@ -{ "authors": "Antti Airola Sampo Pyysalo Jari Björne Tapio Pahikkala Filip Ginter Tapio Salakoski", "hdistinct": [ -1703879002, -1473242502, -1260858361, -981055830, -887832212, -658173301, -658173300, 152866250, 1308706204, 1407504920, 1571121603, 1673795737 ], "hcount": 12, "hash": [ 1407504920, -1473242502, -981055830, 1673795737, 152866250, -1260858361, -658173301, -1703879002, -887832212, 1571121603, -658173300, 1308706204 ], "vhcount": 12, "wdistinct": [ "airola", "antti", "björne", "filip", "ginter", "jari", "pahikkala", "pyysalo", "salakoski", "sampo", "tapio" ], "wcount": 11, "word": [ "antti", "airola", "sampo", "pyysalo", "jari", "björne", "tapio", "pahikkala", "filip", "ginter", "tapio", "salakoski" ], "vwcount": 12 } -{ "authors": "Bart Baesens Stijn Viaene Tony Van Gestel Johan A. K. 
Suykens Guido Dedene Bart De Moor Jan Vanthienen", "hdistinct": [ -1935703338, -1911867284, -1622104926, -1358578075, -935776866, -214094487, 111100446, 178525531, 183137487, 202777881, 387687108, 476250961, 819214362, 1203632773, 1456032451, 2095219701, 2095219702, 2132187494 ], "hcount": 18, "hash": [ 2095219701, -1358578075, -1911867284, -1622104926, 2132187494, -214094487, -935776866, 387687108, 202777881, 1456032451, 111100446, 819214362, 178525531, 2095219702, 476250961, 183137487, 1203632773, -1935703338 ], "vhcount": 18, "wdistinct": [ "a", "baesens", "bart", "de", "dedene", "gestel", "guido", "jan", "johan", "k", "moor", "stijn", "suykens", "tony", "van", "vanthienen", "viaene" ], "wcount": 17, "word": [ "bart", "baesens", "stijn", "viaene", "tony", "van", "gestel", "johan", "a", "k", "suykens", "guido", "dedene", "bart", "de", "moor", "jan", "vanthienen" ], "vwcount": 18 } -{ "authors": "Cheong Hee Park Haesun Park", "hdistinct": [ 201502510, 1474696610, 1474696611, 1810069474, 1813499426 ], "hcount": 5, "hash": [ 1813499426, 1810069474, 1474696610, 201502510, 1474696611 ], "vhcount": 5, "wdistinct": [ "cheong", "haesun", "hee", "park" ], "wcount": 4, "word": [ "cheong", "hee", "park", "haesun", "park" ], "vwcount": 5 } -{ "authors": "Christopher J. C. Burges David J. 
Crisp", "hdistinct": [ -1980517994, -184499076, -184499075, 471822495, 885695371, 1216682123, 1230204720 ], "hcount": 7, "hash": [ 471822495, -184499076, 1216682123, -1980517994, 1230204720, -184499075, 885695371 ], "vhcount": 7, "wdistinct": [ "burges", "c", "christopher", "crisp", "david", "j" ], "wcount": 6, "word": [ "christopher", "j", "c", "burges", "david", "j", "crisp" ], "vwcount": 7 } -{ "authors": "Dominique Chanet Bjorn De Sutter Bruno De Bus Ludo Van Put Koen De Bosschere", "hdistinct": [ -1827235698, -1316812666, -727391969, -698069955, -690862623, -214094487, -204728799, 38143123, 106094358, 476250961, 476250962, 476250963, 1258550913, 1274211164 ], "hcount": 14, "hash": [ 1258550913, -698069955, 38143123, 476250961, -204728799, -1316812666, 476250962, -1827235698, 1274211164, -214094487, -690862623, -727391969, 476250963, 106094358 ], "vhcount": 14, "wdistinct": [ "bjorn", "bosschere", "bruno", "bus", "chanet", "de", "dominique", "koen", "ludo", "put", "sutter", "van" ], "wcount": 12, "word": [ "dominique", "chanet", "bjorn", "de", "sutter", "bruno", "de", "bus", "ludo", "van", "put", "koen", "de", "bosschere" ], "vwcount": 14 } -{ "authors": "Francis R. Bach Gert R. G. Lanckriet Michael I. Jordan", "hdistinct": [ -2039039025, -1050476689, -448767586, 54851252, 54851253, 419477052, 442128209, 637199601, 900395942, 1674769146 ], "hcount": 10, "hash": [ 419477052, 54851252, 1674769146, 900395942, 54851253, -1050476689, 637199601, -2039039025, 442128209, -448767586 ], "vhcount": 10, "wdistinct": [ "bach", "francis", "g", "gert", "i", "jordan", "lanckriet", "michael", "r" ], "wcount": 9, "word": [ "francis", "r", "bach", "gert", "r", "g", "lanckriet", "michael", "i", "jordan" ], "vwcount": 10 } -{ "authors": "Gavin C. Cawley Nicola L. C. 
Talbot", "hdistinct": [ -886454414, -534088337, 441647848, 481225853, 829405166, 1216682123, 1216682124 ], "hcount": 7, "hash": [ -534088337, 1216682123, 481225853, 441647848, 829405166, 1216682124, -886454414 ], "vhcount": 7, "wdistinct": [ "c", "cawley", "gavin", "l", "nicola", "talbot" ], "wcount": 6, "word": [ "gavin", "c", "cawley", "nicola", "l", "c", "talbot" ], "vwcount": 7 } -{ "authors": "Gavin C. Cawley Nicola L. C. Talbot Robert J. Foxall Stephen R. Dorling Danilo P. Mandic", "hdistinct": [ -1252796223, -959052990, -886454414, -534088337, -184499076, -130111359, 54851252, 411288970, 414405350, 441647848, 481225853, 829405166, 1216682123, 1216682124, 1304455685, 1784033734 ], "hcount": 16, "hash": [ -534088337, 1216682123, 481225853, 441647848, 829405166, 1216682124, -886454414, 414405350, -184499076, 411288970, -1252796223, 54851252, 1304455685, -130111359, -959052990, 1784033734 ], "vhcount": 16, "wdistinct": [ "c", "cawley", "danilo", "dorling", "foxall", "gavin", "j", "l", "mandic", "nicola", "p", "r", "robert", "stephen", "talbot" ], "wcount": 15, "word": [ "gavin", "c", "cawley", "nicola", "l", "c", "talbot", "robert", "j", "foxall", "stephen", "r", "dorling", "danilo", "p", "mandic" ], "vwcount": 16 } -{ "authors": "R. 
Venkatesh Babu Patrick Pérez Patrick Bouthemy", "hdistinct": [ -1978580578, -1106952520, -1106952519, 54851252, 199754598, 672789821, 1248452165 ], "hcount": 7, "hash": [ 54851252, 672789821, -1978580578, -1106952520, 199754598, -1106952519, 1248452165 ], "vhcount": 7, "wdistinct": [ "babu", "bouthemy", "patrick", "pérez", "r", "venkatesh" ], "wcount": 6, "word": [ "r", "venkatesh", "babu", "patrick", "pérez", "patrick", "bouthemy" ], "vwcount": 7 } -{ "authors": "Rafael Serrano-Gotarredona Teresa Serrano-Gotarredona Antonio Acosta-Jimenez Bernabé Linares-Barranco", "hdistinct": [ -1956851570, -1956851569, -1726594101, -1691145788, -1282838506, -564025963, -75151904, -75151903, 405246970, 487904168, 819607985, 1017487486 ], "hcount": 12, "hash": [ -564025963, -75151904, -1956851570, -1282838506, -75151903, -1956851569, 1017487486, -1726594101, -1691145788, 819607985, 487904168, 405246970 ], "vhcount": 12, "wdistinct": [ "acosta", "antonio", "barranco", "bernabé", "gotarredona", "jimenez", "linares", "rafael", "serrano", "teresa" ], "wcount": 10, "word": [ "rafael", "serrano", "gotarredona", "teresa", "serrano", "gotarredona", "antonio", "acosta", "jimenez", "bernabé", "linares", "barranco" ], "vwcount": 12 } -{ "authors": "Samuel G. Steckley Shane G. 
Henderson", "hdistinct": [ -1415708156, -1050476689, -1050476688, 263160025, 723460411, 1321749268 ], "hcount": 6, "hash": [ 723460411, -1050476689, 1321749268, 263160025, -1050476688, -1415708156 ], "vhcount": 6, "wdistinct": [ "g", "henderson", "samuel", "shane", "steckley" ], "wcount": 5, "word": [ "samuel", "g", "steckley", "shane", "g", "henderson" ], "vwcount": 6 } -{ "authors": "Susan Hert Michael Hoffmann Lutz Kettner Sylvain Pion Michael Seel", "hdistinct": [ -2138581461, -2081084774, -2039039025, -2039039024, -1863687409, -735414009, -716104536, -581739473, -340039108, 1858351859 ], "hcount": 10, "hash": [ -340039108, -2138581461, -2039039025, 1858351859, -735414009, -1863687409, -716104536, -2081084774, -2039039024, -581739473 ], "vhcount": 10, "wdistinct": [ "hert", "hoffmann", "kettner", "lutz", "michael", "pion", "seel", "susan", "sylvain" ], "wcount": 9, "word": [ "susan", "hert", "michael", "hoffmann", "lutz", "kettner", "sylvain", "pion", "michael", "seel" ], "vwcount": 10 } -{ "authors": "Tony Van Gestel Bart Baesens Johan A. K. 
Suykens Dirk Van den Poel Dirk-Emma Baestaens Marleen Willekens", "hdistinct": [ -1424854606, -1358578075, -1067178786, -935776866, -389896470, -214094487, -214094486, 111100446, 202777881, 367084408, 387687108, 395536654, 395536655, 699609214, 1181197775, 1456032451, 2095219701, 2132187494 ], "hcount": 18, "hash": [ 2132187494, -214094487, -935776866, 2095219701, -1358578075, 387687108, 202777881, 1456032451, 111100446, 395536654, -214094486, 1181197775, 367084408, 395536655, 699609214, -1424854606, -1067178786, -389896470 ], "vhcount": 18, "wdistinct": [ "a", "baesens", "baestaens", "bart", "den", "dirk", "emma", "gestel", "johan", "k", "marleen", "poel", "suykens", "tony", "van", "willekens" ], "wcount": 16, "word": [ "tony", "van", "gestel", "bart", "baesens", "johan", "a", "k", "suykens", "dirk", "van", "den", "poel", "dirk", "emma", "baestaens", "marleen", "willekens" ], "vwcount": 18 } +{ "raw string": "Tony Van Gestel Bart Baesens Johan A. K. Suykens Dirk Van den Poel Dirk-Emma Baestaens Marleen Willekens", "word-tokens": [ "tony", "van", "gestel", "bart", "baesens", "johan", "a", "k", "suykens", "dirk", "van", "den", "poel", "dirk", "emma", "baestaens", "marleen", "willekens" ], "word-tokens-len": 18, "hashed-word-tokens": [ 2132187494, -214094487, -935776866, 2095219701, -1358578075, 387687108, 202777881, 1456032451, 111100446, 395536654, -214094487, 1181197775, 367084408, 395536654, 699609214, -1424854606, -1067178786, -389896470 ], "hashed-word-tokens-len": 18, "counthashed-word-tokens": [ 2132187494, -214094487, -935776866, 2095219701, -1358578075, 387687108, 202777881, 1456032451, 111100446, 395536654, -214094486, 1181197775, 367084408, 395536655, 699609214, -1424854606, -1067178786, -389896470 ], "counthashed-word-tokens-len": 18, "pre-word-tokens": [ "a", "baesens", "baestaens", "bart", "den", "dirk", "emma", "gestel", "johan", "k", "marleen", "poel", "suykens", "tony", "van", "willekens" ], "pre-word-tokens-len": 16, "pre-hashed-word-tokens": [ 
-1424854606, -1358578075, -1067178786, -935776866, -389896470, -214094487, 111100446, 202777881, 367084408, 387687108, 395536654, 699609214, 1181197775, 1456032451, 2095219701, 2132187494 ], "pre-hashed-word-tokens-len": 16, "pre-counthashed-word-tokens": [ -1424854606, -1358578075, -1067178786, -935776866, -389896470, -214094487, -214094486, 111100446, 202777881, 367084408, 387687108, 395536654, 395536655, 699609214, 1181197775, 1456032451, 2095219701, 2132187494 ], "pre-counthashed-word-tokens-len": 18 } diff --git a/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_1_1/basic-1_1_1.3.adm b/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_1_1/basic-1_1_1.3.adm new file mode 100644 index 0000000..b72e004 --- /dev/null +++ b/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_1_1/basic-1_1_1.3.adm @@ -0,0 +1,13 @@ +{ "authors": "Antti Airola Sampo Pyysalo Jari Björne Tapio Pahikkala Filip Ginter Tapio Salakoski", "hdistinct": [ -1703879002, -1473242502, -1260858361, -981055830, -887832212, -658173301, -658173300, 152866250, 1308706204, 1407504920, 1571121603, 1673795737 ], "hcount": 12, "hash": [ 1407504920, -1473242502, -981055830, 1673795737, 152866250, -1260858361, -658173301, -1703879002, -887832212, 1571121603, -658173300, 1308706204 ], "vhcount": 12, "wdistinct": [ "airola", "antti", "björne", "filip", "ginter", "jari", "pahikkala", "pyysalo", "salakoski", "sampo", "tapio" ], "wcount": 11, "word": [ "antti", "airola", "sampo", "pyysalo", "jari", "björne", "tapio", "pahikkala", "filip", "ginter", "tapio", "salakoski" ], "vwcount": 12 } +{ "authors": "Bart Baesens Stijn Viaene Tony Van Gestel Johan A. K. 
Suykens Guido Dedene Bart De Moor Jan Vanthienen", "hdistinct": [ -1935703338, -1911867284, -1622104926, -1358578075, -935776866, -214094487, 111100446, 178525531, 183137487, 202777881, 387687108, 476250961, 819214362, 1203632773, 1456032451, 2095219701, 2095219702, 2132187494 ], "hcount": 18, "hash": [ 2095219701, -1358578075, -1911867284, -1622104926, 2132187494, -214094487, -935776866, 387687108, 202777881, 1456032451, 111100446, 819214362, 178525531, 2095219702, 476250961, 183137487, 1203632773, -1935703338 ], "vhcount": 18, "wdistinct": [ "a", "baesens", "bart", "de", "dedene", "gestel", "guido", "jan", "johan", "k", "moor", "stijn", "suykens", "tony", "van", "vanthienen", "viaene" ], "wcount": 17, "word": [ "bart", "baesens", "stijn", "viaene", "tony", "van", "gestel", "johan", "a", "k", "suykens", "guido", "dedene", "bart", "de", "moor", "jan", "vanthienen" ], "vwcount": 18 } +{ "authors": "Cheong Hee Park Haesun Park", "hdistinct": [ 201502510, 1474696610, 1474696611, 1810069474, 1813499426 ], "hcount": 5, "hash": [ 1813499426, 1810069474, 1474696610, 201502510, 1474696611 ], "vhcount": 5, "wdistinct": [ "cheong", "haesun", "hee", "park" ], "wcount": 4, "word": [ "cheong", "hee", "park", "haesun", "park" ], "vwcount": 5 } +{ "authors": "Christopher J. C. Burges David J. 
Crisp", "hdistinct": [ -1980517994, -184499076, -184499075, 471822495, 885695371, 1216682123, 1230204720 ], "hcount": 7, "hash": [ 471822495, -184499076, 1216682123, -1980517994, 1230204720, -184499075, 885695371 ], "vhcount": 7, "wdistinct": [ "burges", "c", "christopher", "crisp", "david", "j" ], "wcount": 6, "word": [ "christopher", "j", "c", "burges", "david", "j", "crisp" ], "vwcount": 7 } +{ "authors": "Dominique Chanet Bjorn De Sutter Bruno De Bus Ludo Van Put Koen De Bosschere", "hdistinct": [ -1827235698, -1316812666, -727391969, -698069955, -690862623, -214094487, -204728799, 38143123, 106094358, 476250961, 476250962, 476250963, 1258550913, 1274211164 ], "hcount": 14, "hash": [ 1258550913, -698069955, 38143123, 476250961, -204728799, -1316812666, 476250962, -1827235698, 1274211164, -214094487, -690862623, -727391969, 476250963, 106094358 ], "vhcount": 14, "wdistinct": [ "bjorn", "bosschere", "bruno", "bus", "chanet", "de", "dominique", "koen", "ludo", "put", "sutter", "van" ], "wcount": 12, "word": [ "dominique", "chanet", "bjorn", "de", "sutter", "bruno", "de", "bus", "ludo", "van", "put", "koen", "de", "bosschere" ], "vwcount": 14 } +{ "authors": "Francis R. Bach Gert R. G. Lanckriet Michael I. Jordan", "hdistinct": [ -2039039025, -1050476689, -448767586, 54851252, 54851253, 419477052, 442128209, 637199601, 900395942, 1674769146 ], "hcount": 10, "hash": [ 419477052, 54851252, 1674769146, 900395942, 54851253, -1050476689, 637199601, -2039039025, 442128209, -448767586 ], "vhcount": 10, "wdistinct": [ "bach", "francis", "g", "gert", "i", "jordan", "lanckriet", "michael", "r" ], "wcount": 9, "word": [ "francis", "r", "bach", "gert", "r", "g", "lanckriet", "michael", "i", "jordan" ], "vwcount": 10 } +{ "authors": "Gavin C. Cawley Nicola L. C. 
Talbot", "hdistinct": [ -886454414, -534088337, 441647848, 481225853, 829405166, 1216682123, 1216682124 ], "hcount": 7, "hash": [ -534088337, 1216682123, 481225853, 441647848, 829405166, 1216682124, -886454414 ], "vhcount": 7, "wdistinct": [ "c", "cawley", "gavin", "l", "nicola", "talbot" ], "wcount": 6, "word": [ "gavin", "c", "cawley", "nicola", "l", "c", "talbot" ], "vwcount": 7 } +{ "authors": "Gavin C. Cawley Nicola L. C. Talbot Robert J. Foxall Stephen R. Dorling Danilo P. Mandic", "hdistinct": [ -1252796223, -959052990, -886454414, -534088337, -184499076, -130111359, 54851252, 411288970, 414405350, 441647848, 481225853, 829405166, 1216682123, 1216682124, 1304455685, 1784033734 ], "hcount": 16, "hash": [ -534088337, 1216682123, 481225853, 441647848, 829405166, 1216682124, -886454414, 414405350, -184499076, 411288970, -1252796223, 54851252, 1304455685, -130111359, -959052990, 1784033734 ], "vhcount": 16, "wdistinct": [ "c", "cawley", "danilo", "dorling", "foxall", "gavin", "j", "l", "mandic", "nicola", "p", "r", "robert", "stephen", "talbot" ], "wcount": 15, "word": [ "gavin", "c", "cawley", "nicola", "l", "c", "talbot", "robert", "j", "foxall", "stephen", "r", "dorling", "danilo", "p", "mandic" ], "vwcount": 16 } +{ "authors": "R. 
Venkatesh Babu Patrick Pérez Patrick Bouthemy", "hdistinct": [ -1978580578, -1106952520, -1106952519, 54851252, 199754598, 672789821, 1248452165 ], "hcount": 7, "hash": [ 54851252, 672789821, -1978580578, -1106952520, 199754598, -1106952519, 1248452165 ], "vhcount": 7, "wdistinct": [ "babu", "bouthemy", "patrick", "pérez", "r", "venkatesh" ], "wcount": 6, "word": [ "r", "venkatesh", "babu", "patrick", "pérez", "patrick", "bouthemy" ], "vwcount": 7 } +{ "authors": "Rafael Serrano-Gotarredona Teresa Serrano-Gotarredona Antonio Acosta-Jimenez Bernabé Linares-Barranco", "hdistinct": [ -1956851570, -1956851569, -1726594101, -1691145788, -1282838506, -564025963, -75151904, -75151903, 405246970, 487904168, 819607985, 1017487486 ], "hcount": 12, "hash": [ -564025963, -75151904, -1956851570, -1282838506, -75151903, -1956851569, 1017487486, -1726594101, -1691145788, 819607985, 487904168, 405246970 ], "vhcount": 12, "wdistinct": [ "acosta", "antonio", "barranco", "bernabé", "gotarredona", "jimenez", "linares", "rafael", "serrano", "teresa" ], "wcount": 10, "word": [ "rafael", "serrano", "gotarredona", "teresa", "serrano", "gotarredona", "antonio", "acosta", "jimenez", "bernabé", "linares", "barranco" ], "vwcount": 12 } +{ "authors": "Samuel G. Steckley Shane G. 
Henderson", "hdistinct": [ -1415708156, -1050476689, -1050476688, 263160025, 723460411, 1321749268 ], "hcount": 6, "hash": [ 723460411, -1050476689, 1321749268, 263160025, -1050476688, -1415708156 ], "vhcount": 6, "wdistinct": [ "g", "henderson", "samuel", "shane", "steckley" ], "wcount": 5, "word": [ "samuel", "g", "steckley", "shane", "g", "henderson" ], "vwcount": 6 } +{ "authors": "Susan Hert Michael Hoffmann Lutz Kettner Sylvain Pion Michael Seel", "hdistinct": [ -2138581461, -2081084774, -2039039025, -2039039024, -1863687409, -735414009, -716104536, -581739473, -340039108, 1858351859 ], "hcount": 10, "hash": [ -340039108, -2138581461, -2039039025, 1858351859, -735414009, -1863687409, -716104536, -2081084774, -2039039024, -581739473 ], "vhcount": 10, "wdistinct": [ "hert", "hoffmann", "kettner", "lutz", "michael", "pion", "seel", "susan", "sylvain" ], "wcount": 9, "word": [ "susan", "hert", "michael", "hoffmann", "lutz", "kettner", "sylvain", "pion", "michael", "seel" ], "vwcount": 10 } +{ "authors": "Tony Van Gestel Bart Baesens Johan A. K. 
Suykens Dirk Van den Poel Dirk-Emma Baestaens Marleen Willekens", "hdistinct": [ -1424854606, -1358578075, -1067178786, -935776866, -389896470, -214094487, -214094486, 111100446, 202777881, 367084408, 387687108, 395536654, 395536655, 699609214, 1181197775, 1456032451, 2095219701, 2132187494 ], "hcount": 18, "hash": [ 2132187494, -214094487, -935776866, 2095219701, -1358578075, 387687108, 202777881, 1456032451, 111100446, 395536654, -214094486, 1181197775, 367084408, 395536655, 699609214, -1424854606, -1067178786, -389896470 ], "vhcount": 18, "wdistinct": [ "a", "baesens", "baestaens", "bart", "den", "dirk", "emma", "gestel", "johan", "k", "marleen", "poel", "suykens", "tony", "van", "willekens" ], "wcount": 16, "word": [ "tony", "van", "gestel", "bart", "baesens", "johan", "a", "k", "suykens", "dirk", "van", "den", "poel", "dirk", "emma", "baestaens", "marleen", "willekens" ], "vwcount": 18 } diff --git a/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_1_1/basic-1_1_1.4.adm b/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_1_1/basic-1_1_1.4.adm new file mode 100644 index 0000000..b72e004 --- /dev/null +++ b/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_1_1/basic-1_1_1.4.adm @@ -0,0 +1,13 @@ +{ "authors": "Antti Airola Sampo Pyysalo Jari Björne Tapio Pahikkala Filip Ginter Tapio Salakoski", "hdistinct": [ -1703879002, -1473242502, -1260858361, -981055830, -887832212, -658173301, -658173300, 152866250, 1308706204, 1407504920, 1571121603, 1673795737 ], "hcount": 12, "hash": [ 1407504920, -1473242502, -981055830, 1673795737, 152866250, -1260858361, -658173301, -1703879002, -887832212, 1571121603, -658173300, 1308706204 ], "vhcount": 12, "wdistinct": [ "airola", "antti", "björne", "filip", "ginter", "jari", "pahikkala", "pyysalo", "salakoski", "sampo", "tapio" ], "wcount": 11, "word": [ "antti", "airola", "sampo", "pyysalo", "jari", "björne", "tapio", "pahikkala", "filip", "ginter", 
"tapio", "salakoski" ], "vwcount": 12 } +{ "authors": "Bart Baesens Stijn Viaene Tony Van Gestel Johan A. K. Suykens Guido Dedene Bart De Moor Jan Vanthienen", "hdistinct": [ -1935703338, -1911867284, -1622104926, -1358578075, -935776866, -214094487, 111100446, 178525531, 183137487, 202777881, 387687108, 476250961, 819214362, 1203632773, 1456032451, 2095219701, 2095219702, 2132187494 ], "hcount": 18, "hash": [ 2095219701, -1358578075, -1911867284, -1622104926, 2132187494, -214094487, -935776866, 387687108, 202777881, 1456032451, 111100446, 819214362, 178525531, 2095219702, 476250961, 183137487, 1203632773, -1935703338 ], "vhcount": 18, "wdistinct": [ "a", "baesens", "bart", "de", "dedene", "gestel", "guido", "jan", "johan", "k", "moor", "stijn", "suykens", "tony", "van", "vanthienen", "viaene" ], "wcount": 17, "word": [ "bart", "baesens", "stijn", "viaene", "tony", "van", "gestel", "johan", "a", "k", "suykens", "guido", "dedene", "bart", "de", "moor", "jan", "vanthienen" ], "vwcount": 18 } +{ "authors": "Cheong Hee Park Haesun Park", "hdistinct": [ 201502510, 1474696610, 1474696611, 1810069474, 1813499426 ], "hcount": 5, "hash": [ 1813499426, 1810069474, 1474696610, 201502510, 1474696611 ], "vhcount": 5, "wdistinct": [ "cheong", "haesun", "hee", "park" ], "wcount": 4, "word": [ "cheong", "hee", "park", "haesun", "park" ], "vwcount": 5 } +{ "authors": "Christopher J. C. Burges David J. 
Crisp", "hdistinct": [ -1980517994, -184499076, -184499075, 471822495, 885695371, 1216682123, 1230204720 ], "hcount": 7, "hash": [ 471822495, -184499076, 1216682123, -1980517994, 1230204720, -184499075, 885695371 ], "vhcount": 7, "wdistinct": [ "burges", "c", "christopher", "crisp", "david", "j" ], "wcount": 6, "word": [ "christopher", "j", "c", "burges", "david", "j", "crisp" ], "vwcount": 7 } +{ "authors": "Dominique Chanet Bjorn De Sutter Bruno De Bus Ludo Van Put Koen De Bosschere", "hdistinct": [ -1827235698, -1316812666, -727391969, -698069955, -690862623, -214094487, -204728799, 38143123, 106094358, 476250961, 476250962, 476250963, 1258550913, 1274211164 ], "hcount": 14, "hash": [ 1258550913, -698069955, 38143123, 476250961, -204728799, -1316812666, 476250962, -1827235698, 1274211164, -214094487, -690862623, -727391969, 476250963, 106094358 ], "vhcount": 14, "wdistinct": [ "bjorn", "bosschere", "bruno", "bus", "chanet", "de", "dominique", "koen", "ludo", "put", "sutter", "van" ], "wcount": 12, "word": [ "dominique", "chanet", "bjorn", "de", "sutter", "bruno", "de", "bus", "ludo", "van", "put", "koen", "de", "bosschere" ], "vwcount": 14 } +{ "authors": "Francis R. Bach Gert R. G. Lanckriet Michael I. Jordan", "hdistinct": [ -2039039025, -1050476689, -448767586, 54851252, 54851253, 419477052, 442128209, 637199601, 900395942, 1674769146 ], "hcount": 10, "hash": [ 419477052, 54851252, 1674769146, 900395942, 54851253, -1050476689, 637199601, -2039039025, 442128209, -448767586 ], "vhcount": 10, "wdistinct": [ "bach", "francis", "g", "gert", "i", "jordan", "lanckriet", "michael", "r" ], "wcount": 9, "word": [ "francis", "r", "bach", "gert", "r", "g", "lanckriet", "michael", "i", "jordan" ], "vwcount": 10 } +{ "authors": "Gavin C. Cawley Nicola L. C. 
Talbot", "hdistinct": [ -886454414, -534088337, 441647848, 481225853, 829405166, 1216682123, 1216682124 ], "hcount": 7, "hash": [ -534088337, 1216682123, 481225853, 441647848, 829405166, 1216682124, -886454414 ], "vhcount": 7, "wdistinct": [ "c", "cawley", "gavin", "l", "nicola", "talbot" ], "wcount": 6, "word": [ "gavin", "c", "cawley", "nicola", "l", "c", "talbot" ], "vwcount": 7 } +{ "authors": "Gavin C. Cawley Nicola L. C. Talbot Robert J. Foxall Stephen R. Dorling Danilo P. Mandic", "hdistinct": [ -1252796223, -959052990, -886454414, -534088337, -184499076, -130111359, 54851252, 411288970, 414405350, 441647848, 481225853, 829405166, 1216682123, 1216682124, 1304455685, 1784033734 ], "hcount": 16, "hash": [ -534088337, 1216682123, 481225853, 441647848, 829405166, 1216682124, -886454414, 414405350, -184499076, 411288970, -1252796223, 54851252, 1304455685, -130111359, -959052990, 1784033734 ], "vhcount": 16, "wdistinct": [ "c", "cawley", "danilo", "dorling", "foxall", "gavin", "j", "l", "mandic", "nicola", "p", "r", "robert", "stephen", "talbot" ], "wcount": 15, "word": [ "gavin", "c", "cawley", "nicola", "l", "c", "talbot", "robert", "j", "foxall", "stephen", "r", "dorling", "danilo", "p", "mandic" ], "vwcount": 16 } +{ "authors": "R. 
Venkatesh Babu Patrick Pérez Patrick Bouthemy", "hdistinct": [ -1978580578, -1106952520, -1106952519, 54851252, 199754598, 672789821, 1248452165 ], "hcount": 7, "hash": [ 54851252, 672789821, -1978580578, -1106952520, 199754598, -1106952519, 1248452165 ], "vhcount": 7, "wdistinct": [ "babu", "bouthemy", "patrick", "pérez", "r", "venkatesh" ], "wcount": 6, "word": [ "r", "venkatesh", "babu", "patrick", "pérez", "patrick", "bouthemy" ], "vwcount": 7 } +{ "authors": "Rafael Serrano-Gotarredona Teresa Serrano-Gotarredona Antonio Acosta-Jimenez Bernabé Linares-Barranco", "hdistinct": [ -1956851570, -1956851569, -1726594101, -1691145788, -1282838506, -564025963, -75151904, -75151903, 405246970, 487904168, 819607985, 1017487486 ], "hcount": 12, "hash": [ -564025963, -75151904, -1956851570, -1282838506, -75151903, -1956851569, 1017487486, -1726594101, -1691145788, 819607985, 487904168, 405246970 ], "vhcount": 12, "wdistinct": [ "acosta", "antonio", "barranco", "bernabé", "gotarredona", "jimenez", "linares", "rafael", "serrano", "teresa" ], "wcount": 10, "word": [ "rafael", "serrano", "gotarredona", "teresa", "serrano", "gotarredona", "antonio", "acosta", "jimenez", "bernabé", "linares", "barranco" ], "vwcount": 12 } +{ "authors": "Samuel G. Steckley Shane G. 
Henderson", "hdistinct": [ -1415708156, -1050476689, -1050476688, 263160025, 723460411, 1321749268 ], "hcount": 6, "hash": [ 723460411, -1050476689, 1321749268, 263160025, -1050476688, -1415708156 ], "vhcount": 6, "wdistinct": [ "g", "henderson", "samuel", "shane", "steckley" ], "wcount": 5, "word": [ "samuel", "g", "steckley", "shane", "g", "henderson" ], "vwcount": 6 } +{ "authors": "Susan Hert Michael Hoffmann Lutz Kettner Sylvain Pion Michael Seel", "hdistinct": [ -2138581461, -2081084774, -2039039025, -2039039024, -1863687409, -735414009, -716104536, -581739473, -340039108, 1858351859 ], "hcount": 10, "hash": [ -340039108, -2138581461, -2039039025, 1858351859, -735414009, -1863687409, -716104536, -2081084774, -2039039024, -581739473 ], "vhcount": 10, "wdistinct": [ "hert", "hoffmann", "kettner", "lutz", "michael", "pion", "seel", "susan", "sylvain" ], "wcount": 9, "word": [ "susan", "hert", "michael", "hoffmann", "lutz", "kettner", "sylvain", "pion", "michael", "seel" ], "vwcount": 10 } +{ "authors": "Tony Van Gestel Bart Baesens Johan A. K. 
Suykens Dirk Van den Poel Dirk-Emma Baestaens Marleen Willekens", "hdistinct": [ -1424854606, -1358578075, -1067178786, -935776866, -389896470, -214094487, -214094486, 111100446, 202777881, 367084408, 387687108, 395536654, 395536655, 699609214, 1181197775, 1456032451, 2095219701, 2132187494 ], "hcount": 18, "hash": [ 2132187494, -214094487, -935776866, 2095219701, -1358578075, 387687108, 202777881, 1456032451, 111100446, 395536654, -214094486, 1181197775, 367084408, 395536655, 699609214, -1424854606, -1067178786, -389896470 ], "vhcount": 18, "wdistinct": [ "a", "baesens", "baestaens", "bart", "den", "dirk", "emma", "gestel", "johan", "k", "marleen", "poel", "suykens", "tony", "van", "willekens" ], "wcount": 16, "word": [ "tony", "van", "gestel", "bart", "baesens", "johan", "a", "k", "suykens", "dirk", "van", "den", "poel", "dirk", "emma", "baestaens", "marleen", "willekens" ], "vwcount": 18 } diff --git a/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_2_1/basic-1_2_1.10.adm b/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_2_1/basic-1_2_1.10.adm new file mode 100644 index 0000000..b414108 --- /dev/null +++ b/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_2_1/basic-1_2_1.10.adm @@ -0,0 +1,6 @@ +1 +2 +3 +4 +5 +6 diff --git a/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_2_1/basic-1_2_1.3.adm b/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_2_1/basic-1_2_1.3.adm index fa92713..1285be3 100644 --- a/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_2_1/basic-1_2_1.3.adm +++ b/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_2_1/basic-1_2_1.3.adm @@ -1 +1 @@ -[ [ 4, 5 ], 0.33333334, 0.4, 0.33333334, 0.5, 0.5, [ [ [ 1.0, 0.5, 0.0, 0.0, 0.5, 0.33333334 ], [ 1.0, 0.5, 0.0, 0.0, 0.5, 0.33333334 ], [ 1.0, 0.0, 0.0, 0.0, 0.0, 0.0 ] ] ], [ [ 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 
0.5, 0.5, 0.5, 0.5, 0.5, 0.0 ] ], [ [ [ true, 0.5 ], [ true, 0.6363636 ], [ true, 0.6363636 ], [ true, 0.8 ], [ true, 0.5 ], [ true, 0.6363636 ], [ true, 0.7 ], [ true, 0.8 ], [ true, 0.9 ] ] ], [ ], [ ], [ [ null, null, 1, 2, 3, 4, 5, 6, 7, 8, 9 ], [ null, null, 1, 2, 3, 4, 5, 6, 7, 8 ], [ null, null, 1, 2, 3, 4, 5, 6, 7 ], [ null, null, 1, 2, 3, 4, 5, 6 ], [ null, null, 1, 2, 3, 4, 5 ], [ null, null, 1, 2, 3 ], [ null, null, 1, 2 ], [ null, null, 1 ], [ null, null ] ], [ 1, 2, 3, 4, 5, 6 ], [ [ ], [ null, null, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10 ] ] ] \ No newline at end of file +[ [ 4, 5 ], 0.33333334, 0.4, 0.33333334, 0.5, 0.5, [ [ [ 1.0, 0.5, 0.0, 0.0, 0.5, 0.33333334 ], [ 1.0, 0.5, 0.0, 0.0, 0.5, 0.33333334 ], [ 1.0, 0.0, 0.0, 0.0, 0.0, 0.0 ] ] ], [ [ 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.0 ] ], [ [ [ true, 0.5 ], [ true, 0.6363636 ], [ true, 0.6363636 ], [ true, 0.8 ], [ true, 0.5 ], [ true, 0.6363636 ], [ true, 0.7 ], [ true, 0.8 ], [ true, 0.9 ] ] ], [ ], [ ], [ [ null, null, 1, 2, 3, 4, 5, 6, 7, 8, 9 ], [ null, null, 1, 2, 3, 4, 5, 6, 7, 8 ], [ null, null, 1, 2, 3, 4, 5, 6, 7 ], [ null, null, 1, 2, 3, 4, 5, 6 ], [ null, null, 1, 2, 3, 4, 5 ], [ null, null, 1, 2, 3 ], [ null, null, 1, 2 ], [ null, null, 1 ], [ null, null ] ], [ 1, 2, 3, 4, 5, 6 ], [ [ ], [ null, null, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10 ] ] ] diff --git a/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_2_1/basic-1_2_1.8.adm b/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_2_1/basic-1_2_1.8.adm new file mode 100644 index 0000000..d932883 --- /dev/null +++ b/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_2_1/basic-1_2_1.8.adm @@ -0,0 +1 @@ +[ [ [ [ 1.0, 0.5, 0.0, 0.0, 0.5, 0.33333334 ], [ 1.0, 0.5, 0.0, 0.0, 0.5, 0.33333334 ], [ 1.0, 0.0, 0.0, 0.0, 0.0, 0.0 ] ] ], [ [ 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.0 ] ], [ [ [ true, 0.5 ], [ true, 0.6363636 ], [ true, 
0.6363636 ], [ true, 0.8 ], [ true, 0.5 ], [ true, 0.6363636 ], [ true, 0.7 ], [ true, 0.8 ], [ true, 0.9 ] ] ] ] diff --git a/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_2_1/basic-1_2_1.9.adm b/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_2_1/basic-1_2_1.9.adm new file mode 100644 index 0000000..39dff83 --- /dev/null +++ b/asterixdb/asterix-app/src/test/resources/runtimets/results/fuzzyjoin/basic-1_2_1/basic-1_2_1.9.adm @@ -0,0 +1 @@ +[ [ [ ], [ null, null, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10 ] ] ] diff --git a/asterixdb/asterix-server/src/test/resources/NCServiceExecutionIT/cc.conf b/asterixdb/asterix-server/src/test/resources/NCServiceExecutionIT/cc.conf index f3dcd63..4ffb974 100644 --- a/asterixdb/asterix-server/src/test/resources/NCServiceExecutionIT/cc.conf +++ b/asterixdb/asterix-server/src/test/resources/NCServiceExecutionIT/cc.conf @@ -36,8 +36,8 @@ address=127.0.0.1 command=asterixnc app.class=org.apache.asterix.hyracks.bootstrap.NCApplication -jvm.args=-Xmx4g -Dnode.Resolver="org.apache.asterix.external.util.IdentitiyResolverFactory" -storage.memorycomponent.globalbudget = 1073741824 +jvm.args=-Xmx7g -Dnode.Resolver="org.apache.asterix.external.util.IdentitiyResolverFactory" +storage.memorycomponent.globalbudget = 536870912 [cc] address = 127.0.0.1 -- To view, visit https://asterix-gerrit.ics.uci.edu/3008 To unsubscribe, visit https://asterix-gerrit.ics.uci.edu/settings Gerrit-MessageType: newchange Gerrit-Change-Id: If5cbb4a133e7d62f9c9aaa05852d3b20c9aa50c3 Gerrit-PatchSet: 1 Gerrit-Project: asterixdb Gerrit-Branch: master Gerrit-Owner: Wenhai Li <lwhay...@gmail.com>