http://git-wip-us.apache.org/repos/asf/incubator-hivemall-site/blob/b8a847fa/userguide/binaryclass/kdd2010b_arow.html ---------------------------------------------------------------------- diff --git a/userguide/binaryclass/kdd2010b_arow.html b/userguide/binaryclass/kdd2010b_arow.html index f98ca28..0e677e4 100644 --- a/userguide/binaryclass/kdd2010b_arow.html +++ b/userguide/binaryclass/kdd2010b_arow.html @@ -221,13 +221,28 @@ </li> - <li class="chapter " data-level="1.3" data-path="../tips/"> + <li class="chapter " data-level="1.3" data-path="../misc/funcs.html"> - <a href="../tips/"> + <a href="../misc/funcs.html"> <b>1.3.</b> + List of Functions + + </a> + + + + </li> + + <li class="chapter " data-level="1.4" data-path="../tips/"> + + <a href="../tips/"> + + + <b>1.4.</b> + Tips for Effective Hivemall </a> @@ -237,12 +252,12 @@ <ul class="articles"> - <li class="chapter " data-level="1.3.1" data-path="../tips/addbias.html"> + <li class="chapter " data-level="1.4.1" data-path="../tips/addbias.html"> <a href="../tips/addbias.html"> - <b>1.3.1.</b> + <b>1.4.1.</b> Explicit add_bias() for better prediction @@ -252,12 +267,12 @@ </li> - <li class="chapter " data-level="1.3.2" data-path="../tips/rand_amplify.html"> + <li class="chapter " data-level="1.4.2" data-path="../tips/rand_amplify.html"> <a href="../tips/rand_amplify.html"> - <b>1.3.2.</b> + <b>1.4.2.</b> Use rand_amplify() to better prediction results @@ -267,14 +282,14 @@ </li> - <li class="chapter " data-level="1.3.3" data-path="../tips/rt_prediction.html"> + <li class="chapter " data-level="1.4.3" data-path="../tips/rt_prediction.html"> <a href="../tips/rt_prediction.html"> - <b>1.3.3.</b> + <b>1.4.3.</b> - Real-time Prediction on RDBMS + Real-time prediction on RDBMS </a> @@ -282,12 +297,12 @@ </li> - <li class="chapter " data-level="1.3.4" data-path="../tips/ensemble_learning.html"> + <li class="chapter " data-level="1.4.4" data-path="../tips/ensemble_learning.html"> <a href="../tips/ensemble_learning.html"> - <b>1.3.4.</b> + <b>1.4.4.</b> Ensemble learning for stable prediction @@ -297,12 +312,12 @@ </li> - <li class="chapter " data-level="1.3.5" data-path="../tips/mixserver.html"> + <li class="chapter " data-level="1.4.5" data-path="../tips/mixserver.html"> <a href="../tips/mixserver.html"> - <b>1.3.5.</b> + <b>1.4.5.</b> Mixing models for a better prediction convergence (MIX server) @@ -312,12 +327,12 @@ </li> - <li class="chapter " data-level="1.3.6" data-path="../tips/emr.html"> + <li class="chapter " data-level="1.4.6" data-path="../tips/emr.html"> <a href="../tips/emr.html"> - <b>1.3.6.</b> + <b>1.4.6.</b> Run Hivemall on Amazon Elastic MapReduce @@ -332,14 +347,14 @@ </li> - <li class="chapter " data-level="1.4" data-path="../tips/general_tips.html"> + <li class="chapter " data-level="1.5" data-path="../tips/general_tips.html"> <a href="../tips/general_tips.html"> - <b>1.4.</b> + <b>1.5.</b> - General Hive/Hadoop tips + General Hive/Hadoop Tips </a> @@ -348,12 +363,12 @@ <ul class="articles"> - <li class="chapter " data-level="1.4.1" data-path="../tips/rowid.html"> + <li class="chapter " data-level="1.5.1" data-path="../tips/rowid.html"> <a href="../tips/rowid.html"> - <b>1.4.1.</b> + <b>1.5.1.</b> Adding rowid for each row @@ -363,12 +378,12 @@ </li> - <li class="chapter " data-level="1.4.2" data-path="../tips/hadoop_tuning.html"> + <li class="chapter " data-level="1.5.2" data-path="../tips/hadoop_tuning.html"> <a href="../tips/hadoop_tuning.html"> - <b>1.4.2.</b> + <b>1.5.2.</b> Hadoop tuning for Hivemall @@ -383,12 +398,12 @@ </li> - <li class="chapter " data-level="1.5" data-path="../troubleshooting/"> + <li class="chapter " data-level="1.6" data-path="../troubleshooting/"> <a href="../troubleshooting/"> - <b>1.5.</b> + <b>1.6.</b> Troubleshooting @@ -399,12 +414,12 @@ <ul class="articles"> - <li class="chapter " data-level="1.5.1" data-path="../troubleshooting/oom.html"> + <li class="chapter " data-level="1.6.1" data-path="../troubleshooting/oom.html"> <a href="../troubleshooting/oom.html"> - <b>1.5.1.</b> + <b>1.6.1.</b> OutOfMemoryError in training @@ -414,14 +429,14 @@ </li> - <li class="chapter " data-level="1.5.2" data-path="../troubleshooting/mapjoin_task_error.html"> + <li class="chapter " data-level="1.6.2" data-path="../troubleshooting/mapjoin_task_error.html"> <a href="../troubleshooting/mapjoin_task_error.html"> - <b>1.5.2.</b> + <b>1.6.2.</b> - SemanticException Generate Map Join Task Error: Cannot serialize object + SemanticException generate map join task error: Cannot serialize object </a> @@ -429,12 +444,12 @@ </li> - <li class="chapter " data-level="1.5.3" data-path="../troubleshooting/asterisk.html"> + <li class="chapter " data-level="1.6.3" data-path="../troubleshooting/asterisk.html"> <a href="../troubleshooting/asterisk.html"> - <b>1.5.3.</b> + <b>1.6.3.</b> Asterisk argument for UDTF does not work @@ -444,12 +459,12 @@ </li> - <li class="chapter " data-level="1.5.4" data-path="../troubleshooting/num_mappers.html"> + <li class="chapter " data-level="1.6.4" data-path="../troubleshooting/num_mappers.html"> <a href="../troubleshooting/num_mappers.html"> - <b>1.5.4.</b> + <b>1.6.4.</b> The number of mappers is less than input splits in Hadoop 2.x @@ -459,14 +474,14 @@ </li> - <li class="chapter " data-level="1.5.5" data-path="../troubleshooting/mapjoin_classcastex.html"> + <li class="chapter " data-level="1.6.5" data-path="../troubleshooting/mapjoin_classcastex.html"> <a href="../troubleshooting/mapjoin_classcastex.html"> - <b>1.5.5.</b> + <b>1.6.5.</b> - Map-side Join causes ClassCastException on Tez + Map-side join causes ClassCastException on Tez </a> @@ -493,7 +508,7 @@ <b>2.1.</b> - List of generic Hivemall functions + List of Generic Hivemall Functions </a> @@ -508,7 +523,7 @@ <b>2.2.</b> - Efficient Top-K query processing + Efficient Top-K Query Processing </a> @@ -620,7 +635,7 @@ <b>3.5.</b> - FEATURE PAIRING + Feature Paring </a> @@ -636,7 +651,7 @@ <b>3.5.1.</b> - Polynomial Features + Polynomial features </a> @@ -656,7 +671,7 @@ <b>3.6.</b> - FEATURE TRANSFORMATION + Feature Transformation </a> @@ -672,7 +687,7 @@ <b>3.6.1.</b> - Feature Vectorization + Feature vectorization </a> @@ -745,7 +760,7 @@ <b>4.1.1.</b> - Area Under the ROC Curve + Area under the ROC curve </a> @@ -780,7 +795,7 @@ <b>4.3.</b> - Regression metrics + Regression Metrics </a> @@ -864,7 +879,7 @@ - <li class="header">Part VI - Binary classification</li> + <li class="header">Part VI - Binary Classification</li> @@ -890,7 +905,7 @@ <b>6.2.</b> - a9a tutorial + a9a Tutorial </a> @@ -936,7 +951,7 @@ <b>6.2.3.</b> - Mini-batch Gradient Descent + Mini-batch gradient descent </a> @@ -956,7 +971,7 @@ <b>6.3.</b> - News20 tutorial + News20 Tutorial </a> @@ -1052,7 +1067,7 @@ <b>6.4.</b> - KDD2010a tutorial + KDD2010a Tutorial </a> @@ -1103,7 +1118,7 @@ <b>6.5.</b> - KDD2010b tutorial + KDD2010b Tutorial </a> @@ -1154,7 +1169,7 @@ <b>6.6.</b> - Webspam tutorial + Webspam Tutorial </a> @@ -1205,7 +1220,7 @@ <b>6.7.</b> - Kaggle Titanic tutorial + Kaggle Titanic Tutorial </a> @@ -1216,7 +1231,7 @@ - <li class="header">Part VII - Multiclass classification</li> + <li class="header">Part VII - Multiclass Classification</li> @@ -1227,7 +1242,7 @@ <b>7.1.</b> - News20 Multiclass tutorial + News20 Multiclass Tutorial </a> @@ -1338,7 +1353,7 @@ <b>7.2.</b> - Iris tutorial + Iris Tutorial </a> @@ -1426,7 +1441,7 @@ <b>8.2.</b> - E2006-tfidf regression tutorial + E2006-tfidf Regression Tutorial </a> @@ -1477,7 +1492,7 @@ <b>8.3.</b> - KDDCup 2012 track 2 CTR prediction tutorial + KDDCup 2012 Track 2 CTR Prediction Tutorial </a> @@ -1523,7 +1538,7 @@ <b>8.3.3.</b> - Logistic Regression with Amplifier + Logistic Regression with amplifier </a> @@ -1581,7 +1596,7 @@ <b>9.1.1.</b> - Item-based Collaborative Filtering + Item-based collaborative filtering </a> @@ -1601,7 +1616,7 @@ <b>9.2.</b> - News20 related article recommendation Tutorial + News20 Related Article Recommendation Tutorial </a> @@ -1632,7 +1647,7 @@ <b>9.2.2.</b> - LSH/Minhash and Jaccard Similarity + LSH/MinHash and Jaccard similarity </a> @@ -1647,7 +1662,7 @@ <b>9.2.3.</b> - LSH/Minhash and Brute-Force Search + LSH/MinHash and brute-force search </a> @@ -1662,7 +1677,7 @@ <b>9.2.4.</b> - kNN search using b-Bits Minhash + kNN search using b-Bits MinHash </a> @@ -1682,7 +1697,7 @@ <b>9.3.</b> - MovieLens movie recommendation Tutorial + MovieLens Movie Recommendation Tutorial </a> @@ -1713,7 +1728,7 @@ <b>9.3.2.</b> - Item-based Collaborative Filtering + Item-based collaborative filtering </a> @@ -1758,7 +1773,7 @@ <b>9.3.5.</b> - SLIM for Fast Top-K Recommendation + SLIM for fast top-k recommendation </a> @@ -1773,7 +1788,7 @@ <b>9.3.6.</b> - 10-fold Cross Validation (Matrix Factorization) + 10-fold cross validation (Matrix Factorization) </a> @@ -1878,7 +1893,7 @@ - <li class="header">Part XII - GeoSpatial functions</li> + <li class="header">Part XII - GeoSpatial Functions</li> @@ -1963,7 +1978,7 @@ <b>13.2.1.</b> - a9a Tutorial for DataFrame + a9a tutorial for DataFrame </a> @@ -1978,7 +1993,7 @@ <b>13.2.2.</b> - a9a Tutorial for SQL + a9a tutorial for SQL </a> @@ -2014,7 +2029,7 @@ <b>13.3.1.</b> - E2006-tfidf regression Tutorial for DataFrame + E2006-tfidf regression tutorial for DataFrame </a> @@ -2029,7 +2044,7 @@ <b>13.3.2.</b> - E2006-tfidf regression Tutorial for SQL + E2006-tfidf regression tutorial for SQL </a> @@ -2065,7 +2080,7 @@ <b>13.4.1.</b> - Top-k Join processing + Top-k join processing </a> @@ -2124,25 +2139,10 @@ <li class="chapter " data-level="15.1" > - <a target="_blank" href="https://github.com/maropu/hivemall-spark"> - - - <b>15.1.</b> - - Hivemall on Apache Spark - - </a> - - - - </li> - - <li class="chapter " data-level="15.2" > - <a target="_blank" href="https://github.com/daijyc/hivemall/wiki/PigHome"> - <b>15.2.</b> + <b>15.1.</b> Hivemall on Apache Pig @@ -2316,7 +2316,7 @@ Apache Hivemall is an effort undergoing incubation at The Apache Software Founda <script> var gitbook = gitbook || []; gitbook.push(function() { - gitbook.page.hasChanged({"page":{"title":"AROW","level":"6.5.2","depth":2,"next":{"title":"Webspam tutorial","level":"6.6","depth":1,"path":"binaryclass/webspam.md","ref":"binaryclass/webspam.md","articles":[{"title":"Data pareparation","level":"6.6.1","depth":2,"path":"binaryclass/webspam_dataset.md","ref":"binaryclass/webspam_dataset.md","articles":[]},{"title":"PA1, AROW, SCW","level":"6.6.2","depth":2,"path":"binaryclass/webspam_scw.md","ref":"binaryclass/webspam_scw.md","articles":[]}]},"previous":{"title":"Data preparation","level":"6.5.1","depth":2,"path":"binaryclass/kdd2010b_dataset.md","ref":"binaryclass/kdd2010b_dataset.md","articles":[]},"dir":"ltr"},"config":{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-filename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styl es/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"h2lb":3,"header":1,"maxdepth":3,"mindepth":1,"notoc":true},"github":{"url":"https://github.com/apache/incubator-hivemall/"},"splitter":{},"search":{},"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md","hline":"true"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.apache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"htt ps://github.com/apache/incubator-hivemall/tree/master/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"showLevel":true},"anchorjs":{"selector":"h1,h2,h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"sidebar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"binaryclass/kdd2010b_arow.md","mtime":"2017-11-02T05:41:05.000Z","type":"markdown"},"gitbo ok":{"version":"3.2.3","time":"2018-03-13T16:05:28.906Z"},"basePath":"..","book":{"language":""}}); + gitbook.page.hasChanged({"page":{"title":"AROW","level":"6.5.2","depth":2,"next":{"title":"Webspam Tutorial","level":"6.6","depth":1,"path":"binaryclass/webspam.md","ref":"binaryclass/webspam.md","articles":[{"title":"Data pareparation","level":"6.6.1","depth":2,"path":"binaryclass/webspam_dataset.md","ref":"binaryclass/webspam_dataset.md","articles":[]},{"title":"PA1, AROW, SCW","level":"6.6.2","depth":2,"path":"binaryclass/webspam_scw.md","ref":"binaryclass/webspam_scw.md","articles":[]}]},"previous":{"title":"Data preparation","level":"6.5.1","depth":2,"path":"binaryclass/kdd2010b_dataset.md","ref":"binaryclass/kdd2010b_dataset.md","articles":[]},"dir":"ltr"},"config":{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-filename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styl es/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"h2lb":3,"header":1,"maxdepth":3,"mindepth":1,"notoc":true},"github":{"url":"https://github.com/apache/incubator-hivemall/"},"splitter":{},"search":{},"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md","hline":"true"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.apache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"htt ps://github.com/apache/incubator-hivemall/tree/master/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"showLevel":true},"anchorjs":{"selector":"h1,h2,h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"sidebar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"binaryclass/kdd2010b_arow.md","mtime":"2017-11-02T05:41:05.000Z","type":"markdown"},"gitbo ok":{"version":"3.2.3","time":"2018-04-16T14:16:24.937Z"},"basePath":"..","book":{"language":""}}); }); </script> </div>
http://git-wip-us.apache.org/repos/asf/incubator-hivemall-site/blob/b8a847fa/userguide/binaryclass/kdd2010b_dataset.html ---------------------------------------------------------------------- diff --git a/userguide/binaryclass/kdd2010b_dataset.html b/userguide/binaryclass/kdd2010b_dataset.html index b50413f..1d749b5 100644 --- a/userguide/binaryclass/kdd2010b_dataset.html +++ b/userguide/binaryclass/kdd2010b_dataset.html @@ -221,13 +221,28 @@ </li> - <li class="chapter " data-level="1.3" data-path="../tips/"> + <li class="chapter " data-level="1.3" data-path="../misc/funcs.html"> - <a href="../tips/"> + <a href="../misc/funcs.html"> <b>1.3.</b> + List of Functions + + </a> + + + + </li> + + <li class="chapter " data-level="1.4" data-path="../tips/"> + + <a href="../tips/"> + + + <b>1.4.</b> + Tips for Effective Hivemall </a> @@ -237,12 +252,12 @@ <ul class="articles"> - <li class="chapter " data-level="1.3.1" data-path="../tips/addbias.html"> + <li class="chapter " data-level="1.4.1" data-path="../tips/addbias.html"> <a href="../tips/addbias.html"> - <b>1.3.1.</b> + <b>1.4.1.</b> Explicit add_bias() for better prediction @@ -252,12 +267,12 @@ </li> - <li class="chapter " data-level="1.3.2" data-path="../tips/rand_amplify.html"> + <li class="chapter " data-level="1.4.2" data-path="../tips/rand_amplify.html"> <a href="../tips/rand_amplify.html"> - <b>1.3.2.</b> + <b>1.4.2.</b> Use rand_amplify() to better prediction results @@ -267,14 +282,14 @@ </li> - <li class="chapter " data-level="1.3.3" data-path="../tips/rt_prediction.html"> + <li class="chapter " data-level="1.4.3" data-path="../tips/rt_prediction.html"> <a href="../tips/rt_prediction.html"> - <b>1.3.3.</b> + <b>1.4.3.</b> - Real-time Prediction on RDBMS + Real-time prediction on RDBMS </a> @@ -282,12 +297,12 @@ </li> - <li class="chapter " data-level="1.3.4" data-path="../tips/ensemble_learning.html"> + <li class="chapter " data-level="1.4.4" data-path="../tips/ensemble_learning.html"> <a href="../tips/ensemble_learning.html"> - <b>1.3.4.</b> + <b>1.4.4.</b> Ensemble learning for stable prediction @@ -297,12 +312,12 @@ </li> - <li class="chapter " data-level="1.3.5" data-path="../tips/mixserver.html"> + <li class="chapter " data-level="1.4.5" data-path="../tips/mixserver.html"> <a href="../tips/mixserver.html"> - <b>1.3.5.</b> + <b>1.4.5.</b> Mixing models for a better prediction convergence (MIX server) @@ -312,12 +327,12 @@ </li> - <li class="chapter " data-level="1.3.6" data-path="../tips/emr.html"> + <li class="chapter " data-level="1.4.6" data-path="../tips/emr.html"> <a href="../tips/emr.html"> - <b>1.3.6.</b> + <b>1.4.6.</b> Run Hivemall on Amazon Elastic MapReduce @@ -332,14 +347,14 @@ </li> - <li class="chapter " data-level="1.4" data-path="../tips/general_tips.html"> + <li class="chapter " data-level="1.5" data-path="../tips/general_tips.html"> <a href="../tips/general_tips.html"> - <b>1.4.</b> + <b>1.5.</b> - General Hive/Hadoop tips + General Hive/Hadoop Tips </a> @@ -348,12 +363,12 @@ <ul class="articles"> - <li class="chapter " data-level="1.4.1" data-path="../tips/rowid.html"> + <li class="chapter " data-level="1.5.1" data-path="../tips/rowid.html"> <a href="../tips/rowid.html"> - <b>1.4.1.</b> + <b>1.5.1.</b> Adding rowid for each row @@ -363,12 +378,12 @@ </li> - <li class="chapter " data-level="1.4.2" data-path="../tips/hadoop_tuning.html"> + <li class="chapter " data-level="1.5.2" data-path="../tips/hadoop_tuning.html"> <a href="../tips/hadoop_tuning.html"> - <b>1.4.2.</b> + <b>1.5.2.</b> Hadoop tuning for Hivemall @@ -383,12 +398,12 @@ </li> - <li class="chapter " data-level="1.5" data-path="../troubleshooting/"> + <li class="chapter " data-level="1.6" data-path="../troubleshooting/"> <a href="../troubleshooting/"> - <b>1.5.</b> + <b>1.6.</b> Troubleshooting @@ -399,12 +414,12 @@ <ul class="articles"> - <li class="chapter " data-level="1.5.1" data-path="../troubleshooting/oom.html"> + <li class="chapter " data-level="1.6.1" data-path="../troubleshooting/oom.html"> <a href="../troubleshooting/oom.html"> - <b>1.5.1.</b> + <b>1.6.1.</b> OutOfMemoryError in training @@ -414,14 +429,14 @@ </li> - <li class="chapter " data-level="1.5.2" data-path="../troubleshooting/mapjoin_task_error.html"> + <li class="chapter " data-level="1.6.2" data-path="../troubleshooting/mapjoin_task_error.html"> <a href="../troubleshooting/mapjoin_task_error.html"> - <b>1.5.2.</b> + <b>1.6.2.</b> - SemanticException Generate Map Join Task Error: Cannot serialize object + SemanticException generate map join task error: Cannot serialize object </a> @@ -429,12 +444,12 @@ </li> - <li class="chapter " data-level="1.5.3" data-path="../troubleshooting/asterisk.html"> + <li class="chapter " data-level="1.6.3" data-path="../troubleshooting/asterisk.html"> <a href="../troubleshooting/asterisk.html"> - <b>1.5.3.</b> + <b>1.6.3.</b> Asterisk argument for UDTF does not work @@ -444,12 +459,12 @@ </li> - <li class="chapter " data-level="1.5.4" data-path="../troubleshooting/num_mappers.html"> + <li class="chapter " data-level="1.6.4" data-path="../troubleshooting/num_mappers.html"> <a href="../troubleshooting/num_mappers.html"> - <b>1.5.4.</b> + <b>1.6.4.</b> The number of mappers is less than input splits in Hadoop 2.x @@ -459,14 +474,14 @@ </li> - <li class="chapter " data-level="1.5.5" data-path="../troubleshooting/mapjoin_classcastex.html"> + <li class="chapter " data-level="1.6.5" data-path="../troubleshooting/mapjoin_classcastex.html"> <a href="../troubleshooting/mapjoin_classcastex.html"> - <b>1.5.5.</b> + <b>1.6.5.</b> - Map-side Join causes ClassCastException on Tez + Map-side join causes ClassCastException on Tez </a> @@ -493,7 +508,7 @@ <b>2.1.</b> - List of generic Hivemall functions + List of Generic Hivemall Functions </a> @@ -508,7 +523,7 @@ <b>2.2.</b> - Efficient Top-K query processing + Efficient Top-K Query Processing </a> @@ -620,7 +635,7 @@ <b>3.5.</b> - FEATURE PAIRING + Feature Paring </a> @@ -636,7 +651,7 @@ <b>3.5.1.</b> - Polynomial Features + Polynomial features </a> @@ -656,7 +671,7 @@ <b>3.6.</b> - FEATURE TRANSFORMATION + Feature Transformation </a> @@ -672,7 +687,7 @@ <b>3.6.1.</b> - Feature Vectorization + Feature vectorization </a> @@ -745,7 +760,7 @@ <b>4.1.1.</b> - Area Under the ROC Curve + Area under the ROC curve </a> @@ -780,7 +795,7 @@ <b>4.3.</b> - Regression metrics + Regression Metrics </a> @@ -864,7 +879,7 @@ - <li class="header">Part VI - Binary classification</li> + <li class="header">Part VI - Binary Classification</li> @@ -890,7 +905,7 @@ <b>6.2.</b> - a9a tutorial + a9a Tutorial </a> @@ -936,7 +951,7 @@ <b>6.2.3.</b> - Mini-batch Gradient Descent + Mini-batch gradient descent </a> @@ -956,7 +971,7 @@ <b>6.3.</b> - News20 tutorial + News20 Tutorial </a> @@ -1052,7 +1067,7 @@ <b>6.4.</b> - KDD2010a tutorial + KDD2010a Tutorial </a> @@ -1103,7 +1118,7 @@ <b>6.5.</b> - KDD2010b tutorial + KDD2010b Tutorial </a> @@ -1154,7 +1169,7 @@ <b>6.6.</b> - Webspam tutorial + Webspam Tutorial </a> @@ -1205,7 +1220,7 @@ <b>6.7.</b> - Kaggle Titanic tutorial + Kaggle Titanic Tutorial </a> @@ -1216,7 +1231,7 @@ - <li class="header">Part VII - Multiclass classification</li> + <li class="header">Part VII - Multiclass Classification</li> @@ -1227,7 +1242,7 @@ <b>7.1.</b> - News20 Multiclass tutorial + News20 Multiclass Tutorial </a> @@ -1338,7 +1353,7 @@ <b>7.2.</b> - Iris tutorial + Iris Tutorial </a> @@ -1426,7 +1441,7 @@ <b>8.2.</b> - E2006-tfidf regression tutorial + E2006-tfidf Regression Tutorial </a> @@ -1477,7 +1492,7 @@ <b>8.3.</b> - KDDCup 2012 track 2 CTR prediction tutorial + KDDCup 2012 Track 2 CTR Prediction Tutorial </a> @@ -1523,7 +1538,7 @@ <b>8.3.3.</b> - Logistic Regression with Amplifier + Logistic Regression with amplifier </a> @@ -1581,7 +1596,7 @@ <b>9.1.1.</b> - Item-based Collaborative Filtering + Item-based collaborative filtering </a> @@ -1601,7 +1616,7 @@ <b>9.2.</b> - News20 related article recommendation Tutorial + News20 Related Article Recommendation Tutorial </a> @@ -1632,7 +1647,7 @@ <b>9.2.2.</b> - LSH/Minhash and Jaccard Similarity + LSH/MinHash and Jaccard similarity </a> @@ -1647,7 +1662,7 @@ <b>9.2.3.</b> - LSH/Minhash and Brute-Force Search + LSH/MinHash and brute-force search </a> @@ -1662,7 +1677,7 @@ <b>9.2.4.</b> - kNN search using b-Bits Minhash + kNN search using b-Bits MinHash </a> @@ -1682,7 +1697,7 @@ <b>9.3.</b> - MovieLens movie recommendation Tutorial + MovieLens Movie Recommendation Tutorial </a> @@ -1713,7 +1728,7 @@ <b>9.3.2.</b> - Item-based Collaborative Filtering + Item-based collaborative filtering </a> @@ -1758,7 +1773,7 @@ <b>9.3.5.</b> - SLIM for Fast Top-K Recommendation + SLIM for fast top-k recommendation </a> @@ -1773,7 +1788,7 @@ <b>9.3.6.</b> - 10-fold Cross Validation (Matrix Factorization) + 10-fold cross validation (Matrix Factorization) </a> @@ -1878,7 +1893,7 @@ - <li class="header">Part XII - GeoSpatial functions</li> + <li class="header">Part XII - GeoSpatial Functions</li> @@ -1963,7 +1978,7 @@ <b>13.2.1.</b> - a9a Tutorial for DataFrame + a9a tutorial for DataFrame </a> @@ -1978,7 +1993,7 @@ <b>13.2.2.</b> - a9a Tutorial for SQL + a9a tutorial for SQL </a> @@ -2014,7 +2029,7 @@ <b>13.3.1.</b> - E2006-tfidf regression Tutorial for DataFrame + E2006-tfidf regression tutorial for DataFrame </a> @@ -2029,7 +2044,7 @@ <b>13.3.2.</b> - E2006-tfidf regression Tutorial for SQL + E2006-tfidf regression tutorial for SQL </a> @@ -2065,7 +2080,7 @@ <b>13.4.1.</b> - Top-k Join processing + Top-k join processing </a> @@ -2124,25 +2139,10 @@ <li class="chapter " data-level="15.1" > - <a target="_blank" href="https://github.com/maropu/hivemall-spark"> - - - <b>15.1.</b> - - Hivemall on Apache Spark - - </a> - - - - </li> - - <li class="chapter " data-level="15.2" > - <a target="_blank" href="https://github.com/daijyc/hivemall/wiki/PigHome"> - <b>15.2.</b> + <b>15.1.</b> Hivemall on Apache Pig @@ -2324,7 +2324,7 @@ Apache Hivemall is an effort undergoing incubation at The Apache Software Founda <script> var gitbook = gitbook || []; gitbook.push(function() { - gitbook.page.hasChanged({"page":{"title":"Data preparation","level":"6.5.1","depth":2,"next":{"title":"AROW","level":"6.5.2","depth":2,"path":"binaryclass/kdd2010b_arow.md","ref":"binaryclass/kdd2010b_arow.md","articles":[]},"previous":{"title":"KDD2010b tutorial","level":"6.5","depth":1,"path":"binaryclass/kdd2010b.md","ref":"binaryclass/kdd2010b.md","articles":[{"title":"Data preparation","level":"6.5.1","depth":2,"path":"binaryclass/kdd2010b_dataset.md","ref":"binaryclass/kdd2010b_dataset.md","articles":[]},{"title":"AROW","level":"6.5.2","depth":2,"path":"binaryclass/kdd2010b_arow.md","ref":"binaryclass/kdd2010b_arow.md","articles":[]}]},"dir":"ltr"},"config":{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-filename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub. css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"h2lb":3,"header":1,"maxdepth":3,"mindepth":1,"notoc":true},"github":{"url":"https://github.com/apache/incubator-hivemall/"},"splitter":{},"search":{},"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md","hline":"true"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.apache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"https://git hub.com/apache/incubator-hivemall/tree/master/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"showLevel":true},"anchorjs":{"selector":"h1,h2,h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"sidebar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"binaryclass/kdd2010b_dataset.md","mtime":"2017-11-02T05:41:05.000Z","type":"markdown"},"gitbook":{ "version":"3.2.3","time":"2018-03-13T16:05:28.906Z"},"basePath":"..","book":{"language":""}}); + gitbook.page.hasChanged({"page":{"title":"Data preparation","level":"6.5.1","depth":2,"next":{"title":"AROW","level":"6.5.2","depth":2,"path":"binaryclass/kdd2010b_arow.md","ref":"binaryclass/kdd2010b_arow.md","articles":[]},"previous":{"title":"KDD2010b Tutorial","level":"6.5","depth":1,"path":"binaryclass/kdd2010b.md","ref":"binaryclass/kdd2010b.md","articles":[{"title":"Data preparation","level":"6.5.1","depth":2,"path":"binaryclass/kdd2010b_dataset.md","ref":"binaryclass/kdd2010b_dataset.md","articles":[]},{"title":"AROW","level":"6.5.2","depth":2,"path":"binaryclass/kdd2010b_arow.md","ref":"binaryclass/kdd2010b_arow.md","articles":[]}]},"dir":"ltr"},"config":{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-filename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub. css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"h2lb":3,"header":1,"maxdepth":3,"mindepth":1,"notoc":true},"github":{"url":"https://github.com/apache/incubator-hivemall/"},"splitter":{},"search":{},"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md","hline":"true"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.apache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"https://git hub.com/apache/incubator-hivemall/tree/master/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"showLevel":true},"anchorjs":{"selector":"h1,h2,h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"sidebar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"binaryclass/kdd2010b_dataset.md","mtime":"2017-11-02T05:41:05.000Z","type":"markdown"},"gitbook":{ "version":"3.2.3","time":"2018-04-16T14:16:24.937Z"},"basePath":"..","book":{"language":""}}); }); </script> </div> http://git-wip-us.apache.org/repos/asf/incubator-hivemall-site/blob/b8a847fa/userguide/binaryclass/news20.html ---------------------------------------------------------------------- diff --git a/userguide/binaryclass/news20.html b/userguide/binaryclass/news20.html index cf85641..e113f10 100644 --- a/userguide/binaryclass/news20.html +++ b/userguide/binaryclass/news20.html @@ -4,7 +4,7 @@ <head> <meta charset="UTF-8"> <meta content="text/html; charset=utf-8" http-equiv="Content-Type"> - <title>News20 tutorial · Hivemall User Manual</title> + <title>News20 Tutorial · Hivemall User Manual</title> <meta http-equiv="X-UA-Compatible" content="IE=edge" /> <meta name="description" content=""> <meta name="generator" content="GitBook 3.2.3"> @@ -221,13 +221,28 @@ </li> - <li class="chapter " data-level="1.3" data-path="../tips/"> + <li class="chapter " data-level="1.3" data-path="../misc/funcs.html"> - <a href="../tips/"> + <a href="../misc/funcs.html"> <b>1.3.</b> + List of Functions + + </a> + + + + </li> + + <li class="chapter " data-level="1.4" data-path="../tips/"> + + <a href="../tips/"> + + + <b>1.4.</b> + Tips for Effective Hivemall </a> @@ -237,12 +252,12 @@ <ul class="articles"> - <li class="chapter " data-level="1.3.1" data-path="../tips/addbias.html"> + <li class="chapter " data-level="1.4.1" data-path="../tips/addbias.html"> <a href="../tips/addbias.html"> - <b>1.3.1.</b> + <b>1.4.1.</b> Explicit add_bias() for better prediction @@ -252,12 +267,12 @@ </li> - <li class="chapter " data-level="1.3.2" data-path="../tips/rand_amplify.html"> + <li class="chapter " data-level="1.4.2" data-path="../tips/rand_amplify.html"> <a href="../tips/rand_amplify.html"> - <b>1.3.2.</b> + <b>1.4.2.</b> Use rand_amplify() to better prediction results @@ -267,14 +282,14 @@ </li> - <li class="chapter " data-level="1.3.3" data-path="../tips/rt_prediction.html"> + <li class="chapter " data-level="1.4.3" data-path="../tips/rt_prediction.html"> <a href="../tips/rt_prediction.html"> - <b>1.3.3.</b> + <b>1.4.3.</b> - Real-time Prediction on RDBMS + Real-time prediction on RDBMS </a> @@ -282,12 +297,12 @@ </li> - <li class="chapter " data-level="1.3.4" data-path="../tips/ensemble_learning.html"> + <li class="chapter " data-level="1.4.4" data-path="../tips/ensemble_learning.html"> <a href="../tips/ensemble_learning.html"> - <b>1.3.4.</b> + <b>1.4.4.</b> Ensemble learning for stable prediction @@ -297,12 +312,12 @@ </li> - <li class="chapter " data-level="1.3.5" data-path="../tips/mixserver.html"> + <li class="chapter " data-level="1.4.5" data-path="../tips/mixserver.html"> <a href="../tips/mixserver.html"> - <b>1.3.5.</b> + <b>1.4.5.</b> Mixing models for a better prediction convergence (MIX server) @@ -312,12 +327,12 @@ </li> - <li class="chapter " data-level="1.3.6" data-path="../tips/emr.html"> + <li class="chapter " data-level="1.4.6" data-path="../tips/emr.html"> <a href="../tips/emr.html"> - <b>1.3.6.</b> + <b>1.4.6.</b> Run Hivemall on Amazon Elastic MapReduce @@ -332,14 +347,14 @@ </li> - <li class="chapter " data-level="1.4" data-path="../tips/general_tips.html"> + <li class="chapter " data-level="1.5" data-path="../tips/general_tips.html"> <a href="../tips/general_tips.html"> - <b>1.4.</b> + <b>1.5.</b> - General Hive/Hadoop tips + General Hive/Hadoop Tips </a> @@ -348,12 +363,12 @@ <ul class="articles"> - <li class="chapter " data-level="1.4.1" data-path="../tips/rowid.html"> + <li class="chapter " data-level="1.5.1" data-path="../tips/rowid.html"> <a href="../tips/rowid.html"> - <b>1.4.1.</b> + <b>1.5.1.</b> Adding rowid for each row @@ -363,12 +378,12 @@ </li> - <li class="chapter " data-level="1.4.2" data-path="../tips/hadoop_tuning.html"> + <li class="chapter " data-level="1.5.2" data-path="../tips/hadoop_tuning.html"> <a href="../tips/hadoop_tuning.html"> - <b>1.4.2.</b> + <b>1.5.2.</b> Hadoop tuning for Hivemall @@ -383,12 +398,12 @@ </li> - <li class="chapter " data-level="1.5" data-path="../troubleshooting/"> + <li class="chapter " data-level="1.6" data-path="../troubleshooting/"> <a href="../troubleshooting/"> - <b>1.5.</b> + <b>1.6.</b> Troubleshooting @@ -399,12 +414,12 @@ <ul class="articles"> - <li class="chapter " data-level="1.5.1" data-path="../troubleshooting/oom.html"> + <li class="chapter " data-level="1.6.1" data-path="../troubleshooting/oom.html"> <a href="../troubleshooting/oom.html"> - <b>1.5.1.</b> + <b>1.6.1.</b> OutOfMemoryError in training @@ -414,14 +429,14 @@ </li> - <li class="chapter " data-level="1.5.2" data-path="../troubleshooting/mapjoin_task_error.html"> + <li class="chapter " data-level="1.6.2" data-path="../troubleshooting/mapjoin_task_error.html"> <a href="../troubleshooting/mapjoin_task_error.html"> - <b>1.5.2.</b> + <b>1.6.2.</b> - SemanticException Generate Map Join Task Error: Cannot serialize object + SemanticException generate map join task error: Cannot serialize object </a> @@ -429,12 +444,12 @@ </li> - <li class="chapter " data-level="1.5.3" data-path="../troubleshooting/asterisk.html"> + <li class="chapter " data-level="1.6.3" data-path="../troubleshooting/asterisk.html"> <a href="../troubleshooting/asterisk.html"> - <b>1.5.3.</b> + <b>1.6.3.</b> Asterisk argument for UDTF does not work @@ -444,12 +459,12 @@ </li> - <li class="chapter " data-level="1.5.4" data-path="../troubleshooting/num_mappers.html"> + <li class="chapter " data-level="1.6.4" data-path="../troubleshooting/num_mappers.html"> <a href="../troubleshooting/num_mappers.html"> - <b>1.5.4.</b> + <b>1.6.4.</b> The number of mappers is less than input splits in Hadoop 2.x @@ -459,14 +474,14 @@ </li> - <li class="chapter " data-level="1.5.5" data-path="../troubleshooting/mapjoin_classcastex.html"> + <li class="chapter " data-level="1.6.5" data-path="../troubleshooting/mapjoin_classcastex.html"> <a href="../troubleshooting/mapjoin_classcastex.html"> - <b>1.5.5.</b> + <b>1.6.5.</b> - Map-side Join causes ClassCastException on Tez + Map-side join causes ClassCastException on Tez </a> @@ -493,7 +508,7 @@ <b>2.1.</b> - List of generic Hivemall functions + List of Generic Hivemall Functions </a> @@ -508,7 +523,7 @@ <b>2.2.</b> - Efficient Top-K query processing + Efficient Top-K Query Processing </a> @@ -620,7 +635,7 @@ <b>3.5.</b> - FEATURE PAIRING + Feature Paring </a> @@ -636,7 +651,7 @@ <b>3.5.1.</b> - Polynomial Features + Polynomial features </a> @@ -656,7 +671,7 @@ <b>3.6.</b> - FEATURE TRANSFORMATION + Feature Transformation </a> @@ -672,7 +687,7 @@ <b>3.6.1.</b> - Feature Vectorization + Feature vectorization </a> @@ -745,7 +760,7 @@ <b>4.1.1.</b> - Area Under the ROC Curve + Area under the ROC curve </a> @@ -780,7 +795,7 @@ <b>4.3.</b> - Regression metrics + Regression Metrics </a> @@ -864,7 +879,7 @@ - <li class="header">Part VI - Binary classification</li> + <li class="header">Part VI - Binary Classification</li> @@ -890,7 +905,7 @@ <b>6.2.</b> - a9a tutorial + a9a Tutorial </a> @@ -936,7 +951,7 @@ <b>6.2.3.</b> - Mini-batch Gradient Descent + Mini-batch gradient descent </a> @@ -956,7 +971,7 @@ <b>6.3.</b> - News20 tutorial + News20 Tutorial </a> @@ -1052,7 +1067,7 @@ <b>6.4.</b> - KDD2010a tutorial + KDD2010a Tutorial </a> @@ -1103,7 +1118,7 @@ <b>6.5.</b> - KDD2010b tutorial + KDD2010b Tutorial </a> @@ -1154,7 +1169,7 @@ <b>6.6.</b> - Webspam tutorial + Webspam Tutorial </a> @@ -1205,7 +1220,7 @@ <b>6.7.</b> - Kaggle Titanic tutorial + Kaggle Titanic Tutorial </a> @@ -1216,7 +1231,7 @@ - <li class="header">Part VII - Multiclass classification</li> + <li class="header">Part VII - Multiclass Classification</li> @@ -1227,7 +1242,7 @@ <b>7.1.</b> - News20 Multiclass tutorial + News20 Multiclass Tutorial </a> @@ -1338,7 +1353,7 @@ <b>7.2.</b> - Iris tutorial + Iris Tutorial </a> @@ -1426,7 +1441,7 @@ <b>8.2.</b> - E2006-tfidf regression tutorial + E2006-tfidf Regression Tutorial </a> @@ -1477,7 +1492,7 @@ <b>8.3.</b> - KDDCup 2012 track 2 CTR prediction tutorial + KDDCup 2012 Track 2 CTR Prediction Tutorial </a> @@ -1523,7 +1538,7 @@ <b>8.3.3.</b> - Logistic Regression with Amplifier + Logistic Regression with amplifier </a> @@ -1581,7 +1596,7 @@ <b>9.1.1.</b> - Item-based Collaborative Filtering + Item-based collaborative filtering </a> @@ -1601,7 +1616,7 @@ <b>9.2.</b> - News20 related article recommendation Tutorial + News20 Related Article Recommendation Tutorial </a> @@ -1632,7 +1647,7 @@ <b>9.2.2.</b> - LSH/Minhash and Jaccard Similarity + LSH/MinHash and Jaccard similarity </a> @@ -1647,7 +1662,7 @@ <b>9.2.3.</b> - LSH/Minhash and Brute-Force Search + LSH/MinHash and brute-force search </a> @@ -1662,7 +1677,7 @@ <b>9.2.4.</b> - kNN search using b-Bits Minhash + kNN search using b-Bits MinHash </a> @@ -1682,7 +1697,7 @@ <b>9.3.</b> - MovieLens movie recommendation Tutorial + MovieLens Movie Recommendation Tutorial </a> @@ -1713,7 +1728,7 @@ <b>9.3.2.</b> - Item-based Collaborative Filtering + Item-based collaborative filtering </a> @@ -1758,7 +1773,7 @@ <b>9.3.5.</b> - SLIM for Fast Top-K Recommendation + SLIM for fast top-k recommendation </a> @@ -1773,7 +1788,7 @@ <b>9.3.6.</b> - 10-fold Cross Validation (Matrix Factorization) + 10-fold cross validation (Matrix Factorization) </a> @@ -1878,7 +1893,7 @@ - <li class="header">Part XII - GeoSpatial functions</li> + <li class="header">Part XII - GeoSpatial Functions</li> @@ -1963,7 +1978,7 @@ <b>13.2.1.</b> - a9a Tutorial for DataFrame + a9a tutorial for DataFrame </a> @@ -1978,7 +1993,7 @@ <b>13.2.2.</b> - a9a Tutorial for SQL + a9a tutorial for SQL </a> @@ -2014,7 +2029,7 @@ <b>13.3.1.</b> - E2006-tfidf regression Tutorial for DataFrame + E2006-tfidf regression tutorial for DataFrame </a> @@ -2029,7 +2044,7 @@ <b>13.3.2.</b> - E2006-tfidf regression Tutorial for SQL + E2006-tfidf regression tutorial for SQL </a> @@ -2065,7 +2080,7 @@ <b>13.4.1.</b> - Top-k Join processing + Top-k join processing </a> @@ -2124,25 +2139,10 @@ <li class="chapter " data-level="15.1" > - <a target="_blank" href="https://github.com/maropu/hivemall-spark"> - - - <b>15.1.</b> - - Hivemall on Apache Spark - - </a> - - - - </li> - - <li class="chapter " data-level="15.2" > - <a target="_blank" href="https://github.com/daijyc/hivemall/wiki/PigHome"> - <b>15.2.</b> + <b>15.1.</b> Hivemall on Apache Pig @@ -2182,7 +2182,7 @@ <!-- Title --> <h1> <i class="fa fa-circle-o-notch fa-spin"></i> - <a href=".." >News20 tutorial</a> + <a href=".." >News20 Tutorial</a> </h1> </div> @@ -2270,7 +2270,7 @@ Apache Hivemall is an effort undergoing incubation at The Apache Software Founda <script> var gitbook = gitbook || []; gitbook.push(function() { - gitbook.page.hasChanged({"page":{"title":"News20 tutorial","level":"6.3","depth":1,"next":{"title":"Data preparation","level":"6.3.1","depth":2,"path":"binaryclass/news20_dataset.md","ref":"binaryclass/news20_dataset.md","articles":[]},"previous":{"title":"Mini-batch Gradient Descent","level":"6.2.3","depth":2,"path":"binaryclass/a9a_minibatch.md","ref":"binaryclass/a9a_minibatch.md","articles":[]},"dir":"ltr"},"config":{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-filename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"h2lb":3,"header":1,"maxdepth":3,"mindepth":1,"notoc":true},"github":{"url":"https://github.com/apache/incuba tor-hivemall/"},"splitter":{},"search":{},"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md","hline":"true"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.apache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"https://github.com/apache/incubator-hivemall/tree/master/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"}," showLevel":true},"anchorjs":{"selector":"h1,h2,h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"sidebar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"binaryclass/news20.md","mtime":"2017-11-02T05:41:05.000Z","type":"markdown"},"gitbook":{"version":"3.2.3","time":"2018-03-13T16:05:28.906Z"},"basePath":"..","book":{"language":""}}); + gitbook.page.hasChanged({"page":{"title":"News20 Tutorial","level":"6.3","depth":1,"next":{"title":"Data preparation","level":"6.3.1","depth":2,"path":"binaryclass/news20_dataset.md","ref":"binaryclass/news20_dataset.md","articles":[]},"previous":{"title":"Mini-batch gradient descent","level":"6.2.3","depth":2,"path":"binaryclass/a9a_minibatch.md","ref":"binaryclass/a9a_minibatch.md","articles":[]},"dir":"ltr"},"config":{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-filename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"h2lb":3,"header":1,"maxdepth":3,"mindepth":1,"notoc":true},"github":{"url":"https://github.com/apache/incuba tor-hivemall/"},"splitter":{},"search":{},"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md","hline":"true"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.apache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"https://github.com/apache/incubator-hivemall/tree/master/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"}," showLevel":true},"anchorjs":{"selector":"h1,h2,h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"sidebar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"binaryclass/news20.md","mtime":"2017-11-02T05:41:05.000Z","type":"markdown"},"gitbook":{"version":"3.2.3","time":"2018-04-16T14:16:24.937Z"},"basePath":"..","book":{"language":""}}); }); </script> </div>