Fixed links in the user guide
Project: http://git-wip-us.apache.org/repos/asf/incubator-hivemall-site/repo Commit: http://git-wip-us.apache.org/repos/asf/incubator-hivemall-site/commit/68241a08 Tree: http://git-wip-us.apache.org/repos/asf/incubator-hivemall-site/tree/68241a08 Diff: http://git-wip-us.apache.org/repos/asf/incubator-hivemall-site/diff/68241a08 Branch: refs/heads/asf-site Commit: 68241a08770b72737540bd710624048e5e6903ea Parents: 542ae78 Author: myui <[email protected]> Authored: Thu Nov 17 21:18:30 2016 +0900 Committer: myui <[email protected]> Committed: Thu Nov 17 21:18:30 2016 +0900 ---------------------------------------------------------------------- userguide/FOOTER.md | 19 + userguide/anomaly/lof.html | 59 +- userguide/binaryclass/a9a.html | 37 +- userguide/binaryclass/a9a_dataset.html | 37 +- userguide/binaryclass/a9a_lr.html | 63 +- userguide/binaryclass/a9a_minibatch.html | 43 +- userguide/binaryclass/kdd2010a.html | 37 +- userguide/binaryclass/kdd2010a_dataset.html | 46 +- userguide/binaryclass/kdd2010a_scw.html | 37 +- userguide/binaryclass/kdd2010b.html | 37 +- userguide/binaryclass/kdd2010b_arow.html | 37 +- userguide/binaryclass/kdd2010b_dataset.html | 46 +- userguide/binaryclass/news20.html | 37 +- userguide/binaryclass/news20_adagrad.html | 37 +- userguide/binaryclass/news20_dataset.html | 37 +- userguide/binaryclass/news20_pa.html | 37 +- userguide/binaryclass/news20_scw.html | 37 +- userguide/binaryclass/titanic_rf.html | 2081 ++++++++++++++++++ userguide/binaryclass/webspam.html | 37 +- userguide/binaryclass/webspam_dataset.html | 37 +- userguide/binaryclass/webspam_scw.html | 43 +- userguide/eval/datagen.html | 37 +- userguide/eval/lr_datagen.html | 53 +- userguide/eval/stat_eval.html | 57 +- userguide/ft_engineering/ft_trans.html | 37 +- userguide/ft_engineering/hashing.html | 44 +- userguide/ft_engineering/quantify.html | 37 +- userguide/ft_engineering/scaling.html | 37 +- userguide/ft_engineering/tfidf.html | 37 +- userguide/ft_engineering/vectorizer.html | 37 +- userguide/getting_started/index.html | 37 +- userguide/getting_started/input-format.html | 51 +- userguide/getting_started/installation.html | 37 +- .../getting_started/permanent-functions.html | 38 +- userguide/index.html | 37 +- userguide/misc/generic_funcs.html | 268 ++- userguide/misc/tokenizer.html | 37 +- userguide/misc/topk.html | 41 +- userguide/multiclass/iris.html | 37 +- userguide/multiclass/iris_dataset.html | 39 +- userguide/multiclass/iris_randomforest.html | 42 +- userguide/multiclass/iris_scw.html | 41 +- userguide/multiclass/news20.html | 39 +- userguide/multiclass/news20_dataset.html | 37 +- userguide/multiclass/news20_ensemble.html | 37 +- .../multiclass/news20_one-vs-the-rest.html | 37 +- .../news20_one-vs-the-rest_dataset.html | 37 +- userguide/multiclass/news20_pa.html | 37 +- userguide/multiclass/news20_scw.html | 37 +- userguide/recommend/cf.html | 37 +- userguide/recommend/item_based_cf.html | 41 +- userguide/recommend/movielens.html | 37 +- userguide/recommend/movielens_cv.html | 37 +- userguide/recommend/movielens_dataset.html | 37 +- userguide/recommend/movielens_fm.html | 44 +- userguide/recommend/movielens_mf.html | 80 +- userguide/recommend/news20.html | 37 +- userguide/recommend/news20_bbit_minhash.html | 37 +- userguide/recommend/news20_jaccard.html | 37 +- userguide/recommend/news20_knn.html | 39 +- userguide/regression/e2006.html | 37 +- userguide/regression/e2006_arow.html | 41 +- userguide/regression/e2006_dataset.html | 37 +- userguide/regression/kddcup12tr2.html | 37 +- userguide/regression/kddcup12tr2_adagrad.html | 41 +- userguide/regression/kddcup12tr2_dataset.html | 39 +- userguide/regression/kddcup12tr2_lr.html | 37 +- .../regression/kddcup12tr2_lr_amplify.html | 43 +- userguide/resources/images/kddtrack2tables.png | Bin 0 -> 30323 bytes userguide/search_index.json | 2 +- userguide/sitemap.xml | 1 + userguide/tips/addbias.html | 39 +- userguide/tips/emr.html | 53 +- userguide/tips/ensemble_learning.html | 37 +- userguide/tips/general_tips.html | 37 +- userguide/tips/hadoop_tuning.html | 48 +- userguide/tips/index.html | 37 +- userguide/tips/mixserver.html | 64 +- userguide/tips/rand_amplify.html | 57 +- userguide/tips/rowid.html | 63 +- userguide/tips/rt_prediction.html | 66 +- userguide/troubleshooting/asterisk.html | 37 +- userguide/troubleshooting/index.html | 37 +- .../troubleshooting/mapjoin_classcastex.html | 37 +- .../troubleshooting/mapjoin_task_error.html | 37 +- userguide/troubleshooting/num_mappers.html | 37 +- userguide/troubleshooting/oom.html | 37 +- 87 files changed, 5327 insertions(+), 397 deletions(-) ---------------------------------------------------------------------- http://git-wip-us.apache.org/repos/asf/incubator-hivemall-site/blob/68241a08/userguide/FOOTER.md ---------------------------------------------------------------------- diff --git a/userguide/FOOTER.md b/userguide/FOOTER.md index 588afbb..b6f2c55 100644 --- a/userguide/FOOTER.md +++ b/userguide/FOOTER.md @@ -1,3 +1,22 @@ +<!-- + Licensed to the Apache Software Foundation (ASF) under one + or more contributor license agreements. See the NOTICE file + distributed with this work for additional information + regarding copyright ownership. The ASF licenses this file + to you under the Apache License, Version 2.0 (the + "License"); you may not use this file except in compliance + with the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, + software distributed under the License is distributed on an + "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + KIND, either express or implied. See the License for the + specific language governing permissions and limitations + under the License. +--> + <sub><font color="gray"> Apache Hivemall is an effort undergoing incubation at The Apache Software Foundation (ASF), sponsored by the Apache Incubator. </font></sub> \ No newline at end of file http://git-wip-us.apache.org/repos/asf/incubator-hivemall-site/blob/68241a08/userguide/anomaly/lof.html ---------------------------------------------------------------------- diff --git a/userguide/anomaly/lof.html b/userguide/anomaly/lof.html index 4ccba15..53d6d5b 100644 --- a/userguide/anomaly/lof.html +++ b/userguide/anomaly/lof.html @@ -997,6 +997,21 @@ </li> + <li class="chapter " data-level="5.6" data-path="../binaryclass/titanic_rf.html"> + + <a href="../binaryclass/titanic_rf.html"> + + + <b>5.6.</b> + + Kaggle Titanic Tutorial + + </a> + + + + </li> + @@ -1648,6 +1663,18 @@ under the License. --> <p>This article introduce how to find outliers using <a href="http://en.wikipedia.org/wiki/Local_outlier_factor" target="_blank">Local Outlier Detection (LOF)</a> on Hivemall.</p> +<!-- toc --><div id="toc" class="toc"> + +<ul> +<li><a href="#data-preparation">Data Preparation</a><ul> +<li><a href="#apply-data-normalization">Apply Data Normalization</a></li> +</ul> +</li> +<li><a href="#outlier-detection-using-local-outlier-facotor-lof">Outlier Detection using Local Outlier Facotor (LOF)</a></li> +<li><a href="#parallelize-top-k-computation">Parallelize Top-k computation</a></li> +</ul> + +</div><!-- tocstop --> <h1 id="data-preparation">Data Preparation</h1> <pre><code class="lang-sql"><span class="hljs-keyword">create</span> <span class="hljs-keyword">database</span> lof; <span class="hljs-keyword">use</span> lof; @@ -1662,8 +1689,8 @@ <span class="hljs-keyword">FIELDS</span> <span class="hljs-keyword">TERMINATED</span> <span class="hljs-keyword">BY</span> <span class="hljs-string">' '</span> <span class="hljs-keyword">STORED</span> <span class="hljs-keyword">AS</span> TEXTFILE LOCATION <span class="hljs-string">'/dataset/lof/hundred_balls'</span>; </code></pre> -<p>Download <a href="https://github.com/myui/hivemall/blob/master/resources/examples/lof/hundred_balls.txt" target="_blank">hundred_balls.txt</a> that is originally provides in <a href="http://next.rikunabi.com/tech/docs/ct_s03600.jsp?p=002259" target="_blank">this article</a>.</p> -<p>You can find outliers in <a href="http://next.rikunabi.com/tech/contents/ts_report/img/201303/002259/part1_img1.jpg" target="_blank">this picture</a>. As you can see, Rowid <code>87</code> is apparently an outlier.</p> +<p>Download <a href="https://gist.githubusercontent.com/myui/f8b44ab925bc198e6d11b18fdd21269d/raw/bed05f811e4c351ed959e0159405690f2f11e577/hundred_balls.txt" target="_blank">hundred_balls.txt</a> that is originally provides in <a href="http://next.rikunabi.com/tech/docs/ct_s03600.jsp?p=002259" target="_blank">this article</a>.</p> +<p>In this example, Rowid <code>87</code> is apparently an outlier.</p> <pre><code class="lang-sh">awk <span class="hljs-string">'{FS=" "; OFS=" "; print NR,$0}'</span> hundred_balls.txt | \ hadoop fs -put - /dataset/lof/hundred_balls/hundred_balls.txt </code></pre> @@ -1753,9 +1780,9 @@ norm_fv <span class="hljs-keyword">as</span> ( t1.<span class="hljs-keyword">rowid</span> != t2.<span class="hljs-keyword">rowid</span> ; </code></pre> -<p><em>Note: <code>list_neighbours</code> table SHOULD be created because <code>list_neighbours</code> is used multiple times.</em></p> -<p><em>Note: <a href="https://github.com/myui/hivemall/pull/196" target="_blank"><code>each_top_k</code></a> is supported from Hivemall v0.3.2-3 or later.</em></p> -<p><em>Note: To parallelize a top-k computation, break LEFT-hand table into piece as describe in <a href="https://github.com/myui/hivemall/wiki/Efficient-Top-k-computation-on-Apache-Hive-using-Hivemall-UDTF#parallelization-of-similarity-computation-using-with-clause" target="_blank">this page</a>.</em></p> +<div class="panel panel-warning"><div class="panel-heading"><h3 class="panel-title" id="caution"><i class="fa fa-exclamation-triangle"></i> Caution</h3></div><div class="panel-body"><p><code>list_neighbours</code> table SHOULD be created because <code>list_neighbours</code> is used multiple times.</p></div></div> +<h1 id="parallelize-top-k-computation">Parallelize Top-k computation</h1> +<div class="panel panel-info"><div class="panel-heading"><h3 class="panel-title" id="info"><i class="fa fa-info"></i> Info</h3></div><div class="panel-body"><p>To parallelize a top-k computation, break LEFT-hand table into piece as describe in <a href="../misc/topk.html">this page</a>.</p></div></div> <pre><code class="lang-sql">WITH k_distance as ( <span class="hljs-keyword">select</span> target, @@ -1804,7 +1831,25 @@ neighbours_lrd <span class="hljs-keyword">as</span> ( <pre><code>> 87 3.031143749957831 > 16 1.9755564408378874 > 1 1.8415763570939774 -</code></pre><p><div id="page-footer"><hr><p><sub><font color="gray"> +</code></pre><p><div id="page-footer"><hr><!-- + Licensed to the Apache Software Foundation (ASF) under one + or more contributor license agreements. See the NOTICE file + distributed with this work for additional information + regarding copyright ownership. The ASF licenses this file + to you under the Apache License, Version 2.0 (the + "License"); you may not use this file except in compliance + with the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, + software distributed under the License is distributed on an + "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + KIND, either express or implied. See the License for the + specific language governing permissions and limitations + under the License. +--> +<p><sub><font color="gray"> Apache Hivemall is an effort undergoing incubation at The Apache Software Foundation (ASF), sponsored by the Apache Incubator. </font></sub></p> </div></p> @@ -1841,7 +1886,7 @@ Apache Hivemall is an effort undergoing incubation at The Apache Software Founda <script> var gitbook = gitbook || []; gitbook.push(function() { - gitbook.page.hasChanged({"page":{"title":"Outlier Detection using Local Outlier Factor (LOF)","level":"9.1","depth":1,"next":{"title":"Hivemall on Apache Spark","level":"10.1","depth":1,"url":"https://github.com/maropu/hivemall-spark","ref":"https://github.com/maropu/hivemall-spark","articles":[]},"previous":{"title":"10-fold Cross Validation (Matrix Factorization)","level":"8.3.4","depth":2,"path":"recommend/movielens_cv.md","ref":"recommend/movielens_cv.md","articles":[]},"dir":"ltr"},"config":{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-filename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"maxdepth":3,"mindepth":1,"notoc ":true},"github":{"url":"https://github.com/apache/incubator-hivemall/"},"splitter":{},"search":{},"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.apache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"https://github.com/apache/incubator-hivemall/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css" ,"print":"styles/print.css"},"showLevel":true},"anchorjs":{"selector":"h1,h2,h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"sidebar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"anomaly/lof.md","mtime":"2016-11-12T07:18:00.000Z","type":"markdown"},"gitbook":{"version":"3.2.2","time":"2016-11-14T10:40:22.987Z"},"basePath":"..","book":{"language":""}}); + gitbook.page.hasChanged({"page":{"title":"Outlier Detection using Local Outlier Factor (LOF)","level":"9.1","depth":1,"next":{"title":"Hivemall on Apache Spark","level":"10.1","depth":1,"url":"https://github.com/maropu/hivemall-spark","ref":"https://github.com/maropu/hivemall-spark","articles":[]},"previous":{"title":"10-fold Cross Validation (Matrix Factorization)","level":"8.3.4","depth":2,"path":"recommend/movielens_cv.md","ref":"recommend/movielens_cv.md","articles":[]},"dir":"ltr"},"config":{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-filename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"maxdepth":3,"mindepth":1,"notoc ":true},"github":{"url":"https://github.com/apache/incubator-hivemall/"},"splitter":{},"search":{},"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.apache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"https://github.com/apache/incubator-hivemall/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css" ,"print":"styles/print.css"},"showLevel":true},"anchorjs":{"selector":"h1,h2,h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"sidebar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"anomaly/lof.md","mtime":"2016-11-17T09:55:36.000Z","type":"markdown"},"gitbook":{"version":"3.2.2","time":"2016-11-17T12:16:14.647Z"},"basePath":"..","book":{"language":""}}); }); </script> </div> http://git-wip-us.apache.org/repos/asf/incubator-hivemall-site/blob/68241a08/userguide/binaryclass/a9a.html ---------------------------------------------------------------------- diff --git a/userguide/binaryclass/a9a.html b/userguide/binaryclass/a9a.html index 70b0d67..36d53ea 100644 --- a/userguide/binaryclass/a9a.html +++ b/userguide/binaryclass/a9a.html @@ -999,6 +999,21 @@ </li> + <li class="chapter " data-level="5.6" data-path="titanic_rf.html"> + + <a href="titanic_rf.html"> + + + <b>5.6.</b> + + Kaggle Titanic Tutorial + + </a> + + + + </li> + @@ -1649,7 +1664,25 @@ specific language governing permissions and limitations under the License. --> -<p><div id="page-footer"><hr><p><sub><font color="gray"> +<p><div id="page-footer"><hr><!-- + Licensed to the Apache Software Foundation (ASF) under one + or more contributor license agreements. See the NOTICE file + distributed with this work for additional information + regarding copyright ownership. The ASF licenses this file + to you under the Apache License, Version 2.0 (the + "License"); you may not use this file except in compliance + with the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, + software distributed under the License is distributed on an + "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + KIND, either express or implied. See the License for the + specific language governing permissions and limitations + under the License. +--> +<p><sub><font color="gray"> Apache Hivemall is an effort undergoing incubation at The Apache Software Foundation (ASF), sponsored by the Apache Incubator. </font></sub></p> </div></p> @@ -1686,7 +1719,7 @@ Apache Hivemall is an effort undergoing incubation at The Apache Software Founda <script> var gitbook = gitbook || []; gitbook.push(function() { - gitbook.page.hasChanged({"page":{"title":"a9a Tutorial","level":"5.1","depth":1,"next":{"title":"Data preparation","level":"5.1.1","depth":2,"path":"binaryclass/a9a_dataset.md","ref":"binaryclass/a9a_dataset.md","articles":[]},"previous":{"title":"Logistic Regression data generation","level":"4.2.1","depth":2,"path":"eval/lr_datagen.md","ref":"eval/lr_datagen.md","articles":[]},"dir":"ltr"},"config":{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-filename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"maxdepth":3,"mindepth":1,"notoc":true},"github":{"url":"https://github.com/apache/incubator-hivemall/"},"splitter":{},"search":{} ,"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.apache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"https://github.com/apache/incubator-hivemall/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"showLevel":true},"anchorjs":{"selector":"h1,h2,h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"sidebar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"binaryclass/a9a.md","mtime":"2016-11-12T07:18:00.000Z","type":"markdown"},"gitbook":{"version":"3.2.2","time":"2016-11-14T10:40:22.987Z"},"basePath":"..","book":{"language":""}}); + gitbook.page.hasChanged({"page":{"title":"a9a Tutorial","level":"5.1","depth":1,"next":{"title":"Data preparation","level":"5.1.1","depth":2,"path":"binaryclass/a9a_dataset.md","ref":"binaryclass/a9a_dataset.md","articles":[]},"previous":{"title":"Logistic Regression data generation","level":"4.2.1","depth":2,"path":"eval/lr_datagen.md","ref":"eval/lr_datagen.md","articles":[]},"dir":"ltr"},"config":{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-filename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"maxdepth":3,"mindepth":1,"notoc":true},"github":{"url":"https://github.com/apache/incubator-hivemall/"},"splitter":{},"search":{} ,"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.apache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"https://github.com/apache/incubator-hivemall/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"showLevel":true},"anchorjs":{"selector":"h1,h2,h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"sidebar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"binaryclass/a9a.md","mtime":"2016-11-16T08:39:12.000Z","type":"markdown"},"gitbook":{"version":"3.2.2","time":"2016-11-17T12:16:14.647Z"},"basePath":"..","book":{"language":""}}); }); </script> </div> http://git-wip-us.apache.org/repos/asf/incubator-hivemall-site/blob/68241a08/userguide/binaryclass/a9a_dataset.html ---------------------------------------------------------------------- diff --git a/userguide/binaryclass/a9a_dataset.html b/userguide/binaryclass/a9a_dataset.html index 5f23143..9220b9c 100644 --- a/userguide/binaryclass/a9a_dataset.html +++ b/userguide/binaryclass/a9a_dataset.html @@ -999,6 +999,21 @@ </li> + <li class="chapter " data-level="5.6" data-path="titanic_rf.html"> + + <a href="titanic_rf.html"> + + + <b>5.6.</b> + + Kaggle Titanic Tutorial + + </a> + + + + </li> + @@ -1679,7 +1694,25 @@ hadoop fs -copyFromLocal a9a.test /dataset/a9a/test features <span class="hljs-built_in">ARRAY</span><<span class="hljs-keyword">STRING</span>> ) <span class="hljs-keyword">ROW</span> <span class="hljs-keyword">FORMAT</span> <span class="hljs-keyword">DELIMITED</span> <span class="hljs-keyword">FIELDS</span> <span class="hljs-keyword">TERMINATED</span> <span class="hljs-keyword">BY</span> <span class="hljs-string">'\t'</span> COLLECTION ITEMS <span class="hljs-keyword">TERMINATED</span> <span class="hljs-keyword">BY</span> <span class="hljs-string">","</span> <span class="hljs-keyword">STORED</span> <span class="hljs-keyword">AS</span> TEXTFILE LOCATION <span class="hljs-string">'/dataset/a9a/test'</span>; </code></pre> -<p><div id="page-footer"><hr><p><sub><font color="gray"> +<p><div id="page-footer"><hr><!-- + Licensed to the Apache Software Foundation (ASF) under one + or more contributor license agreements. See the NOTICE file + distributed with this work for additional information + regarding copyright ownership. The ASF licenses this file + to you under the Apache License, Version 2.0 (the + "License"); you may not use this file except in compliance + with the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, + software distributed under the License is distributed on an + "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + KIND, either express or implied. See the License for the + specific language governing permissions and limitations + under the License. +--> +<p><sub><font color="gray"> Apache Hivemall is an effort undergoing incubation at The Apache Software Foundation (ASF), sponsored by the Apache Incubator. </font></sub></p> </div></p> @@ -1716,7 +1749,7 @@ Apache Hivemall is an effort undergoing incubation at The Apache Software Founda <script> var gitbook = gitbook || []; gitbook.push(function() { - gitbook.page.hasChanged({"page":{"title":"Data preparation","level":"5.1.1","depth":2,"next":{"title":"Logistic Regression","level":"5.1.2","depth":2,"path":"binaryclass/a9a_lr.md","ref":"binaryclass/a9a_lr.md","articles":[]},"previous":{"title":"a9a Tutorial","level":"5.1","depth":1,"path":"binaryclass/a9a.md","ref":"binaryclass/a9a.md","articles":[{"title":"Data preparation","level":"5.1.1","depth":2,"path":"binaryclass/a9a_dataset.md","ref":"binaryclass/a9a_dataset.md","articles":[]},{"title":"Logistic Regression","level":"5.1.2","depth":2,"path":"binaryclass/a9a_lr.md","ref":"binaryclass/a9a_lr.md","articles":[]},{"title":"Mini-batch Gradient Descent","level":"5.1.3","depth":2,"path":"binaryclass/a9a_minibatch.md","ref":"binaryclass/a9a_minibatch.md","articles":[]}]},"dir":"ltr"},"config":{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-fi lename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"maxdepth":3,"mindepth":1,"notoc":true},"github":{"url":"https://github.com/apache/incubator-hivemall/"},"splitter":{},"search":{},"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.apache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["fa cebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"https://github.com/apache/incubator-hivemall/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"showLevel":true},"anchorjs":{"selector":"h1,h2,h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"sidebar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"binaryclass/a 9a_dataset.md","mtime":"2016-11-12T07:18:00.000Z","type":"markdown"},"gitbook":{"version":"3.2.2","time":"2016-11-14T10:40:22.987Z"},"basePath":"..","book":{"language":""}}); + gitbook.page.hasChanged({"page":{"title":"Data preparation","level":"5.1.1","depth":2,"next":{"title":"Logistic Regression","level":"5.1.2","depth":2,"path":"binaryclass/a9a_lr.md","ref":"binaryclass/a9a_lr.md","articles":[]},"previous":{"title":"a9a Tutorial","level":"5.1","depth":1,"path":"binaryclass/a9a.md","ref":"binaryclass/a9a.md","articles":[{"title":"Data preparation","level":"5.1.1","depth":2,"path":"binaryclass/a9a_dataset.md","ref":"binaryclass/a9a_dataset.md","articles":[]},{"title":"Logistic Regression","level":"5.1.2","depth":2,"path":"binaryclass/a9a_lr.md","ref":"binaryclass/a9a_lr.md","articles":[]},{"title":"Mini-batch Gradient Descent","level":"5.1.3","depth":2,"path":"binaryclass/a9a_minibatch.md","ref":"binaryclass/a9a_minibatch.md","articles":[]}]},"dir":"ltr"},"config":{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-fi lename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"maxdepth":3,"mindepth":1,"notoc":true},"github":{"url":"https://github.com/apache/incubator-hivemall/"},"splitter":{},"search":{},"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.apache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["fa cebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"https://github.com/apache/incubator-hivemall/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"showLevel":true},"anchorjs":{"selector":"h1,h2,h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"sidebar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"binaryclass/a 9a_dataset.md","mtime":"2016-11-16T08:39:12.000Z","type":"markdown"},"gitbook":{"version":"3.2.2","time":"2016-11-17T12:16:14.647Z"},"basePath":"..","book":{"language":""}}); }); </script> </div> http://git-wip-us.apache.org/repos/asf/incubator-hivemall-site/blob/68241a08/userguide/binaryclass/a9a_lr.html ---------------------------------------------------------------------- diff --git a/userguide/binaryclass/a9a_lr.html b/userguide/binaryclass/a9a_lr.html index a1820e1..f5519e6 100644 --- a/userguide/binaryclass/a9a_lr.html +++ b/userguide/binaryclass/a9a_lr.html @@ -999,6 +999,21 @@ </li> + <li class="chapter " data-level="5.6" data-path="titanic_rf.html"> + + <a href="titanic_rf.html"> + + + <b>5.6.</b> + + Kaggle Titanic Tutorial + + </a> + + + + </li> + @@ -1649,11 +1664,17 @@ specific language governing permissions and limitations under the License. --> -<h1 id="a9a">a9a</h1> -<p><a href="http://www.csie.ntu.edu.tw/~cjlin/libsvmtools/datasets/binary.html#a9a" target="_blank">http://www.csie.ntu.edu.tw/~cjlin/libsvmtools/datasets/binary.html#a9a</a></p> -<p><em>Training with iterations is OBSOLUTE in Hivemall.</em><br><em>Using amplifier and shuffling inputs is RECOMMENDED in Hivemall.</em></p> -<hr> -<h2 id="udf-preparation">UDF preparation</h2> +<!-- toc --><div id="toc" class="toc"> + +<ul> +<li><a href="#udf-preparation">UDF preparation</a></li> +<li><a href="#training">training</a></li> +<li><a href="#prediction">prediction</a></li> +<li><a href="#evaluation">evaluation</a></li> +</ul> + +</div><!-- tocstop --> +<h1 id="udf-preparation">UDF preparation</h1> <pre><code class="lang-sql"><span class="hljs-keyword">select</span> <span class="hljs-keyword">count</span>(<span class="hljs-number">1</span>) <span class="hljs-keyword">from</span> a9atrain; <span class="hljs-comment">-- set total_steps ideally be "count(1) / #map tasks"</span> <span class="hljs-keyword">set</span> hivevar:total_steps=<span class="hljs-number">32561</span>; @@ -1661,7 +1682,7 @@ <span class="hljs-keyword">select</span> <span class="hljs-keyword">count</span>(<span class="hljs-number">1</span>) <span class="hljs-keyword">from</span> a9atest; <span class="hljs-keyword">set</span> hivevar:num_test_instances=<span class="hljs-number">16281</span>; </code></pre> -<h2 id="training">training</h2> +<h1 id="training">training</h1> <pre><code class="lang-sql"><span class="hljs-keyword">create</span> <span class="hljs-keyword">table</span> a9a_model1 <span class="hljs-keyword">as</span> <span class="hljs-keyword">select</span> @@ -1676,7 +1697,7 @@ <span class="hljs-keyword">group</span> <span class="hljs-keyword">by</span> feature; </code></pre> <p><em>"-total_steps" option is optional for logress() function.</em><br><em>I recommend you NOT to use options (e.g., total_steps and eta0) if you are not familiar with those options. Hivemall then uses an autonomic ETA (learning rate) estimator.</em></p> -<h2 id="prediction">prediction</h2> +<h1 id="prediction">prediction</h1> <pre><code class="lang-sql"><span class="hljs-keyword">create</span> <span class="hljs-keyword">or</span> <span class="hljs-keyword">replace</span> <span class="hljs-keyword">view</span> a9a_predict1 <span class="hljs-keyword">as</span> <span class="hljs-keyword">WITH</span> a9atest_exploded <span class="hljs-keyword">as</span> ( @@ -1698,7 +1719,7 @@ <span class="hljs-keyword">group</span> <span class="hljs-keyword">by</span> t.<span class="hljs-keyword">rowid</span>; </code></pre> -<h2 id="evaluation">evaluation</h2> +<h1 id="evaluation">evaluation</h1> <pre><code class="lang-sql"><span class="hljs-keyword">create</span> <span class="hljs-keyword">or</span> <span class="hljs-keyword">replace</span> <span class="hljs-keyword">view</span> a9a_submit1 <span class="hljs-keyword">as</span> <span class="hljs-keyword">select</span> t.label <span class="hljs-keyword">as</span> actual, @@ -1712,12 +1733,30 @@ <span class="hljs-keyword">where</span> actual == predicted; </code></pre> <blockquote> -<p>0.8430071862907684 -<div id="page-footer"><hr><p><sub><font color="gray"> +<p>0.8430071862907684</p> +</blockquote> +<p><div id="page-footer"><hr><!-- + Licensed to the Apache Software Foundation (ASF) under one + or more contributor license agreements. See the NOTICE file + distributed with this work for additional information + regarding copyright ownership. The ASF licenses this file + to you under the Apache License, Version 2.0 (the + "License"); you may not use this file except in compliance + with the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, + software distributed under the License is distributed on an + "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + KIND, either express or implied. See the License for the + specific language governing permissions and limitations + under the License. +--> +<p><sub><font color="gray"> Apache Hivemall is an effort undergoing incubation at The Apache Software Foundation (ASF), sponsored by the Apache Incubator. </font></sub></p> </div></p> -</blockquote> </section> @@ -1751,7 +1790,7 @@ Apache Hivemall is an effort undergoing incubation at The Apache Software Founda <script> var gitbook = gitbook || []; gitbook.push(function() { - gitbook.page.hasChanged({"page":{"title":"Logistic Regression","level":"5.1.2","depth":2,"next":{"title":"Mini-batch Gradient Descent","level":"5.1.3","depth":2,"path":"binaryclass/a9a_minibatch.md","ref":"binaryclass/a9a_minibatch.md","articles":[]},"previous":{"title":"Data preparation","level":"5.1.1","depth":2,"path":"binaryclass/a9a_dataset.md","ref":"binaryclass/a9a_dataset.md","articles":[]},"dir":"ltr"},"config":{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-filename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"maxdepth":3,"mindepth":1,"notoc":true},"github":{"url":"https://github.com/apache/incubator-hivemall/"},"spl itter":{},"search":{},"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.apache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"https://github.com/apache/incubator-hivemall/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"showLevel":true},"anchorjs":{"selector":"h1,h2, h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"sidebar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"binaryclass/a9a_lr.md","mtime":"2016-11-12T07:18:00.000Z","type":"markdown"},"gitbook":{"version":"3.2.2","time":"2016-11-14T10:40:22.987Z"},"basePath":"..","book":{"language":""}}); + gitbook.page.hasChanged({"page":{"title":"Logistic Regression","level":"5.1.2","depth":2,"next":{"title":"Mini-batch Gradient Descent","level":"5.1.3","depth":2,"path":"binaryclass/a9a_minibatch.md","ref":"binaryclass/a9a_minibatch.md","articles":[]},"previous":{"title":"Data preparation","level":"5.1.1","depth":2,"path":"binaryclass/a9a_dataset.md","ref":"binaryclass/a9a_dataset.md","articles":[]},"dir":"ltr"},"config":{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-filename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"maxdepth":3,"mindepth":1,"notoc":true},"github":{"url":"https://github.com/apache/incubator-hivemall/"},"spl itter":{},"search":{},"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.apache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"https://github.com/apache/incubator-hivemall/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"showLevel":true},"anchorjs":{"selector":"h1,h2, h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"sidebar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"binaryclass/a9a_lr.md","mtime":"2016-11-17T12:04:04.000Z","type":"markdown"},"gitbook":{"version":"3.2.2","time":"2016-11-17T12:16:14.647Z"},"basePath":"..","book":{"language":""}}); }); </script> </div> http://git-wip-us.apache.org/repos/asf/incubator-hivemall-site/blob/68241a08/userguide/binaryclass/a9a_minibatch.html ---------------------------------------------------------------------- diff --git a/userguide/binaryclass/a9a_minibatch.html b/userguide/binaryclass/a9a_minibatch.html index 5ac7cf9..db85d8a 100644 --- a/userguide/binaryclass/a9a_minibatch.html +++ b/userguide/binaryclass/a9a_minibatch.html @@ -999,6 +999,21 @@ </li> + <li class="chapter " data-level="5.6" data-path="titanic_rf.html"> + + <a href="titanic_rf.html"> + + + <b>5.6.</b> + + Kaggle Titanic Tutorial + + </a> + + + + </li> + @@ -1649,10 +1664,10 @@ specific language governing permissions and limitations under the License. --> -<p>This page explains how to apply <a href="https://class.coursera.org/ml-003/lecture/106" target="_blank">Mini-Batch Gradient Descent</a> for the training of logistic regression explained in <a href="https://github.com/myui/hivemall/wiki/a9a-binary-classification-(logistic-regression" target="_blank">this example</a>). </p> -<p>See <a href="https://github.com/myui/hivemall/wiki/a9a-binary-classification-(logistic-regression" target="_blank">this page</a>) first. This content depends on it.</p> +<p>This page explains how to apply <a href="https://class.coursera.org/ml-003/lecture/106" target="_blank">Mini-Batch Gradient Descent</a> for the training of logistic regression explained in <a href="a9a_lr.html">this example</a>. +So, refer <a href="a9a_lr.html">this page</a> first. This content depends on it.</p> <h1 id="training">Training</h1> -<p>Replace <code>a9a_model1</code> of <a href="https://github.com/myui/hivemall/wiki/a9a-binary-classification-(logistic-regression" target="_blank">this example</a>).</p> +<p>Replace <code>a9a_model1</code> of <a href="a9a_lr.html">this example</a>.</p> <pre><code class="lang-sql"><span class="hljs-keyword">set</span> hivevar:total_steps=<span class="hljs-number">32561</span>; <span class="hljs-keyword">set</span> hivevar:mini_batch_size=<span class="hljs-number">10</span>; @@ -1687,7 +1702,25 @@ </tr> </tbody> </table> -<p><div id="page-footer"><hr><p><sub><font color="gray"> +<p><div id="page-footer"><hr><!-- + Licensed to the Apache Software Foundation (ASF) under one + or more contributor license agreements. See the NOTICE file + distributed with this work for additional information + regarding copyright ownership. The ASF licenses this file + to you under the Apache License, Version 2.0 (the + "License"); you may not use this file except in compliance + with the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, + software distributed under the License is distributed on an + "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + KIND, either express or implied. See the License for the + specific language governing permissions and limitations + under the License. +--> +<p><sub><font color="gray"> Apache Hivemall is an effort undergoing incubation at The Apache Software Foundation (ASF), sponsored by the Apache Incubator. </font></sub></p> </div></p> @@ -1724,7 +1757,7 @@ Apache Hivemall is an effort undergoing incubation at The Apache Software Founda <script> var gitbook = gitbook || []; gitbook.push(function() { - gitbook.page.hasChanged({"page":{"title":"Mini-batch Gradient Descent","level":"5.1.3","depth":2,"next":{"title":"News20 Tutorial","level":"5.2","depth":1,"path":"binaryclass/news20.md","ref":"binaryclass/news20.md","articles":[{"title":"Data preparation","level":"5.2.1","depth":2,"path":"binaryclass/news20_dataset.md","ref":"binaryclass/news20_dataset.md","articles":[]},{"title":"Perceptron, Passive Aggressive","level":"5.2.2","depth":2,"path":"binaryclass/news20_pa.md","ref":"binaryclass/news20_pa.md","articles":[]},{"title":"CW, AROW, SCW","level":"5.2.3","depth":2,"path":"binaryclass/news20_scw.md","ref":"binaryclass/news20_scw.md","articles":[]},{"title":"AdaGradRDA, AdaGrad, AdaDelta","level":"5.2.4","depth":2,"path":"binaryclass/news20_adagrad.md","ref":"binaryclass/news20_adagrad.md","articles":[]}]},"previous":{"title":"Logistic Regression","level":"5.1.2","depth":2,"path":"binaryclass/a9a_lr.md","ref":"binaryclass/a9a_lr.md","articles":[]},"dir":"ltr"},"config" :{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-filename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"maxdepth":3,"mindepth":1,"notoc":true},"github":{"url":"https://github.com/apache/incubator-hivemall/"},"splitter":{},"search":{},"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.a pache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"https://github.com/apache/incubator-hivemall/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"showLevel":true},"anchorjs":{"selector":"h1,h2,h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"si debar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"binaryclass/a9a_minibatch.md","mtime":"2016-11-12T07:18:00.000Z","type":"markdown"},"gitbook":{"version":"3.2.2","time":"2016-11-14T10:40:22.987Z"},"basePath":"..","book":{"language":""}}); + gitbook.page.hasChanged({"page":{"title":"Mini-batch Gradient Descent","level":"5.1.3","depth":2,"next":{"title":"News20 Tutorial","level":"5.2","depth":1,"path":"binaryclass/news20.md","ref":"binaryclass/news20.md","articles":[{"title":"Data preparation","level":"5.2.1","depth":2,"path":"binaryclass/news20_dataset.md","ref":"binaryclass/news20_dataset.md","articles":[]},{"title":"Perceptron, Passive Aggressive","level":"5.2.2","depth":2,"path":"binaryclass/news20_pa.md","ref":"binaryclass/news20_pa.md","articles":[]},{"title":"CW, AROW, SCW","level":"5.2.3","depth":2,"path":"binaryclass/news20_scw.md","ref":"binaryclass/news20_scw.md","articles":[]},{"title":"AdaGradRDA, AdaGrad, AdaDelta","level":"5.2.4","depth":2,"path":"binaryclass/news20_adagrad.md","ref":"binaryclass/news20_adagrad.md","articles":[]}]},"previous":{"title":"Logistic Regression","level":"5.1.2","depth":2,"path":"binaryclass/a9a_lr.md","ref":"binaryclass/a9a_lr.md","articles":[]},"dir":"ltr"},"config" :{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-filename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"maxdepth":3,"mindepth":1,"notoc":true},"github":{"url":"https://github.com/apache/incubator-hivemall/"},"splitter":{},"search":{},"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.a pache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"https://github.com/apache/incubator-hivemall/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"showLevel":true},"anchorjs":{"selector":"h1,h2,h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"si debar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"binaryclass/a9a_minibatch.md","mtime":"2016-11-17T10:03:51.000Z","type":"markdown"},"gitbook":{"version":"3.2.2","time":"2016-11-17T12:16:14.647Z"},"basePath":"..","book":{"language":""}}); }); </script> </div> http://git-wip-us.apache.org/repos/asf/incubator-hivemall-site/blob/68241a08/userguide/binaryclass/kdd2010a.html ---------------------------------------------------------------------- diff --git a/userguide/binaryclass/kdd2010a.html b/userguide/binaryclass/kdd2010a.html index 1429b50..851d032 100644 --- a/userguide/binaryclass/kdd2010a.html +++ b/userguide/binaryclass/kdd2010a.html @@ -999,6 +999,21 @@ </li> + <li class="chapter " data-level="5.6" data-path="titanic_rf.html"> + + <a href="titanic_rf.html"> + + + <b>5.6.</b> + + Kaggle Titanic Tutorial + + </a> + + + + </li> + @@ -1649,7 +1664,25 @@ specific language governing permissions and limitations under the License. --> -<p><div id="page-footer"><hr><p><sub><font color="gray"> +<p><div id="page-footer"><hr><!-- + Licensed to the Apache Software Foundation (ASF) under one + or more contributor license agreements. See the NOTICE file + distributed with this work for additional information + regarding copyright ownership. The ASF licenses this file + to you under the Apache License, Version 2.0 (the + "License"); you may not use this file except in compliance + with the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, + software distributed under the License is distributed on an + "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + KIND, either express or implied. See the License for the + specific language governing permissions and limitations + under the License. +--> +<p><sub><font color="gray"> Apache Hivemall is an effort undergoing incubation at The Apache Software Foundation (ASF), sponsored by the Apache Incubator. </font></sub></p> </div></p> @@ -1686,7 +1719,7 @@ Apache Hivemall is an effort undergoing incubation at The Apache Software Founda <script> var gitbook = gitbook || []; gitbook.push(function() { - gitbook.page.hasChanged({"page":{"title":"KDD2010a Tutorial","level":"5.3","depth":1,"next":{"title":"Data preparation","level":"5.3.1","depth":2,"path":"binaryclass/kdd2010a_dataset.md","ref":"binaryclass/kdd2010a_dataset.md","articles":[]},"previous":{"title":"AdaGradRDA, AdaGrad, AdaDelta","level":"5.2.4","depth":2,"path":"binaryclass/news20_adagrad.md","ref":"binaryclass/news20_adagrad.md","articles":[]},"dir":"ltr"},"config":{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-filename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"maxdepth":3,"mindepth":1,"notoc":true},"github":{"url":"https://github.com/apache/incubator-hivema ll/"},"splitter":{},"search":{},"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.apache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"https://github.com/apache/incubator-hivemall/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"showLevel":true},"anchorjs":{"selecto r":"h1,h2,h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"sidebar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"binaryclass/kdd2010a.md","mtime":"2016-11-12T07:18:00.000Z","type":"markdown"},"gitbook":{"version":"3.2.2","time":"2016-11-14T10:40:22.987Z"},"basePath":"..","book":{"language":""}}); + gitbook.page.hasChanged({"page":{"title":"KDD2010a Tutorial","level":"5.3","depth":1,"next":{"title":"Data preparation","level":"5.3.1","depth":2,"path":"binaryclass/kdd2010a_dataset.md","ref":"binaryclass/kdd2010a_dataset.md","articles":[]},"previous":{"title":"AdaGradRDA, AdaGrad, AdaDelta","level":"5.2.4","depth":2,"path":"binaryclass/news20_adagrad.md","ref":"binaryclass/news20_adagrad.md","articles":[]},"dir":"ltr"},"config":{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-filename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"maxdepth":3,"mindepth":1,"notoc":true},"github":{"url":"https://github.com/apache/incubator-hivema ll/"},"splitter":{},"search":{},"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.apache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"https://github.com/apache/incubator-hivemall/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"showLevel":true},"anchorjs":{"selecto r":"h1,h2,h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"sidebar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"binaryclass/kdd2010a.md","mtime":"2016-11-16T08:39:12.000Z","type":"markdown"},"gitbook":{"version":"3.2.2","time":"2016-11-17T12:16:14.647Z"},"basePath":"..","book":{"language":""}}); }); </script> </div> http://git-wip-us.apache.org/repos/asf/incubator-hivemall-site/blob/68241a08/userguide/binaryclass/kdd2010a_dataset.html ---------------------------------------------------------------------- diff --git a/userguide/binaryclass/kdd2010a_dataset.html b/userguide/binaryclass/kdd2010a_dataset.html index 9dded23..8b6d26c 100644 --- a/userguide/binaryclass/kdd2010a_dataset.html +++ b/userguide/binaryclass/kdd2010a_dataset.html @@ -999,6 +999,21 @@ </li> + <li class="chapter " data-level="5.6" data-path="titanic_rf.html"> + + <a href="titanic_rf.html"> + + + <b>5.6.</b> + + Kaggle Titanic Tutorial + + </a> + + + + </li> + @@ -1651,12 +1666,9 @@ --> <p><a href="http://www.csie.ntu.edu.tw/~cjlin/libsvmtools/datasets/binary.html#kdd2010 (algebra" target="_blank">http://www.csie.ntu.edu.tw/~cjlin/libsvmtools/datasets/binary.html#kdd2010 (algebra)</a>)</p> <ul> -<li><h1 id="of-classes-2">of classes: 2</h1> -</li> -<li><h1 id="of-data-8407752-training--510302-testing">of data: 8,407,752 (training) / 510,302 (testing)</h1> -</li> -<li><h1 id="of-features-20216830-in-about-273-gb-training--20216830-testing">of features: 20,216,830 in about 2.73 GB (training) / 20,216,830 (testing)</h1> -</li> +<li>the number of classes: 2</li> +<li>the number of data: 8,407,752 (training) / 510,302 (testing)</li> +<li>the number of features: 20,216,830 in about 2.73 GB (training) / 20,216,830 (testing) </li> </ul> <hr> <h1 id="define-trainingtesting-tables">Define training/testing tables</h1> @@ -1719,7 +1731,25 @@ CLUSTER <span class="hljs-keyword">BY</span> <span class="hljs-keyword">rand</sp <span class="hljs-keyword">from</span> kdd10a_train_orcfile; </code></pre> -<p><div id="page-footer"><hr><p><sub><font color="gray"> +<p><div id="page-footer"><hr><!-- + Licensed to the Apache Software Foundation (ASF) under one + or more contributor license agreements. See the NOTICE file + distributed with this work for additional information + regarding copyright ownership. The ASF licenses this file + to you under the Apache License, Version 2.0 (the + "License"); you may not use this file except in compliance + with the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, + software distributed under the License is distributed on an + "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + KIND, either express or implied. See the License for the + specific language governing permissions and limitations + under the License. +--> +<p><sub><font color="gray"> Apache Hivemall is an effort undergoing incubation at The Apache Software Foundation (ASF), sponsored by the Apache Incubator. </font></sub></p> </div></p> @@ -1756,7 +1786,7 @@ Apache Hivemall is an effort undergoing incubation at The Apache Software Founda <script> var gitbook = gitbook || []; gitbook.push(function() { - gitbook.page.hasChanged({"page":{"title":"Data preparation","level":"5.3.1","depth":2,"next":{"title":"PA, CW, AROW, SCW","level":"5.3.2","depth":2,"path":"binaryclass/kdd2010a_scw.md","ref":"binaryclass/kdd2010a_scw.md","articles":[]},"previous":{"title":"KDD2010a Tutorial","level":"5.3","depth":1,"path":"binaryclass/kdd2010a.md","ref":"binaryclass/kdd2010a.md","articles":[{"title":"Data preparation","level":"5.3.1","depth":2,"path":"binaryclass/kdd2010a_dataset.md","ref":"binaryclass/kdd2010a_dataset.md","articles":[]},{"title":"PA, CW, AROW, SCW","level":"5.3.2","depth":2,"path":"binaryclass/kdd2010a_scw.md","ref":"binaryclass/kdd2010a_scw.md","articles":[]}]},"dir":"ltr"},"config":{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-filename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css ","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"maxdepth":3,"mindepth":1,"notoc":true},"github":{"url":"https://github.com/apache/incubator-hivemall/"},"splitter":{},"search":{},"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.apache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"https://github.com/apach e/incubator-hivemall/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"showLevel":true},"anchorjs":{"selector":"h1,h2,h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"sidebar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"binaryclass/kdd2010a_dataset.md","mtime":"2016-11-12T07:18:00.000Z","type":"markdown"},"gitbook":{"version":"3.2.2","time": "2016-11-14T10:40:22.987Z"},"basePath":"..","book":{"language":""}}); + gitbook.page.hasChanged({"page":{"title":"Data preparation","level":"5.3.1","depth":2,"next":{"title":"PA, CW, AROW, SCW","level":"5.3.2","depth":2,"path":"binaryclass/kdd2010a_scw.md","ref":"binaryclass/kdd2010a_scw.md","articles":[]},"previous":{"title":"KDD2010a Tutorial","level":"5.3","depth":1,"path":"binaryclass/kdd2010a.md","ref":"binaryclass/kdd2010a.md","articles":[{"title":"Data preparation","level":"5.3.1","depth":2,"path":"binaryclass/kdd2010a_dataset.md","ref":"binaryclass/kdd2010a_dataset.md","articles":[]},{"title":"PA, CW, AROW, SCW","level":"5.3.2","depth":2,"path":"binaryclass/kdd2010a_scw.md","ref":"binaryclass/kdd2010a_scw.md","articles":[]}]},"dir":"ltr"},"config":{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-filename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css ","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"maxdepth":3,"mindepth":1,"notoc":true},"github":{"url":"https://github.com/apache/incubator-hivemall/"},"splitter":{},"search":{},"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.apache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"https://github.com/apach e/incubator-hivemall/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"showLevel":true},"anchorjs":{"selector":"h1,h2,h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"sidebar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"binaryclass/kdd2010a_dataset.md","mtime":"2016-11-17T08:53:23.000Z","type":"markdown"},"gitbook":{"version":"3.2.2","time": "2016-11-17T12:16:14.647Z"},"basePath":"..","book":{"language":""}}); }); </script> </div> http://git-wip-us.apache.org/repos/asf/incubator-hivemall-site/blob/68241a08/userguide/binaryclass/kdd2010a_scw.html ---------------------------------------------------------------------- diff --git a/userguide/binaryclass/kdd2010a_scw.html b/userguide/binaryclass/kdd2010a_scw.html index dc0251d..6923897 100644 --- a/userguide/binaryclass/kdd2010a_scw.html +++ b/userguide/binaryclass/kdd2010a_scw.html @@ -999,6 +999,21 @@ </li> + <li class="chapter " data-level="5.6" data-path="titanic_rf.html"> + + <a href="titanic_rf.html"> + + + <b>5.6.</b> + + Kaggle Titanic Tutorial + + </a> + + + + </li> + @@ -1849,7 +1864,25 @@ </tr> </tbody> </table> -<p><div id="page-footer"><hr><p><sub><font color="gray"> +<p><div id="page-footer"><hr><!-- + Licensed to the Apache Software Foundation (ASF) under one + or more contributor license agreements. See the NOTICE file + distributed with this work for additional information + regarding copyright ownership. The ASF licenses this file + to you under the Apache License, Version 2.0 (the + "License"); you may not use this file except in compliance + with the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, + software distributed under the License is distributed on an + "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + KIND, either express or implied. See the License for the + specific language governing permissions and limitations + under the License. +--> +<p><sub><font color="gray"> Apache Hivemall is an effort undergoing incubation at The Apache Software Foundation (ASF), sponsored by the Apache Incubator. </font></sub></p> </div></p> @@ -1886,7 +1919,7 @@ Apache Hivemall is an effort undergoing incubation at The Apache Software Founda <script> var gitbook = gitbook || []; gitbook.push(function() { - gitbook.page.hasChanged({"page":{"title":"PA, CW, AROW, SCW","level":"5.3.2","depth":2,"next":{"title":"KDD2010b Tutorial","level":"5.4","depth":1,"path":"binaryclass/kdd2010b.md","ref":"binaryclass/kdd2010b.md","articles":[{"title":"Data preparation","level":"5.4.1","depth":2,"path":"binaryclass/kdd2010b_dataset.md","ref":"binaryclass/kdd2010b_dataset.md","articles":[]},{"title":"AROW","level":"5.4.2","depth":2,"path":"binaryclass/kdd2010b_arow.md","ref":"binaryclass/kdd2010b_arow.md","articles":[]}]},"previous":{"title":"Data preparation","level":"5.3.1","depth":2,"path":"binaryclass/kdd2010a_dataset.md","ref":"binaryclass/kdd2010a_dataset.md","articles":[]},"dir":"ltr"},"config":{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-filename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css"," epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"maxdepth":3,"mindepth":1,"notoc":true},"github":{"url":"https://github.com/apache/incubator-hivemall/"},"splitter":{},"search":{},"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.apache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"https://github.com/apache/i ncubator-hivemall/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"showLevel":true},"anchorjs":{"selector":"h1,h2,h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"sidebar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"binaryclass/kdd2010a_scw.md","mtime":"2016-11-12T07:18:00.000Z","type":"markdown"},"gitbook":{"version":"3.2.2","time":"2016-1 1-14T10:40:22.987Z"},"basePath":"..","book":{"language":""}}); + gitbook.page.hasChanged({"page":{"title":"PA, CW, AROW, SCW","level":"5.3.2","depth":2,"next":{"title":"KDD2010b Tutorial","level":"5.4","depth":1,"path":"binaryclass/kdd2010b.md","ref":"binaryclass/kdd2010b.md","articles":[{"title":"Data preparation","level":"5.4.1","depth":2,"path":"binaryclass/kdd2010b_dataset.md","ref":"binaryclass/kdd2010b_dataset.md","articles":[]},{"title":"AROW","level":"5.4.2","depth":2,"path":"binaryclass/kdd2010b_arow.md","ref":"binaryclass/kdd2010b_arow.md","articles":[]}]},"previous":{"title":"Data preparation","level":"5.3.1","depth":2,"path":"binaryclass/kdd2010a_dataset.md","ref":"binaryclass/kdd2010a_dataset.md","articles":[]},"dir":"ltr"},"config":{"plugins":["theme-api","edit-link","github","splitter","sitemap","etoc","callouts","toggle-chapters","anchorjs","codeblock-filename","expandable-chapters","multipart","codeblock-filename","katex","emphasize","localized-footer"],"styles":{"website":"styles/website.css","pdf":"styles/pdf.css"," epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"pluginsConfig":{"emphasize":{},"callouts":{},"etoc":{"maxdepth":3,"mindepth":1,"notoc":true},"github":{"url":"https://github.com/apache/incubator-hivemall/"},"splitter":{},"search":{},"downloadpdf":{"base":"https://github.com/apache/incubator-hivemall/docs/gitbook","label":"PDF","multilingual":false},"multipart":{},"localized-footer":{"filename":"FOOTER.md"},"lunr":{"maxIndexSize":1000000,"ignoreSpecialCharacters":false},"katex":{},"fontsettings":{"theme":"white","family":"sans","size":2,"font":"sans"},"highlight":{},"codeblock-filename":{},"sitemap":{"hostname":"http://hivemall.incubator.apache.org/"},"theme-api":{"languages":[],"split":false,"theme":"dark"},"sharing":{"facebook":true,"twitter":true,"google":false,"weibo":false,"instapaper":false,"vk":false,"all":["facebook","google","twitter","weibo","instapaper"]},"edit-link":{"label":"Edit","base":"https://github.com/apache/i ncubator-hivemall/docs/gitbook"},"theme-default":{"styles":{"website":"styles/website.css","pdf":"styles/pdf.css","epub":"styles/epub.css","mobi":"styles/mobi.css","ebook":"styles/ebook.css","print":"styles/print.css"},"showLevel":true},"anchorjs":{"selector":"h1,h2,h3,*:not(.callout) > h4,h5"},"toggle-chapters":{},"expandable-chapters":{}},"theme":"default","pdf":{"pageNumbers":true,"fontSize":12,"fontFamily":"Arial","paperSize":"a4","chapterMark":"pagebreak","pageBreaksBefore":"/","margin":{"right":62,"left":62,"top":56,"bottom":56}},"structure":{"langs":"LANGS.md","readme":"README.md","glossary":"GLOSSARY.md","summary":"SUMMARY.md"},"variables":{},"title":"Hivemall User Manual","links":{"sidebar":{"<i class=\"fa fa-home\"></i> Home":"http://hivemall.incubator.apache.org/"}},"gitbook":"3.x.x","description":"User Manual for Apache Hivemall"},"file":{"path":"binaryclass/kdd2010a_scw.md","mtime":"2016-11-16T08:39:12.000Z","type":"markdown"},"gitbook":{"version":"3.2.2","time":"2016-1 1-17T12:16:14.647Z"},"basePath":"..","book":{"language":""}}); }); </script> </div>
