Added: samza/site/learn/tutorials/0.10/deploy-samza-job-from-hdfs.html URL: http://svn.apache.org/viewvc/samza/site/learn/tutorials/0.10/deploy-samza-job-from-hdfs.html?rev=1721445&view=auto ============================================================================== --- samza/site/learn/tutorials/0.10/deploy-samza-job-from-hdfs.html (added) +++ samza/site/learn/tutorials/0.10/deploy-samza-job-from-hdfs.html Tue Dec 22 19:01:05 2015 @@ -0,0 +1,208 @@ +<!DOCTYPE html> +<!-- + Licensed to the Apache Software Foundation (ASF) under one or more + contributor license agreements. See the NOTICE file distributed with + this work for additional information regarding copyright ownership. + The ASF licenses this file to You under the Apache License, Version 2.0 + (the "License"); you may not use this file except in compliance with + the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. 
+--> +<html lang="en"> + <head> + <meta charset="utf-8"> + <title>Samza - Deploying a Samza job from HDFS</title> + <link href='/css/ropa-sans.css' rel='stylesheet' type='text/css'/> + <link href="/css/bootstrap.min.css" rel="stylesheet"/> + <link href="/css/font-awesome.min.css" rel="stylesheet"/> + <link href="/css/main.css" rel="stylesheet"/> + <link href="/css/syntax.css" rel="stylesheet"/> + <link rel="icon" type="image/png" href="/img/samza-icon.png"> + <script src="/js/jquery-1.11.1.min.js"></script> + </head> + <body> + <div class="wrapper"> + <div class="wrapper-content"> + + <div class="masthead"> + <div class="container"> + <div class="masthead-logo"> + <a href="/" class="logo">samza</a> + </div> + <div class="masthead-icons"> + <div class="pull-right"> + <a href="/startup/download"><i class="fa fa-arrow-circle-o-down masthead-icon"></i></a> + <a href="https://git-wip-us.apache.org/repos/asf?p=samza.git;a=tree" target="_blank"><i class="fa fa-code masthead-icon" style="font-weight: bold;"></i></a> + <a href="https://twitter.com/samzastream" target="_blank"><i class="fa fa-twitter masthead-icon"></i></a> + <!-- this icon only shows in versioned pages --> + + + + + <a href="http://samza.apache.org/learn/tutorials/latest/deploy-samza-job-from-hdfs.html"><i id="switch-version-button"></i></a> + <!-- links for the navigation bar --> + + + </div> + </div> + </div><!-- /.container --> + </div> + + <div class="container"> + <div class="menu"> + <h1><i class="fa fa-rocket"></i> Getting Started</h1> + <ul> + <li><a href="/startup/hello-samza/0.10">Hello Samza</a></li> + <li><a href="/startup/download">Download</a></li> + </ul> + + <h1><i class="fa fa-book"></i> Learn</h1> + <ul> + <li><a href="/learn/documentation/0.10">Documentation</a></li> + <li><a href="/learn/documentation/0.10/jobs/configuration-table.html">Configuration</a></li> + <li><a href="/learn/documentation/0.10/api/javadocs/">Javadocs</a></li> + <li><a href="/learn/tutorials/0.10">Tutorials</a></li> 
+ <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/FAQ">FAQ</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/Apache+Samza">Wiki</a></li> + <li><a href="https://cwiki.apache.org/confluence/pages/viewpage.action?pageId=51812876">Papers & Talks</a></li> + <li><a href="http://blogs.apache.org/samza">Blog</a></li> + </ul> + + <h1><i class="fa fa-comments"></i> Community</h1> + <ul> + <li><a href="/community/mailing-lists.html">Mailing Lists</a></li> + <li><a href="/community/irc.html">IRC</a></li> + <li><a href="https://issues.apache.org/jira/browse/SAMZA">Bugs</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/Powered+By">Powered by</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/Ecosystem">Ecosystem</a></li> + <li><a href="/community/committers.html">Committers</a></li> + </ul> + + <h1><i class="fa fa-code"></i> Contribute</h1> + <ul> + <li><a href="/contribute/rules.html">Rules</a></li> + <li><a href="/contribute/coding-guide.html">Coding Guide</a></li> + <li><a href="/contribute/projects.html">Projects</a></li> + <li><a href="/contribute/design-documents.html">Design Documents</a></li> + <li><a href="/contribute/code.html">Code</a></li> + <li><a href="https://reviews.apache.org/groups/samza">Review Board</a></li> + <li><a href="/contribute/tests.html">Tests</a></li> + </ul> + + <h1><i class="fa fa-history"></i> Archive</h1> + <ul> + <li><a href="/archive/index.html#latest">latest</a></li> + <li><a href="/archive/index.html#09">0.9</a></li> + <li><a href="/archive/index.html#08">0.8</a></li> + <li><a href="/archive/index.html#07">0.7</a></li> + </ul> + </div> + + <div class="content"> + <!-- + Licensed to the Apache Software Foundation (ASF) under one or more + contributor license agreements. See the NOTICE file distributed with + this work for additional information regarding copyright ownership. 
+ The ASF licenses this file to You under the Apache License, Version 2.0 + (the "License"); you may not use this file except in compliance with + the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +--> + +<h2>Deploying a Samza job from HDFS</h2> + +<!-- + Licensed to the Apache Software Foundation (ASF) under one or more + contributor license agreements. See the NOTICE file distributed with + this work for additional information regarding copyright ownership. + The ASF licenses this file to You under the Apache License, Version 2.0 + (the "License"); you may not use this file except in compliance with + the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +--> + +<p>This tutorial uses <a href="../../../startup/hello-samza/0.10/">hello-samza</a> to illustrate how to run a Samza job if you want to publish the Samza job’s .tar.gz package to HDFS.</p> + +<h3 id="upload-the-package">Upload the package</h3> + +<div class="highlight"><pre><code class="bash">hadoop fs -put ./target/hello-samza-0.10.0-dist.tar.gz /path/for/tgz</code></pre></div> + +<h3 id="add-hdfs-configuration">Add HDFS configuration</h3> + +<p>Put the hdfs-site.xml file of your cluster into ~/.samza/conf directory (The same place as the yarn-site.xml). 
If you set HADOOP_CONF_DIR, put the hdfs-site.xml in that configuration directory if it is not already there.</p> + +<h3 id="change-properties-file">Change properties file</h3> + +<p>Change the yarn.package.path in the properties file to your HDFS location.</p> + +<div class="highlight"><pre><code class="jproperties"><span class="na">yarn.package.path</span><span class="o">=</span><span class="s">hdfs://&lt;hdfs name node ip&gt;:&lt;hdfs name node port&gt;/path/to/tgz</span></code></pre></div> + +<p>Then you should be able to run the Samza job as described in <a href="../../../startup/hello-samza/0.10/">hello-samza</a>.</p> + + + </div> + </div> + + </div><!-- /.wrapper-content --> + </div><!-- /.wrapper --> + + <div class="footer"> + <div class="container"> + <!-- nothing for now. --> + </div> + </div> + + + <script> + $( document ).ready(function() { + if ( $.fn.urlExists( "/learn/tutorials/latest/deploy-samza-job-from-hdfs.html" ) ) { + $("#switch-version-button").addClass("fa fa-history masthead-icon"); + } + }); + + /* a function to test whether the url exists or not */ + (function( $ ) { + $.fn.urlExists = function(url) { + var http = new XMLHttpRequest(); + http.open('HEAD', url, false); + http.send(); + return http.status != 404; + }; + }( jQuery )); + </script> + + + <!-- Google Analytics --> + <script> + (function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){ + (i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o), + m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m) + })(window,document,'script','//www.google-analytics.com/analytics.js','ga'); + + ga('create', 'UA-43122768-1', 'apache.org'); + ga('send', 'pageview'); + + </script> + </body> +</html>
Added: samza/site/learn/tutorials/0.10/deploy-samza-to-CDH.html URL: http://svn.apache.org/viewvc/samza/site/learn/tutorials/0.10/deploy-samza-to-CDH.html?rev=1721445&view=auto ============================================================================== --- samza/site/learn/tutorials/0.10/deploy-samza-to-CDH.html (added) +++ samza/site/learn/tutorials/0.10/deploy-samza-to-CDH.html Tue Dec 22 19:01:05 2015 @@ -0,0 +1,220 @@ +<!DOCTYPE html> +<!-- + Licensed to the Apache Software Foundation (ASF) under one or more + contributor license agreements. See the NOTICE file distributed with + this work for additional information regarding copyright ownership. + The ASF licenses this file to You under the Apache License, Version 2.0 + (the "License"); you may not use this file except in compliance with + the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. 
+--> +<html lang="en"> + <head> + <meta charset="utf-8"> + <title>Samza - Deploy Samza Job To CDH</title> + <link href='/css/ropa-sans.css' rel='stylesheet' type='text/css'/> + <link href="/css/bootstrap.min.css" rel="stylesheet"/> + <link href="/css/font-awesome.min.css" rel="stylesheet"/> + <link href="/css/main.css" rel="stylesheet"/> + <link href="/css/syntax.css" rel="stylesheet"/> + <link rel="icon" type="image/png" href="/img/samza-icon.png"> + <script src="/js/jquery-1.11.1.min.js"></script> + </head> + <body> + <div class="wrapper"> + <div class="wrapper-content"> + + <div class="masthead"> + <div class="container"> + <div class="masthead-logo"> + <a href="/" class="logo">samza</a> + </div> + <div class="masthead-icons"> + <div class="pull-right"> + <a href="/startup/download"><i class="fa fa-arrow-circle-o-down masthead-icon"></i></a> + <a href="https://git-wip-us.apache.org/repos/asf?p=samza.git;a=tree" target="_blank"><i class="fa fa-code masthead-icon" style="font-weight: bold;"></i></a> + <a href="https://twitter.com/samzastream" target="_blank"><i class="fa fa-twitter masthead-icon"></i></a> + <!-- this icon only shows in versioned pages --> + + + + + <a href="http://samza.apache.org/learn/tutorials/latest/deploy-samza-to-CDH.html"><i id="switch-version-button"></i></a> + <!-- links for the navigation bar --> + + + </div> + </div> + </div><!-- /.container --> + </div> + + <div class="container"> + <div class="menu"> + <h1><i class="fa fa-rocket"></i> Getting Started</h1> + <ul> + <li><a href="/startup/hello-samza/0.10">Hello Samza</a></li> + <li><a href="/startup/download">Download</a></li> + </ul> + + <h1><i class="fa fa-book"></i> Learn</h1> + <ul> + <li><a href="/learn/documentation/0.10">Documentation</a></li> + <li><a href="/learn/documentation/0.10/jobs/configuration-table.html">Configuration</a></li> + <li><a href="/learn/documentation/0.10/api/javadocs/">Javadocs</a></li> + <li><a href="/learn/tutorials/0.10">Tutorials</a></li> + <li><a 
href="https://cwiki.apache.org/confluence/display/SAMZA/FAQ">FAQ</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/Apache+Samza">Wiki</a></li> + <li><a href="https://cwiki.apache.org/confluence/pages/viewpage.action?pageId=51812876">Papers & Talks</a></li> + <li><a href="http://blogs.apache.org/samza">Blog</a></li> + </ul> + + <h1><i class="fa fa-comments"></i> Community</h1> + <ul> + <li><a href="/community/mailing-lists.html">Mailing Lists</a></li> + <li><a href="/community/irc.html">IRC</a></li> + <li><a href="https://issues.apache.org/jira/browse/SAMZA">Bugs</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/Powered+By">Powered by</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/Ecosystem">Ecosystem</a></li> + <li><a href="/community/committers.html">Committers</a></li> + </ul> + + <h1><i class="fa fa-code"></i> Contribute</h1> + <ul> + <li><a href="/contribute/rules.html">Rules</a></li> + <li><a href="/contribute/coding-guide.html">Coding Guide</a></li> + <li><a href="/contribute/projects.html">Projects</a></li> + <li><a href="/contribute/design-documents.html">Design Documents</a></li> + <li><a href="/contribute/code.html">Code</a></li> + <li><a href="https://reviews.apache.org/groups/samza">Review Board</a></li> + <li><a href="/contribute/tests.html">Tests</a></li> + </ul> + + <h1><i class="fa fa-history"></i> Archive</h1> + <ul> + <li><a href="/archive/index.html#latest">latest</a></li> + <li><a href="/archive/index.html#09">0.9</a></li> + <li><a href="/archive/index.html#08">0.8</a></li> + <li><a href="/archive/index.html#07">0.7</a></li> + </ul> + </div> + + <div class="content"> + <!-- + Licensed to the Apache Software Foundation (ASF) under one or more + contributor license agreements. See the NOTICE file distributed with + this work for additional information regarding copyright ownership. 
+ The ASF licenses this file to You under the Apache License, Version 2.0 + (the "License"); you may not use this file except in compliance with + the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +--> + +<h2>Deploy Samza Job To CDH</h2> + +<!-- + Licensed to the Apache Software Foundation (ASF) under one or more + contributor license agreements. See the NOTICE file distributed with + this work for additional information regarding copyright ownership. + The ASF licenses this file to You under the Apache License, Version 2.0 + (the "License"); you may not use this file except in compliance with + the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +--> + +<p>The tutorial assumes you have successfully run <a href="../../../startup/hello-samza/0.10/">hello-samza</a> and now you want to deploy the job to your Cloudera Data Hub (<a href="http://www.cloudera.com/content/cloudera/en/products-and-services/cdh.html">CDH</a>). This tutorial is based on CDH 5.0.0 and uses hello-samza as the example job.</p> + +<h3 id="upload-package-to-cluster">Upload Package to Cluster</h3> + +<p>There are a few ways of uploading the package to the cluster’s HDFS. 
If you do not have the job package in your cluster, <strong>scp</strong> from your local machine to the cluster. Then run</p> + +<div class="highlight"><pre><code class="bash">hadoop fs -put path/to/hello-samza-0.10.0-dist.tar.gz /path/for/tgz</code></pre></div> + +<h3 id="get-deloying-scripts">Get Deploying Scripts</h3> + +<p>Untar the job package (assume you will run from the current directory)</p> + +<div class="highlight"><pre><code class="bash">tar -xvf path/to/samza-job-package-0.10.0-dist.tar.gz -C ./</code></pre></div> + +<h3 id="add-package-path-to-properties-file">Add Package Path to Properties File</h3> + +<div class="highlight"><pre><code class="bash">vim config/wikipedia-parser.properties</code></pre></div> + +<p>Change the yarn package path:</p> + +<div class="highlight"><pre><code class="jproperties"><span class="na">yarn.package.path</span><span class="o">=</span><span class="s">hdfs://&lt;hdfs name node ip&gt;:&lt;hdfs name node port&gt;/path/to/tgz</span></code></pre></div> + +<h3 id="set-yarn-environment-variable">Set Yarn Environment Variable</h3> + +<div class="highlight"><pre><code class="bash"><span class="nb">export </span><span class="nv">HADOOP_CONF_DIR</span><span class="o">=</span>/etc/hadoop/conf</code></pre></div> + +<h3 id="run-samza-job">Run Samza Job</h3> + +<div class="highlight"><pre><code class="bash">bin/run-job.sh --config-factory<span class="o">=</span>org.apache.samza.config.factories.PropertiesConfigFactory --config-path<span class="o">=</span>file://<span class="nv">$PWD</span>/config/wikipedia-parser.properties</code></pre></div> + + + </div> + </div> + + </div><!-- /.wrapper-content --> + </div><!-- /.wrapper --> + + <div class="footer"> + <div class="container"> + <!-- nothing for now. 
--> + </div> + </div> + + + <script> + $( document ).ready(function() { + if ( $.fn.urlExists( "/learn/tutorials/latest/deploy-samza-to-CDH.html" ) ) { + $("#switch-version-button").addClass("fa fa-history masthead-icon"); + } + }); + + /* a function to test whether the url exists or not */ + (function( $ ) { + $.fn.urlExists = function(url) { + var http = new XMLHttpRequest(); + http.open('HEAD', url, false); + http.send(); + return http.status != 404; + }; + }( jQuery )); + </script> + + + <!-- Google Analytics --> + <script> + (function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){ + (i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o), + m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m) + })(window,document,'script','//www.google-analytics.com/analytics.js','ga'); + + ga('create', 'UA-43122768-1', 'apache.org'); + ga('send', 'pageview'); + + </script> + </body> +</html> Added: samza/site/learn/tutorials/0.10/index.html URL: http://svn.apache.org/viewvc/samza/site/learn/tutorials/0.10/index.html?rev=1721445&view=auto ============================================================================== --- samza/site/learn/tutorials/0.10/index.html (added) +++ samza/site/learn/tutorials/0.10/index.html Tue Dec 22 19:01:05 2015 @@ -0,0 +1,211 @@ +<!DOCTYPE html> +<!-- + Licensed to the Apache Software Foundation (ASF) under one or more + contributor license agreements. See the NOTICE file distributed with + this work for additional information regarding copyright ownership. + The ASF licenses this file to You under the Apache License, Version 2.0 + (the "License"); you may not use this file except in compliance with + the License. 
You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +--> +<html lang="en"> + <head> + <meta charset="utf-8"> + <title>Samza - Tutorials</title> + <link href='/css/ropa-sans.css' rel='stylesheet' type='text/css'/> + <link href="/css/bootstrap.min.css" rel="stylesheet"/> + <link href="/css/font-awesome.min.css" rel="stylesheet"/> + <link href="/css/main.css" rel="stylesheet"/> + <link href="/css/syntax.css" rel="stylesheet"/> + <link rel="icon" type="image/png" href="/img/samza-icon.png"> + <script src="/js/jquery-1.11.1.min.js"></script> + </head> + <body> + <div class="wrapper"> + <div class="wrapper-content"> + + <div class="masthead"> + <div class="container"> + <div class="masthead-logo"> + <a href="/" class="logo">samza</a> + </div> + <div class="masthead-icons"> + <div class="pull-right"> + <a href="/startup/download"><i class="fa fa-arrow-circle-o-down masthead-icon"></i></a> + <a href="https://git-wip-us.apache.org/repos/asf?p=samza.git;a=tree" target="_blank"><i class="fa fa-code masthead-icon" style="font-weight: bold;"></i></a> + <a href="https://twitter.com/samzastream" target="_blank"><i class="fa fa-twitter masthead-icon"></i></a> + <!-- this icon only shows in versioned pages --> + + + + + <a href="http://samza.apache.org/learn/tutorials/latest/index.html"><i id="switch-version-button"></i></a> + <!-- links for the navigation bar --> + + + </div> + </div> + </div><!-- /.container --> + </div> + + <div class="container"> + <div class="menu"> + <h1><i class="fa fa-rocket"></i> Getting Started</h1> + <ul> + <li><a href="/startup/hello-samza/0.10">Hello Samza</a></li> + <li><a 
href="/startup/download">Download</a></li> + </ul> + + <h1><i class="fa fa-book"></i> Learn</h1> + <ul> + <li><a href="/learn/documentation/0.10">Documentation</a></li> + <li><a href="/learn/documentation/0.10/jobs/configuration-table.html">Configuration</a></li> + <li><a href="/learn/documentation/0.10/api/javadocs/">Javadocs</a></li> + <li><a href="/learn/tutorials/0.10">Tutorials</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/FAQ">FAQ</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/Apache+Samza">Wiki</a></li> + <li><a href="https://cwiki.apache.org/confluence/pages/viewpage.action?pageId=51812876">Papers & Talks</a></li> + <li><a href="http://blogs.apache.org/samza">Blog</a></li> + </ul> + + <h1><i class="fa fa-comments"></i> Community</h1> + <ul> + <li><a href="/community/mailing-lists.html">Mailing Lists</a></li> + <li><a href="/community/irc.html">IRC</a></li> + <li><a href="https://issues.apache.org/jira/browse/SAMZA">Bugs</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/Powered+By">Powered by</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/Ecosystem">Ecosystem</a></li> + <li><a href="/community/committers.html">Committers</a></li> + </ul> + + <h1><i class="fa fa-code"></i> Contribute</h1> + <ul> + <li><a href="/contribute/rules.html">Rules</a></li> + <li><a href="/contribute/coding-guide.html">Coding Guide</a></li> + <li><a href="/contribute/projects.html">Projects</a></li> + <li><a href="/contribute/design-documents.html">Design Documents</a></li> + <li><a href="/contribute/code.html">Code</a></li> + <li><a href="https://reviews.apache.org/groups/samza">Review Board</a></li> + <li><a href="/contribute/tests.html">Tests</a></li> + </ul> + + <h1><i class="fa fa-history"></i> Archive</h1> + <ul> + <li><a href="/archive/index.html#latest">latest</a></li> + <li><a href="/archive/index.html#09">0.9</a></li> + <li><a href="/archive/index.html#08">0.8</a></li> + 
<li><a href="/archive/index.html#07">0.7</a></li> + </ul> + </div> + + <div class="content"> + <!-- + Licensed to the Apache Software Foundation (ASF) under one or more + contributor license agreements. See the NOTICE file distributed with + this work for additional information regarding copyright ownership. + The ASF licenses this file to You under the Apache License, Version 2.0 + (the "License"); you may not use this file except in compliance with + the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +--> + +<h2>Tutorials</h2> + +<!-- + Licensed to the Apache Software Foundation (ASF) under one or more + contributor license agreements. See the NOTICE file distributed with + this work for additional information regarding copyright ownership. + The ASF licenses this file to You under the Apache License, Version 2.0 + (the "License"); you may not use this file except in compliance with + the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. 
+--> + +<p><a href="remote-debugging-samza.html">Remote Debugging with Samza</a></p> + +<p><a href="deploy-samza-job-from-hdfs.html">Deploying a Samza Job from HDFS</a></p> + +<p><a href="deploy-samza-to-CDH.html">Deploy Samza to CDH</a></p> + +<p><a href="run-in-multi-node-yarn.html">Run Hello-samza in Multi-node YARN</a></p> + +<p><a href="run-hello-samza-without-internet.html">Run Hello-samza without Internet</a></p> + +<!-- TODO a bunch of tutorials +[Log Walkthrough](log-walkthrough.html) +<a href="configuring-kafka-system.html">Configuring a Kafka System</a><br/> +<a href="joining-streams.html">Joining Streams</a><br/> +<a href="sort-stream.html">Sorting a Stream</a><br/> +<a href="group-by-count.html">Group-by and Counting</a><br/> +<a href="initialize-close.html">Initializing and Closing</a><br/> +<a href="windowing.html">Windowing</a><br/> +<a href="committing.html">Committing</a><br/> +--> + + + </div> + </div> + + </div><!-- /.wrapper-content --> + </div><!-- /.wrapper --> + + <div class="footer"> + <div class="container"> + <!-- nothing for now. 
--> + </div> + </div> + + + <script> + $( document ).ready(function() { + if ( $.fn.urlExists( "/learn/tutorials/latest/index.html" ) ) { + $("#switch-version-button").addClass("fa fa-history masthead-icon"); + } + }); + + /* a function to test whether the url exists or not */ + (function( $ ) { + $.fn.urlExists = function(url) { + var http = new XMLHttpRequest(); + http.open('HEAD', url, false); + http.send(); + return http.status != 404; + }; + }( jQuery )); + </script> + + + <!-- Google Analytics --> + <script> + (function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){ + (i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o), + m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m) + })(window,document,'script','//www.google-analytics.com/analytics.js','ga'); + + ga('create', 'UA-43122768-1', 'apache.org'); + ga('send', 'pageview'); + + </script> + </body> +</html> Added: samza/site/learn/tutorials/0.10/remote-debugging-samza.html URL: http://svn.apache.org/viewvc/samza/site/learn/tutorials/0.10/remote-debugging-samza.html?rev=1721445&view=auto ============================================================================== --- samza/site/learn/tutorials/0.10/remote-debugging-samza.html (added) +++ samza/site/learn/tutorials/0.10/remote-debugging-samza.html Tue Dec 22 19:01:05 2015 @@ -0,0 +1,254 @@ +<!DOCTYPE html> +<!-- + Licensed to the Apache Software Foundation (ASF) under one or more + contributor license agreements. See the NOTICE file distributed with + this work for additional information regarding copyright ownership. + The ASF licenses this file to You under the Apache License, Version 2.0 + (the "License"); you may not use this file except in compliance with + the License. 
You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +--> +<html lang="en"> + <head> + <meta charset="utf-8"> + <title>Samza - Remote Debugging with Samza</title> + <link href='/css/ropa-sans.css' rel='stylesheet' type='text/css'/> + <link href="/css/bootstrap.min.css" rel="stylesheet"/> + <link href="/css/font-awesome.min.css" rel="stylesheet"/> + <link href="/css/main.css" rel="stylesheet"/> + <link href="/css/syntax.css" rel="stylesheet"/> + <link rel="icon" type="image/png" href="/img/samza-icon.png"> + <script src="/js/jquery-1.11.1.min.js"></script> + </head> + <body> + <div class="wrapper"> + <div class="wrapper-content"> + + <div class="masthead"> + <div class="container"> + <div class="masthead-logo"> + <a href="/" class="logo">samza</a> + </div> + <div class="masthead-icons"> + <div class="pull-right"> + <a href="/startup/download"><i class="fa fa-arrow-circle-o-down masthead-icon"></i></a> + <a href="https://git-wip-us.apache.org/repos/asf?p=samza.git;a=tree" target="_blank"><i class="fa fa-code masthead-icon" style="font-weight: bold;"></i></a> + <a href="https://twitter.com/samzastream" target="_blank"><i class="fa fa-twitter masthead-icon"></i></a> + <!-- this icon only shows in versioned pages --> + + + + + <a href="http://samza.apache.org/learn/tutorials/latest/remote-debugging-samza.html"><i id="switch-version-button"></i></a> + <!-- links for the navigation bar --> + + + </div> + </div> + </div><!-- /.container --> + </div> + + <div class="container"> + <div class="menu"> + <h1><i class="fa fa-rocket"></i> Getting Started</h1> + <ul> + <li><a href="/startup/hello-samza/0.10">Hello Samza</a></li> + 
<li><a href="/startup/download">Download</a></li> + </ul> + + <h1><i class="fa fa-book"></i> Learn</h1> + <ul> + <li><a href="/learn/documentation/0.10">Documentation</a></li> + <li><a href="/learn/documentation/0.10/jobs/configuration-table.html">Configuration</a></li> + <li><a href="/learn/documentation/0.10/api/javadocs/">Javadocs</a></li> + <li><a href="/learn/tutorials/0.10">Tutorials</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/FAQ">FAQ</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/Apache+Samza">Wiki</a></li> + <li><a href="https://cwiki.apache.org/confluence/pages/viewpage.action?pageId=51812876">Papers & Talks</a></li> + <li><a href="http://blogs.apache.org/samza">Blog</a></li> + </ul> + + <h1><i class="fa fa-comments"></i> Community</h1> + <ul> + <li><a href="/community/mailing-lists.html">Mailing Lists</a></li> + <li><a href="/community/irc.html">IRC</a></li> + <li><a href="https://issues.apache.org/jira/browse/SAMZA">Bugs</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/Powered+By">Powered by</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/Ecosystem">Ecosystem</a></li> + <li><a href="/community/committers.html">Committers</a></li> + </ul> + + <h1><i class="fa fa-code"></i> Contribute</h1> + <ul> + <li><a href="/contribute/rules.html">Rules</a></li> + <li><a href="/contribute/coding-guide.html">Coding Guide</a></li> + <li><a href="/contribute/projects.html">Projects</a></li> + <li><a href="/contribute/design-documents.html">Design Documents</a></li> + <li><a href="/contribute/code.html">Code</a></li> + <li><a href="https://reviews.apache.org/groups/samza">Review Board</a></li> + <li><a href="/contribute/tests.html">Tests</a></li> + </ul> + + <h1><i class="fa fa-history"></i> Archive</h1> + <ul> + <li><a href="/archive/index.html#latest">latest</a></li> + <li><a href="/archive/index.html#09">0.9</a></li> + <li><a 
href="/archive/index.html#08">0.8</a></li> + <li><a href="/archive/index.html#07">0.7</a></li> + </ul> + </div> + + <div class="content"> + <!-- + Licensed to the Apache Software Foundation (ASF) under one or more + contributor license agreements. See the NOTICE file distributed with + this work for additional information regarding copyright ownership. + The ASF licenses this file to You under the Apache License, Version 2.0 + (the "License"); you may not use this file except in compliance with + the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +--> + +<h2>Remote Debugging with Samza</h2> + +<!-- + Licensed to the Apache Software Foundation (ASF) under one or more + contributor license agreements. See the NOTICE file distributed with + this work for additional information regarding copyright ownership. + The ASF licenses this file to You under the Apache License, Version 2.0 + (the "License"); you may not use this file except in compliance with + the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +--> + +<p>Let’s use Eclipse to attach a remote debugger to a Samza container. If you’re an IntelliJ user, you’ll have to fill in the blanks, but the process should be pretty similar. 
This tutorial assumes you’ve already run through the <a href="../../../startup/hello-samza/0.10/">Hello Samza</a> tutorial.</p> + +<h3 id="get-the-code">Get the Code</h3> + +<p>Start by checking out Samza, so we have access to the source.</p> + +<div class="highlight"><pre><code class="bash">git clone http://git-wip-us.apache.org/repos/asf/samza.git</code></pre></div> + +<p>Next, grab hello-samza.</p> + +<div class="highlight"><pre><code class="bash">git clone https://git.apache.org/samza-hello-samza.git</code></pre></div> + +<h3 id="setup-the-environment">Setup the Environment</h3> + +<p>Now, let’s setup the Eclipse project files.</p> + +<div class="highlight"><pre><code class="bash"><span class="nb">cd </span>samza +./gradlew eclipse</code></pre></div> + +<p>Let’s also release Samza to Maven’s local repository, so hello-samza has access to the JARs that it needs.</p> + +<div class="highlight"><pre><code class="bash">./gradlew -PscalaVersion<span class="o">=</span>2.10 clean publishToMavenLocal</code></pre></div> + +<p>Next, open Eclipse, and import the Samza source code into your workspace: “File” > “Import” > “Existing Projects into Workspace” > “Browse”. Select ‘samza’ folder, and hit ‘finish’.</p> + +<h3 id="enable-remote-debugging">Enable Remote Debugging</h3> + +<p>Now, go back to the hello-samza project, and edit ./src/main/config/wikipedia-feed.properties to add the following line:</p> + +<div class="highlight"><pre><code class="jproperties"><span class="na">task.opts</span><span class="o">=</span><span class="s">-agentlib:jdwp=transport=dt_socket,address=localhost:9009,server=y,suspend=y</span></code></pre></div> + +<p>The <a href="../../documentation/0.10/jobs/configuration-table.html">task.opts</a> configuration parameter is a way to override Java parameters at runtime for your Samza containers. In this example, we’re setting the agentlib parameter to enable remote debugging on localhost, port 9009. 
In a more realistic environment, you might also set Java heap settings (-Xmx, -Xms, etc), as well as garbage collection and logging settings.</p> + +<p><em>NOTE: If you’re running multiple Samza containers on the same machine, there is a potential for port collisions. You must configure your task.opts to assign different ports for different Samza jobs. If a Samza job has more than one container (e.g. if you’re using YARN with yarn.container.count=2), those containers must be run on different machines.</em></p> + +<h3 id="start-the-grid">Start the Grid</h3> + +<p>Now that the Samza job has been setup to enable remote debugging when a Samza container starts, let’s start the ZooKeeper, Kafka, and YARN.</p> + +<div class="highlight"><pre><code class="bash">bin/grid</code></pre></div> + +<p>If you get a complaint that JAVA_HOME is not set, then you’ll need to set it. This can be done on OSX by running:</p> + +<div class="highlight"><pre><code class="bash"><span class="nb">export </span><span class="nv">JAVA_HOME</span><span class="o">=</span><span class="k">$(</span>/usr/libexec/java_home<span class="k">)</span></code></pre></div> + +<p>Once the grid starts, you can start the wikipedia-feed Samza job.</p> + +<div class="highlight"><pre><code class="bash">mvn clean package +mkdir -p deploy/samza +tar -xvf ./target/hello-samza-0.10.0-dist.tar.gz -C deploy/samza +deploy/samza/bin/run-job.sh --config-factory<span class="o">=</span>org.apache.samza.config.factories.PropertiesConfigFactory --config-path<span class="o">=</span>file://<span class="nv">$PWD</span>/deploy/samza/config/wikipedia-feed.properties</code></pre></div> + +<p>When the wikipedia-feed job starts up, a single Samza container will be created to process all incoming messages. 
This is the container that we’ll want to connect to from the remote debugger.</p> + +<h3 id="connect-the-remote-debugger">Connect the Remote Debugger</h3> + +<p>Switch back to Eclipse, and set a break point in TaskInstance.process by clicking on a line inside TaskInstance.process, and clicking “Run” > “Toggle Breakpoint”. A blue circle should appear to the left of the line. This will let you see incoming messages as they arrive.</p> + +<p>Setup a remote debugging session: “Run” > “Debug Configurations…” > right click on “Remote Java Application” > “New”. Set the name to ‘wikipedia-feed-debug’. Set the port to 9009 (matching the port in the task.opts configuration). Click “Source” > “Add…” > “Java Project”. Select all of the Samza projects that you imported (i.e. samza-api, samza-core, etc). If you would like to set breakpoints in your own Stream task, also add the project that contains your StreamTask implementation. Click ‘Debug’.</p> + +<p>After a few moments, Eclipse should connect to the wikipedia-feed job, and ask you to switch to Debug mode. Once in debug, you’ll see that it’s broken at the TaskInstance.process method. From here, you can step through code, inspect variable values, etc.</p> + +<p>Congratulations, you’ve got a remote debug connection to your StreamTask!</p> + + + </div> + </div> + + </div><!-- /.wrapper-content --> + </div><!-- /.wrapper --> + + <div class="footer"> + <div class="container"> + <!-- nothing for now. 
--> + </div> + </div> + + + <script> + $( document ).ready(function() { + if ( $.fn.urlExists( "/learn/tutorials/latest/remote-debugging-samza.html" ) ) { + $("#switch-version-button").addClass("fa fa-history masthead-icon"); + } + }); + + /* a function to test whether the url exists or not */ + (function( $ ) { + $.fn.urlExists = function(url) { + var http = new XMLHttpRequest(); + http.open('HEAD', url, false); + http.send(); + return http.status != 404; + }; + }( jQuery )); + </script> + + + <!-- Google Analytics --> + <script> + (function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){ + (i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o), + m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m) + })(window,document,'script','//www.google-analytics.com/analytics.js','ga'); + + ga('create', 'UA-43122768-1', 'apache.org'); + ga('send', 'pageview'); + + </script> + </body> +</html> Added: samza/site/learn/tutorials/0.10/run-hello-samza-without-internet.html URL: http://svn.apache.org/viewvc/samza/site/learn/tutorials/0.10/run-hello-samza-without-internet.html?rev=1721445&view=auto ============================================================================== --- samza/site/learn/tutorials/0.10/run-hello-samza-without-internet.html (added) +++ samza/site/learn/tutorials/0.10/run-hello-samza-without-internet.html Tue Dec 22 19:01:05 2015 @@ -0,0 +1,233 @@ +<!DOCTYPE html> +<!-- + Licensed to the Apache Software Foundation (ASF) under one or more + contributor license agreements. See the NOTICE file distributed with + this work for additional information regarding copyright ownership. + The ASF licenses this file to You under the Apache License, Version 2.0 + (the "License"); you may not use this file except in compliance with + the License. 
You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +--> +<html lang="en"> + <head> + <meta charset="utf-8"> + <title>Samza - Run Hello Samza without Internet</title> + <link href='/css/ropa-sans.css' rel='stylesheet' type='text/css'/> + <link href="/css/bootstrap.min.css" rel="stylesheet"/> + <link href="/css/font-awesome.min.css" rel="stylesheet"/> + <link href="/css/main.css" rel="stylesheet"/> + <link href="/css/syntax.css" rel="stylesheet"/> + <link rel="icon" type="image/png" href="/img/samza-icon.png"> + <script src="/js/jquery-1.11.1.min.js"></script> + </head> + <body> + <div class="wrapper"> + <div class="wrapper-content"> + + <div class="masthead"> + <div class="container"> + <div class="masthead-logo"> + <a href="/" class="logo">samza</a> + </div> + <div class="masthead-icons"> + <div class="pull-right"> + <a href="/startup/download"><i class="fa fa-arrow-circle-o-down masthead-icon"></i></a> + <a href="https://git-wip-us.apache.org/repos/asf?p=samza.git;a=tree" target="_blank"><i class="fa fa-code masthead-icon" style="font-weight: bold;"></i></a> + <a href="https://twitter.com/samzastream" target="_blank"><i class="fa fa-twitter masthead-icon"></i></a> + <!-- this icon only shows in versioned pages --> + + + + + <a href="http://samza.apache.org/learn/tutorials/latest/run-hello-samza-without-internet.html"><i id="switch-version-button"></i></a> + <!-- links for the navigation bar --> + + + </div> + </div> + </div><!-- /.container --> + </div> + + <div class="container"> + <div class="menu"> + <h1><i class="fa fa-rocket"></i> Getting Started</h1> + <ul> + <li><a href="/startup/hello-samza/0.10">Hello 
Samza</a></li> + <li><a href="/startup/download">Download</a></li> + </ul> + + <h1><i class="fa fa-book"></i> Learn</h1> + <ul> + <li><a href="/learn/documentation/0.10">Documentation</a></li> + <li><a href="/learn/documentation/0.10/jobs/configuration-table.html">Configuration</a></li> + <li><a href="/learn/documentation/0.10/api/javadocs/">Javadocs</a></li> + <li><a href="/learn/tutorials/0.10">Tutorials</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/FAQ">FAQ</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/Apache+Samza">Wiki</a></li> + <li><a href="https://cwiki.apache.org/confluence/pages/viewpage.action?pageId=51812876">Papers & Talks</a></li> + <li><a href="http://blogs.apache.org/samza">Blog</a></li> + </ul> + + <h1><i class="fa fa-comments"></i> Community</h1> + <ul> + <li><a href="/community/mailing-lists.html">Mailing Lists</a></li> + <li><a href="/community/irc.html">IRC</a></li> + <li><a href="https://issues.apache.org/jira/browse/SAMZA">Bugs</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/Powered+By">Powered by</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/Ecosystem">Ecosystem</a></li> + <li><a href="/community/committers.html">Committers</a></li> + </ul> + + <h1><i class="fa fa-code"></i> Contribute</h1> + <ul> + <li><a href="/contribute/rules.html">Rules</a></li> + <li><a href="/contribute/coding-guide.html">Coding Guide</a></li> + <li><a href="/contribute/projects.html">Projects</a></li> + <li><a href="/contribute/design-documents.html">Design Documents</a></li> + <li><a href="/contribute/code.html">Code</a></li> + <li><a href="https://reviews.apache.org/groups/samza">Review Board</a></li> + <li><a href="/contribute/tests.html">Tests</a></li> + </ul> + + <h1><i class="fa fa-history"></i> Archive</h1> + <ul> + <li><a href="/archive/index.html#latest">latest</a></li> + <li><a href="/archive/index.html#09">0.9</a></li> + <li><a 
href="/archive/index.html#08">0.8</a></li> + <li><a href="/archive/index.html#07">0.7</a></li> + </ul> + </div> + + <div class="content"> + <!-- + Licensed to the Apache Software Foundation (ASF) under one or more + contributor license agreements. See the NOTICE file distributed with + this work for additional information regarding copyright ownership. + The ASF licenses this file to You under the Apache License, Version 2.0 + (the "License"); you may not use this file except in compliance with + the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +--> + +<h2>Run Hello Samza without Internet</h2> + +<!-- + Licensed to the Apache Software Foundation (ASF) under one or more + contributor license agreements. See the NOTICE file distributed with + this work for additional information regarding copyright ownership. + The ASF licenses this file to You under the Apache License, Version 2.0 + (the "License"); you may not use this file except in compliance with + the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +--> + +<p>This tutorial is to help you run <a href="../../../startup/hello-samza/0.10/">Hello Samza</a> if you can not connect to the internet. </p> + +<h3 id="test-your-connection">Test Your Connection</h3> + +<p>Ping irc.wikimedia.org. 
Sometimes the firewall in your company blocks this service.</p> + +<div class="highlight"><pre><code class="bash">telnet irc.wikimedia.org 6667</code></pre></div> + +<p>You should see something like this:</p> +<div class="highlight"><pre><code class="language-text" data-lang="text">Trying 208.80.152.178... +Connected to ekrem.wikimedia.org. +Escape character is '^]'. +NOTICE AUTH :*** Processing connection to irc.pmtpa.wikimedia.org +NOTICE AUTH :*** Looking up your hostname... +NOTICE AUTH :*** Checking Ident +NOTICE AUTH :*** Found your hostname +</code></pre></div> +<p>Otherwise, you may have a connection problem.</p> + +<h3 id="use-local-data-to-run-hello-samza">Use Local Data to Run Hello Samza</h3> + +<p>We provide an alternative to get wikipedia feed data. Instead of running</p> + +<div class="highlight"><pre><code class="bash">deploy/samza/bin/run-job.sh --config-factory<span class="o">=</span>org.apache.samza.config.factories.PropertiesConfigFactory --config-path<span class="o">=</span>file://<span class="nv">$PWD</span>/deploy/samza/config/wikipedia-feed.properties</code></pre></div> + +<p>You will run</p> + +<div class="highlight"><pre><code class="bash">bin/produce-wikipedia-raw-data.sh</code></pre></div> + +<p>This script will read wikipedia feed data from a local file and produce it to the Kafka broker. By default, it produces to localhost:9092 as the Kafka broker and uses localhost:2181 as zookeeper.
You can override them:</p> + +<div class="highlight"><pre><code class="bash">bin/produce-wikipedia-raw-data.sh -b yourKafkaBrokerAddress -z yourZookeeperAddress</code></pre></div> + +<p>Now you can go back to the Generate Wikipedia Statistics section in <a href="../../../startup/hello-samza/0.10/">Hello Samza</a> and follow the remaining steps.</p> + +<h3 id="a-little-explanation">A Little Explanation</h3> + +<p>The goal of</p> + +<div class="highlight"><pre><code class="bash">deploy/samza/bin/run-job.sh --config-factory<span class="o">=</span>org.apache.samza.config.factories.PropertiesConfigFactory --config-path<span class="o">=</span>file://<span class="nv">$PWD</span>/deploy/samza/config/wikipedia-feed.properties</code></pre></div> + +<p>is to deploy a Samza job which listens to the Wikipedia API, receives the feed in realtime and produces the feed to the Kafka topic wikipedia-raw. The alternative in this tutorial is reading a local wikipedia feed in an infinite loop and producing the data to the Kafka topic wikipedia-raw. The follow-up job, wikipedia-parser, gets data from the Kafka topic wikipedia-raw, so as long as we have correct data in the Kafka topic wikipedia-raw, we are fine. All Samza jobs are connected by Kafka and do not depend on each other.</p> + + + </div> + </div> + + </div><!-- /.wrapper-content --> + </div><!-- /.wrapper --> + + <div class="footer"> + <div class="container"> + <!-- nothing for now.
--> + </div> + </div> + + + <script> + $( document ).ready(function() { + if ( $.fn.urlExists( "/learn/tutorials/latest/run-hello-samza-without-internet.html" ) ) { + $("#switch-version-button").addClass("fa fa-history masthead-icon"); + } + }); + + /* a function to test whether the url exists or not */ + (function( $ ) { + $.fn.urlExists = function(url) { + var http = new XMLHttpRequest(); + http.open('HEAD', url, false); + http.send(); + return http.status != 404; + }; + }( jQuery )); + </script> + + + <!-- Google Analytics --> + <script> + (function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){ + (i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o), + m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m) + })(window,document,'script','//www.google-analytics.com/analytics.js','ga'); + + ga('create', 'UA-43122768-1', 'apache.org'); + ga('send', 'pageview'); + + </script> + </body> +</html> Added: samza/site/learn/tutorials/0.10/run-in-multi-node-yarn.html URL: http://svn.apache.org/viewvc/samza/site/learn/tutorials/0.10/run-in-multi-node-yarn.html?rev=1721445&view=auto ============================================================================== --- samza/site/learn/tutorials/0.10/run-in-multi-node-yarn.html (added) +++ samza/site/learn/tutorials/0.10/run-in-multi-node-yarn.html Tue Dec 22 19:01:05 2015 @@ -0,0 +1,314 @@ +<!DOCTYPE html> +<!-- + Licensed to the Apache Software Foundation (ASF) under one or more + contributor license agreements. See the NOTICE file distributed with + this work for additional information regarding copyright ownership. + The ASF licenses this file to You under the Apache License, Version 2.0 + (the "License"); you may not use this file except in compliance with + the License. 
You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +--> +<html lang="en"> + <head> + <meta charset="utf-8"> + <title>Samza - Run Hello-samza in Multi-node YARN</title> + <link href='/css/ropa-sans.css' rel='stylesheet' type='text/css'/> + <link href="/css/bootstrap.min.css" rel="stylesheet"/> + <link href="/css/font-awesome.min.css" rel="stylesheet"/> + <link href="/css/main.css" rel="stylesheet"/> + <link href="/css/syntax.css" rel="stylesheet"/> + <link rel="icon" type="image/png" href="/img/samza-icon.png"> + <script src="/js/jquery-1.11.1.min.js"></script> + </head> + <body> + <div class="wrapper"> + <div class="wrapper-content"> + + <div class="masthead"> + <div class="container"> + <div class="masthead-logo"> + <a href="/" class="logo">samza</a> + </div> + <div class="masthead-icons"> + <div class="pull-right"> + <a href="/startup/download"><i class="fa fa-arrow-circle-o-down masthead-icon"></i></a> + <a href="https://git-wip-us.apache.org/repos/asf?p=samza.git;a=tree" target="_blank"><i class="fa fa-code masthead-icon" style="font-weight: bold;"></i></a> + <a href="https://twitter.com/samzastream" target="_blank"><i class="fa fa-twitter masthead-icon"></i></a> + <!-- this icon only shows in versioned pages --> + + + + + <a href="http://samza.apache.org/learn/tutorials/latest/run-in-multi-node-yarn.html"><i id="switch-version-button"></i></a> + <!-- links for the navigation bar --> + + + </div> + </div> + </div><!-- /.container --> + </div> + + <div class="container"> + <div class="menu"> + <h1><i class="fa fa-rocket"></i> Getting Started</h1> + <ul> + <li><a href="/startup/hello-samza/0.10">Hello Samza</a></li> 
+ <li><a href="/startup/download">Download</a></li> + </ul> + + <h1><i class="fa fa-book"></i> Learn</h1> + <ul> + <li><a href="/learn/documentation/0.10">Documentation</a></li> + <li><a href="/learn/documentation/0.10/jobs/configuration-table.html">Configuration</a></li> + <li><a href="/learn/documentation/0.10/api/javadocs/">Javadocs</a></li> + <li><a href="/learn/tutorials/0.10">Tutorials</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/FAQ">FAQ</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/Apache+Samza">Wiki</a></li> + <li><a href="https://cwiki.apache.org/confluence/pages/viewpage.action?pageId=51812876">Papers & Talks</a></li> + <li><a href="http://blogs.apache.org/samza">Blog</a></li> + </ul> + + <h1><i class="fa fa-comments"></i> Community</h1> + <ul> + <li><a href="/community/mailing-lists.html">Mailing Lists</a></li> + <li><a href="/community/irc.html">IRC</a></li> + <li><a href="https://issues.apache.org/jira/browse/SAMZA">Bugs</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/Powered+By">Powered by</a></li> + <li><a href="https://cwiki.apache.org/confluence/display/SAMZA/Ecosystem">Ecosystem</a></li> + <li><a href="/community/committers.html">Committers</a></li> + </ul> + + <h1><i class="fa fa-code"></i> Contribute</h1> + <ul> + <li><a href="/contribute/rules.html">Rules</a></li> + <li><a href="/contribute/coding-guide.html">Coding Guide</a></li> + <li><a href="/contribute/projects.html">Projects</a></li> + <li><a href="/contribute/design-documents.html">Design Documents</a></li> + <li><a href="/contribute/code.html">Code</a></li> + <li><a href="https://reviews.apache.org/groups/samza">Review Board</a></li> + <li><a href="/contribute/tests.html">Tests</a></li> + </ul> + + <h1><i class="fa fa-history"></i> Archive</h1> + <ul> + <li><a href="/archive/index.html#latest">latest</a></li> + <li><a href="/archive/index.html#09">0.9</a></li> + <li><a 
href="/archive/index.html#08">0.8</a></li> + <li><a href="/archive/index.html#07">0.7</a></li> + </ul> + </div> + + <div class="content"> + <!-- + Licensed to the Apache Software Foundation (ASF) under one or more + contributor license agreements. See the NOTICE file distributed with + this work for additional information regarding copyright ownership. + The ASF licenses this file to You under the Apache License, Version 2.0 + (the "License"); you may not use this file except in compliance with + the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +--> + +<h2>Run Hello-samza in Multi-node YARN</h2> + +<!-- + Licensed to the Apache Software Foundation (ASF) under one or more + contributor license agreements. See the NOTICE file distributed with + this work for additional information regarding copyright ownership. + The ASF licenses this file to You under the Apache License, Version 2.0 + (the "License"); you may not use this file except in compliance with + the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +--> + +<p>You must successfully run the <a href="../../../startup/hello-samza/0.10/">hello-samza</a> project in a single-node YARN by following the <a href="../../../startup/hello-samza/0.10/">hello-samza</a> tutorial. 
Now it’s time to run the Samza job in a “real” YARN grid (with more than one node).</p> + +<h2 id="set-up-multi-node-yarn">Set Up Multi-node YARN</h2> + +<p>If you already have a multi-node YARN cluster (such as CDH5 cluster), you can skip this set-up section.</p> + +<h3 id="basic-yarn-setting">Basic YARN Setting</h3> + +<p>1. Download <a href="http://mirror.symnds.com/software/Apache/hadoop/common/hadoop-2.6.1/hadoop-2.6.1.tar.gz">YARN 2.6</a> to /tmp and untar it.</p> + +<div class="highlight"><pre><code class="bash"><span class="nb">cd</span> /tmp +tar -xvf hadoop-2.6.1.tar.gz +<span class="nb">cd </span>hadoop-2.6.1</code></pre></div> + +<p>2. Set up environment variables.</p> + +<div class="highlight"><pre><code class="bash"><span class="nb">export </span><span class="nv">HADOOP_YARN_HOME</span><span class="o">=</span><span class="k">$(</span><span class="nb">pwd</span><span class="k">)</span> +mkdir conf +<span class="nb">export </span><span class="nv">HADOOP_CONF_DIR</span><span class="o">=</span><span class="nv">$HADOOP_YARN_HOME</span>/conf</code></pre></div> + +<p>3. 
Configure YARN setting file.</p> + +<div class="highlight"><pre><code class="bash">cp ./etc/hadoop/yarn-site.xml conf +vi conf/yarn-site.xml</code></pre></div> + +<p>Add the following property to yarn-site.xml:</p> + +<div class="highlight"><pre><code class="xml"><span class="nt"><property></span> + <span class="nt"><name></span>yarn.resourcemanager.hostname<span class="nt"></name></span> + <span class="c"><!-- hostname that is accessible from all NMs --></span> + <span class="nt"><value></span>yourHostname<span class="nt"></value></span> +<span class="nt"></property></span></code></pre></div> + +<p>Download and add capacity-scheduler.xml.</p> +<div class="highlight"><pre><code class="language-text" data-lang="text">curl http://svn.apache.org/viewvc/hadoop/common/trunk/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-tests/src/test/resources/capacity-scheduler.xml?view=co > conf/capacity-scheduler.xml +</code></pre></div> +<h3 id="set-up-http-filesystem-for-yarn">Set Up Http Filesystem for YARN</h3> + +<p>The goal of these steps is to configure YARN to read http filesystem because we will use Http server to deploy Samza job package. If you want to use HDFS to deploy Samza job package, you can skip steps 4~6 and follow <a href="deploy-samza-job-from-hdfs.html">Deploying a Samza Job from HDFS</a>.</p> + +<p>4. Download Scala package and untar it.</p> + +<div class="highlight"><pre><code class="bash"><span class="nb">cd</span> /tmp +curl http://www.scala-lang.org/files/archive/scala-2.10.4.tgz > scala-2.10.4.tgz +tar -xvf scala-2.10.4.tgz</code></pre></div> + +<p>5.
Add Scala, its log jars, and Samza’s HttpFileSystem implementation.</p> + +<div class="highlight"><pre><code class="bash">cp /tmp/scala-2.10.4/lib/scala-compiler.jar <span class="nv">$HADOOP_YARN_HOME</span>/share/hadoop/hdfs/lib +cp /tmp/scala-2.10.4/lib/scala-library.jar <span class="nv">$HADOOP_YARN_HOME</span>/share/hadoop/hdfs/lib +curl -L http://search.maven.org/remotecontent?filepath<span class="o">=</span>org/clapper/grizzled-slf4j_2.10/1.0.1/grizzled-slf4j_2.10-1.0.1.jar > <span class="nv">$HADOOP_YARN_HOME</span>/share/hadoop/hdfs/lib/grizzled-slf4j_2.10-1.0.1.jar +curl -L http://search.maven.org/remotecontent?filepath<span class="o">=</span>org/apache/samza/samza-yarn_2.10/0.10.0/samza-yarn_2.10-0.10.0.jar > <span class="nv">$HADOOP_YARN_HOME</span>/share/hadoop/hdfs/lib/samza-yarn_2.10-0.10.0.jar +curl -L http://search.maven.org/remotecontent?filepath<span class="o">=</span>org/apache/samza/samza-core_2.10/0.10.0/samza-core_2.10-0.10.0.jar > <span class="nv">$HADOOP_YARN_HOME</span>/share/hadoop/hdfs/lib/samza-core_2.10-0.10.0.jar</code></pre></div> + +<p>6. Add http configuration in core-site.xml (create the core-site.xml file and add content).</p> + +<div class="highlight"><pre><code class="xml">vi $HADOOP_YARN_HOME/conf/core-site.xml</code></pre></div> + +<p>Add the following code:</p> + +<div class="highlight"><pre><code class="xml"><span class="cp"><?xml-stylesheet type="text/xsl" href="configuration.xsl"?></span> +<span class="nt"><configuration></span> + <span class="nt"><property></span> + <span class="nt"><name></span>fs.http.impl<span class="nt"></name></span> + <span class="nt"><value></span>org.apache.samza.util.hadoop.HttpFileSystem<span class="nt"></value></span> + <span class="nt"></property></span> +<span class="nt"></configuration></span></code></pre></div> + +<h3 id="distribute-hadoop-file-to-slaves">Distribute Hadoop File to Slaves</h3> + +<p>7. Basically, you copy the hadoop file in your host machine to slave machines. 
(172.21.100.35, in my case):</p> + +<div class="highlight"><pre><code class="bash">scp -r . 172.21.100.35:/tmp/hadoop-2.6.1 +<span class="nb">echo </span>172.21.100.35 > conf/slaves +sbin/start-yarn.sh</code></pre></div> + +<ul> +<li>If you get “172.21.100.35: Error: JAVA_HOME is not set and could not be found.”, you’ll need to add a conf/hadoop-env.sh file to the machine with the failure (172.21.100.35, in this case), which has “export JAVA_HOME=/export/apps/jdk/JDK-1_8_0_45” (or wherever your JAVA_HOME actually is).</li> +</ul> + +<p>8. Validate that your nodes are up by visiting http://yourHostname:8088/cluster/nodes.</p> + +<h2 id="deploy-samza-job">Deploy Samza Job</h2> + +<p>Some of the following steps are exactly identical to what you have seen in <a href="../../../startup/hello-samza/0.10/">hello-samza</a>. You may skip them if you have already done so.</p> + +<p>1. Download Samza and publish it to Maven local repository.</p> + +<div class="highlight"><pre><code class="bash"><span class="nb">cd</span> /tmp +git clone http://git-wip-us.apache.org/repos/asf/samza.git +<span class="nb">cd </span>samza +./gradlew clean publishToMavenLocal +<span class="nb">cd</span> ..</code></pre></div> + +<p>2. Download hello-samza project and change the job properties file.</p> + +<div class="highlight"><pre><code class="bash">git clone git://github.com/linkedin/hello-samza.git +<span class="nb">cd </span>hello-samza +vi src/main/config/wikipedia-feed.properties</code></pre></div> + +<p>Change the yarn.package.path property to be:</p> + +<div class="highlight"><pre><code class="jproperties"><span class="na">yarn.package.path</span><span class="o">=</span><span class="s">http://yourHostname:8000/target/hello-samza-0.10.0-dist.tar.gz</span></code></pre></div> + +<p>3.
Compile hello-samza.</p> + +<div class="highlight"><pre><code class="bash">mvn clean package +mkdir -p deploy/samza +tar -xvf ./target/hello-samza-0.10.0-dist.tar.gz -C deploy/samza</code></pre></div> + +<p>4. Deploy Samza job package to HTTP server.</p> + +<p>Open a new terminal, and run:</p> + +<div class="highlight"><pre><code class="bash"><span class="nb">cd</span> /tmp/hello-samza <span class="o">&&</span> python -m SimpleHTTPServer</code></pre></div> + +<p>Go back to the original terminal (not the one running the HTTP server):</p> + +<div class="highlight"><pre><code class="bash">deploy/samza/bin/run-job.sh --config-factory<span class="o">=</span>org.apache.samza.config.factories.PropertiesConfigFactory --config-path<span class="o">=</span>file://<span class="nv">$PWD</span>/deploy/samza/config/wikipedia-feed.properties</code></pre></div> + +<p>Go to http://yourHostname:8088 and find the wikipedia-feed job. Click on the ApplicationMaster link to see that it’s running.</p> + +<p>Congratulations! You now run the Samza job in a “real” YARN grid!</p> + + + </div> + </div> + + </div><!-- /.wrapper-content --> + </div><!-- /.wrapper --> + + <div class="footer"> + <div class="container"> + <!-- nothing for now.
--> + </div> + </div> + + + <script> + $( document ).ready(function() { + if ( $.fn.urlExists( "/learn/tutorials/latest/run-in-multi-node-yarn.html" ) ) { + $("#switch-version-button").addClass("fa fa-history masthead-icon"); + } + }); + + /* a function to test whether the url exists or not */ + (function( $ ) { + $.fn.urlExists = function(url) { + var http = new XMLHttpRequest(); + http.open('HEAD', url, false); + http.send(); + return http.status != 404; + }; + }( jQuery )); + </script> + + + <!-- Google Analytics --> + <script> + (function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){ + (i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o), + m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m) + })(window,document,'script','//www.google-analytics.com/analytics.js','ga'); + + ga('create', 'UA-43122768-1', 'apache.org'); + ga('send', 'pageview'); + + </script> + </body> +</html> Modified: samza/site/sitemap.xml URL: http://svn.apache.org/viewvc/samza/site/sitemap.xml?rev=1721445&r1=1721444&r2=1721445&view=diff ============================================================================== --- samza/site/sitemap.xml (original) +++ samza/site/sitemap.xml Tue Dec 22 19:01:05 2015 @@ -20,7 +20,7 @@ <url> <loc>http://samza.apache.org/</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> <changefreq>daily</changefreq> <priority>1.0</priority> </url> @@ -30,343 +30,357 @@ <url> <loc>http://samza.apache.org/learn/documentation/versioned/yarn/application-master.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/introduction/architecture.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/introduction/background.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> 
<loc>http://samza.apache.org/learn/documentation/versioned/container/checkpointing.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/contribute/code.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/contribute/coding-guide.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/community/committers.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/introduction/concepts.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/jobs/configuration.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> + + + </url> + + <url> + <loc>http://samza.apache.org/learn/documentation/versioned/container/coordinator-stream.html</loc> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/tutorials/versioned/deploy-samza-job-from-hdfs.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/tutorials/versioned/deploy-samza-to-CDH.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/contribute/design-documents.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/container/event-loop.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/index.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/archive/index.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> 
<url> - <loc>http://samza.apache.org/index.html</loc> - <lastmod>2015-07-12</lastmod> + <loc>http://samza.apache.org/learn/tutorials/versioned/index.html</loc> + <lastmod>2015-12-22</lastmod> </url> <url> - <loc>http://samza.apache.org/learn/tutorials/versioned/index.html</loc> - <lastmod>2015-07-12</lastmod> + <loc>http://samza.apache.org/index.html</loc> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/startup/download/index.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/startup/hello-samza/versioned/index.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/comparisons/introduction.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/community/irc.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/yarn/isolation.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/container/jmx.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/jobs/job-runner.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/operations/kafka.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/jobs/logging.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/community/mailing-lists.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> 
<loc>http://samza.apache.org/learn/documentation/versioned/container/metrics.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/comparisons/mupd8.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/api/overview.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/jobs/packaging.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> + + + </url> + + <url> + <loc>http://samza.apache.org/learn/documentation/versioned/hdfs/producer.html</loc> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/contribute/projects.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/tutorials/versioned/remote-debugging-samza.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/jobs/reprocessing.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/contribute/rules.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/tutorials/versioned/run-hello-samza-without-internet.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/tutorials/versioned/run-in-multi-node-yarn.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/container/samza-container.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/operations/security.html</loc> 
- <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/container/serialization.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/comparisons/spark-streaming.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/container/state-management.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/comparisons/storm.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/container/streams.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/contribute/tests.html</loc> - <lastmod>2015-07-12</lastmod> + <lastmod>2015-12-22</lastmod> </url> <url> - <loc>http://samza.apache.org/learn/tutorials/versioned/upgrading-from-0.7.0-to-0.8.0.html</loc> - <lastmod>2015-07-12</lastmod> + <loc>http://samza.apache.org/learn/documentation/versioned/jobs/web-ui-rest-api.html</loc> + <lastmod>2015-12-22</lastmod> </url> <url> - <loc>http://samza.apache.org/learn/documentation/versioned/jobs/web-ui-rest-api.html</loc> - <lastmod>2015-07-12</lastmod> + <loc>http://samza.apache.org/learn/documentation/versioned/container/windowing.html</loc> + <lastmod>2015-12-22</lastmod> </url> <url> - <loc>http://samza.apache.org/learn/documentation/versioned/container/windowing.html</loc> - <lastmod>2015-07-12</lastmod> + <loc>http://samza.apache.org/learn/documentation/versioned/yarn/yarn-host-affinity.html</loc> + <lastmod>2015-12-22</lastmod> </url> <url> <loc>http://samza.apache.org/learn/documentation/versioned/jobs/yarn-jobs.html</loc> - <lastmod>2015-07-12</lastmod> + 
<lastmod>2015-12-22</lastmod> </url>
