accumulo-testing git commit: ACCUMULO-4581 Fixing several bugs in agitator scripts
Repository: accumulo-testing Updated Branches: refs/heads/master 28ca75a36 -> 7495ba604 ACCUMULO-4581 Fixing several bugs in agitator scripts * Updated how perl scripts are called in bash * Removed analyze-missing.pl as it relies on centralized logging * Renamed accumulo home and conf dir variables names in agitator perl scripts Project: http://git-wip-us.apache.org/repos/asf/accumulo-testing/repo Commit: http://git-wip-us.apache.org/repos/asf/accumulo-testing/commit/7495ba60 Tree: http://git-wip-us.apache.org/repos/asf/accumulo-testing/tree/7495ba60 Diff: http://git-wip-us.apache.org/repos/asf/accumulo-testing/diff/7495ba60 Branch: refs/heads/master Commit: 7495ba6048ead216e578e8b6cdcc86d4ae8b1b47 Parents: 28ca75a Author: Mike WalchAuthored: Wed Feb 1 15:53:47 2017 -0500 Committer: Mike Walch Committed: Mon Feb 6 15:55:26 2017 -0500 -- bin/accumulo-testing | 28 --- conf/accumulo-testing-env.sh.example | 12 ++- libexec/analyze-missing.pl | 127 -- libexec/datanode-agitator.pl | 18 ++--- libexec/master-agitator.pl | 25 +++--- libexec/tserver-agitator.pl | 22 +++--- 6 files changed, 49 insertions(+), 183 deletions(-) -- http://git-wip-us.apache.org/repos/asf/accumulo-testing/blob/7495ba60/bin/accumulo-testing -- diff --git a/bin/accumulo-testing b/bin/accumulo-testing index 7cf7206..84a1d40 100755 --- a/bin/accumulo-testing +++ b/bin/accumulo-testing @@ -116,6 +116,8 @@ function determine_mapred_main() { } function start_agitator() { + hash pssh 2>/dev/null || { echo >&2 "The agitator requires pssh to be installed. 
Aborting."; exit 1; } + mkdir -p "${at_home}/logs" log_base="${at_home}/logs/$(date +%Y%m%d%H%M%S)_$(hostname)" libexec="${at_home}/libexec" @@ -132,17 +134,23 @@ function start_agitator() { su -c "$master_cmd >${master_log}.out 2>${master_log}.err" & -m - "$AGTR_ACCUMULO_USER" su -c "$tserver_cmd >${tserver_log}.out 2>${tserver_log}.err" & -m - "$AGTR_ACCUMULO_USER" su -c "$datanode_cmd >${datanode_log}.out 2>${datanode_log}.err" & -m - "$AGTR_HDFS_USER" - elif [[ $AGITATOR_USER == "$AGTR_ACCUMULO_USER" ]]; then -echo "Running master-agitator and tserver-agitator as $AGITATOR_USER Running datanode-agitator as $AGTR_HDFS_USER using sudo." -$master_cmd > "${master_log}.out" 2> "${master_log}.err" & -$tserver_cmd > "${tserver_log}.out" 2> "${tserver_log}.err" & -sudo -u "$AGTR_HDFS_USER" "$datanode_cmd" > "${datanode_log}.out" 2> "${datanode_log}.err" & else -echo "Running master-agitator and tserver-agitator as $AGTR_ACCUMULO_USER using sudo. Running datanode-agitator as $AGTR_HDFS_USER using sudo." -# Not root, and not the accumulo user, hope you can sudo to it -sudo -u "$AGTR_ACCUMULO_USER" "$master_cmd" > "${master_log}.out" 2> "${master_log}.err" & -sudo -u "$AGTR_ACCUMULO_USER" "$tserver_cmd" > "${tserver_log}.out" 2> "${tserver_log}.err" & -sudo -u "$AGTR_HDFS_USER" "$datanode_cmd" > "${datanode_log}.out" 2> "${datanode_log}.err" & -m - "$AGTR_HDFS_USER" +if [[ $AGITATOR_USER == "$AGTR_ACCUMULO_USER" ]]; then + echo "Running master-agitator and tserver-agitator as $AGITATOR_USER" + $master_cmd > "${master_log}.out" 2> "${master_log}.err" & + $tserver_cmd > "${tserver_log}.out" 2> "${tserver_log}.err" & +else + echo "Running master-agitator and tserver-agitator as $AGTR_ACCUMULO_USER using sudo." 
+ sudo -u "$AGTR_ACCUMULO_USER" $master_cmd > "${master_log}.out" 2> "${master_log}.err" & + sudo -u "$AGTR_ACCUMULO_USER" $tserver_cmd > "${tserver_log}.out" 2> "${tserver_log}.err" & +fi +if [[ $AGITATOR_USER == "$AGTR_HDFS_USER" ]]; then + echo "Running datanode-agitator as $AGITATOR_USER" + $datanode_cmd > "${datanode_log}.out" 2> "${datanode_log}.err" & +else + echo "Running datanode-agitator as $AGTR_HDFS_USER using sudo." + sudo -u "$AGTR_HDFS_USER" $datanode_cmd > "${datanode_log}.out" 2> "${datanode_log}.err" & +fi fi if ${AGTR_HDFS:-false} ; then http://git-wip-us.apache.org/repos/asf/accumulo-testing/blob/7495ba60/conf/accumulo-testing-env.sh.example -- diff --git a/conf/accumulo-testing-env.sh.example b/conf/accumulo-testing-env.sh.example index 3f71463..e03c973 100644 --- a/conf/accumulo-testing-env.sh.example +++ b/conf/accumulo-testing-env.sh.example @@ -13,20 +13,18 @@ # See the License for the specific language governing permissions and # limitations under the License. -# Hadoop -# == +# General +# === test -z "$HADOOP_PREFIX" && export HADOOP_PREFIX=/path/to/hadoop -test -z
accumulo-examples git commit: ACCUMULO-4528 tool.sh is now 'accumulo-util hadoop-jar'
Repository: accumulo-examples Updated Branches: refs/heads/master d10b96321 -> 71a84a1ef ACCUMULO-4528 tool.sh is now 'accumulo-util hadoop-jar' * Added note in README about copying jar to accumulo/lib/ext Project: http://git-wip-us.apache.org/repos/asf/accumulo-examples/repo Commit: http://git-wip-us.apache.org/repos/asf/accumulo-examples/commit/71a84a1e Tree: http://git-wip-us.apache.org/repos/asf/accumulo-examples/tree/71a84a1e Diff: http://git-wip-us.apache.org/repos/asf/accumulo-examples/diff/71a84a1e Branch: refs/heads/master Commit: 71a84a1ef2326889a79991dd3ba1ae30d2688119 Parents: d10b963 Author: Mike WalchAuthored: Fri Feb 17 11:36:28 2017 -0500 Committer: Mike Walch Committed: Fri Feb 17 15:21:16 2017 -0500 -- README.md | 12 docs/bulkIngest.md | 2 +- docs/filedata.md| 2 +- docs/mapred.md | 6 +++--- docs/regex.md | 2 +- docs/rowhash.md | 2 +- docs/tabletofile.md | 2 +- docs/terasort.md| 2 +- 8 files changed, 17 insertions(+), 13 deletions(-) -- http://git-wip-us.apache.org/repos/asf/accumulo-examples/blob/71a84a1e/README.md -- diff --git a/README.md b/README.md index 63a02d8..c4450eb 100644 --- a/README.md +++ b/README.md @@ -41,7 +41,12 @@ Before running any of the examples, the following steps must be performed. cp examples.conf.template examples.conf nano examples.conf -5. Each Accumulo example has its own documentation and instructions for running the example which +5. The examples have some custom iterators that need to be executed by Accumulo tablet servers. + Make them available by copying the accumulo-examples.jar to Accumulo's `lib/ext` directory. + +cp target/accumulo-examples-X.Y.Z.jar /path/accumulo/lib/ext/ + +6. Each Accumulo example has its own documentation and instructions for running the example which are linked to below. When running the examples, remember the tips below: @@ -50,9 +55,8 @@ When running the examples, remember the tips below: The `runex` command is a simple wrapper around the Maven Exec plugin. 
* Commands intended to be run in bash are prefixed by '$' and should be run from the root of this repository. -* Several examples use the `accumulo` and `tool.sh` commands which are expected to be on your - `PATH`. These commands are found in the `bin/` and `contrib/` directories of your Accumulo - installation. +* Several examples use the `accumulo` and `accumulo-util` commands which are expected to be on your + `PATH`. These commands are found in the `bin/` directory of your Accumulo installation. * Commands intended to be run in the Accumulo shell are prefixed by '>'. ## Available Examples http://git-wip-us.apache.org/repos/asf/accumulo-examples/blob/71a84a1e/docs/bulkIngest.md -- diff --git a/docs/bulkIngest.md b/docs/bulkIngest.md index 614bde4..22bf07c 100644 --- a/docs/bulkIngest.md +++ b/docs/bulkIngest.md @@ -27,7 +27,7 @@ accumulo. Then we verify the 1000 rows are in accumulo. $ ARGS="-i instance -z zookeepers -u username -p password" $ accumulo $PKG.SetupTable $ARGS -t test_bulk row_0333 row_0666 $ accumulo $PKG.GenerateTestData --start-row 0 --count 1000 --output bulk/test_1.txt -$ tool.sh target/accumulo-examples.jar $PKG.BulkIngestExample $ARGS -t test_bulk --inputDir bulk --workDir tmp/bulkWork +$ accumulo-util hadoop-jar target/accumulo-examples.jar $PKG.BulkIngestExample $ARGS -t test_bulk --inputDir bulk --workDir tmp/bulkWork $ accumulo $PKG.VerifyIngest $ARGS -t test_bulk --start-row 0 --count 1000 For a high level discussion of bulk ingest, see the docs dir. http://git-wip-us.apache.org/repos/asf/accumulo-examples/blob/71a84a1e/docs/filedata.md -- diff --git a/docs/filedata.md b/docs/filedata.md index 84311d2..aacd86e 100644 --- a/docs/filedata.md +++ b/docs/filedata.md @@ -40,7 +40,7 @@ Open the accumulo shell and look at the data. The row is the MD5 hash of the fil Run the CharacterHistogram MapReduce to add some information about the file. 
-$ tool.sh target/accumulo-examples.jar org.apache.accumulo.examples.filedata.CharacterHistogram -c ./examples.conf -t dataTable --auths exampleVis --vis exampleVis +$ accumulo-util hadoop-jar target/accumulo-examples.jar org.apache.accumulo.examples.filedata.CharacterHistogram -c ./examples.conf -t dataTable --auths exampleVis --vis exampleVis Scan again to see the histogram stored in the 'info' column family. http://git-wip-us.apache.org/repos/asf/accumulo-examples/blob/71a84a1e/docs/mapred.md
[3/4] accumulo git commit: ACCUMULO-4528 Accumulo scripts improvements
ACCUMULO-4528 Accumulo scripts improvements * Accumulo now determines hostname in Java * Minimized use of environment variables * Consolidated scripts by moving code in service.sh and cluster.sh to accumulo-service and accumulo-cluster. * Example host files (i.e. master, tservers) are no longer included in tarball distribution. User can create them using 'accumulo-cluster create-config' * Moved check-tservers from distribution to contrib/scripts in repo. * NUMA and multiple tservers are no longer configured in scripts but NUMA commands could be added using ACCUMULO_JAVA_PREFIX env variable. * Removed accumulo-watcher script as restarting services should not be handled by Accumulo scripts. Script could still be used in future using ACCUMULO_JAVA_PREFIX. * Made several updates to accumulo-env.sh * Moved create-config and build-native from accumulo script to new accumulo-util script which now includes scripts from contrib dir Project: http://git-wip-us.apache.org/repos/asf/accumulo/repo Commit: http://git-wip-us.apache.org/repos/asf/accumulo/commit/9a3cc5c4 Tree: http://git-wip-us.apache.org/repos/asf/accumulo/tree/9a3cc5c4 Diff: http://git-wip-us.apache.org/repos/asf/accumulo/diff/9a3cc5c4 Branch: refs/heads/master Commit: 9a3cc5c445293e8d4219cc066757a72a972804b4 Parents: 00b1535 Author: Mike Walch Authored: Thu Feb 2 12:15:17 2017 -0500 Committer: Mike Walch Committed: Fri Feb 17 13:47:06 2017 -0500 -- INSTALL.md | 42 +- assemble/bin/accumulo | 610 +++-- assemble/bin/accumulo-cluster | 300 +++- assemble/bin/accumulo-service | 95 ++- assemble/bin/accumulo-util | 686 +++ assemble/conf/examples/gc | 16 - .../conf/examples/generic_logger.properties | 6 +- assemble/conf/examples/generic_logger.xml | 6 +- assemble/conf/examples/masters | 16 - assemble/conf/examples/monitor | 16 - .../conf/examples/templates/accumulo-env.sh | 64 ++ .../conf/examples/templates/accumulo-site.xml | 175 + assemble/conf/examples/tracers | 16 - assemble/conf/examples/tservers | 16 - 
assemble/contrib/bootstrap-hdfs.sh | 91 --- assemble/contrib/check-tservers | 199 -- assemble/contrib/gen-monitor-cert.sh| 85 --- assemble/contrib/tool.sh| 93 --- assemble/libexec/accumulo-watcher.sh| 141 assemble/libexec/cluster.sh | 325 - assemble/libexec/load-env.sh| 155 - assemble/libexec/service.sh | 239 --- assemble/libexec/templates/accumulo-env.sh | 90 --- assemble/libexec/templates/accumulo-site.xml| 175 - assemble/pom.xml| 7 +- assemble/src/main/assemblies/component.xml | 50 +- .../main/scripts/generate-example-configs.sh| 2 +- contrib/scripts/check-tservers.py | 199 ++ .../accumulo/core/conf/ConfigurationDocGen.java | 2 +- .../org/apache/accumulo/core/conf/Property.java | 2 +- .../main/asciidoc/chapters/administration.txt | 187 ++--- docs/src/main/asciidoc/chapters/clients.txt | 4 +- docs/src/main/asciidoc/chapters/kerberos.txt| 14 +- docs/src/main/asciidoc/chapters/replication.txt | 4 +- docs/src/main/asciidoc/chapters/ssl.txt | 4 +- .../main/asciidoc/chapters/troubleshooting.txt | 7 +- .../apache/accumulo/server/init/Initialize.java | 2 +- .../java/org/apache/accumulo/start/Main.java| 2 - 38 files changed, 1691 insertions(+), 2452 deletions(-) -- http://git-wip-us.apache.org/repos/asf/accumulo/blob/9a3cc5c4/INSTALL.md -- diff --git a/INSTALL.md b/INSTALL.md index b614991..6e924c4 100644 --- a/INSTALL.md +++ b/INSTALL.md @@ -25,11 +25,13 @@ source code. Unpack as follows. tar xzf /accumulo-X.Y.Z-bin.tar.gz cd accumulo-X.Y.Z -There are three scripts in the the `bin/` directory that are used to manage Accumulo: +There are four scripts in the `bin` directory of the tarball distribution that are used +to manage Accumulo: 1. `accumulo` - Runs Accumulo command-line tools and starts Accumulo processes 2. `accumulo-service` - Runs Accumulo processes as services 3. `accumulo-cluster` - Manages Accumulo cluster on a single node or several nodes +4. `accumulo-util` - Accumulo utilities for creating configuration, native libraries, etc. 
These scripts will be used in the remaining instructions to configure and run Accumulo. For convenience, consider adding `accumulo-X.Y.Z/bin/`
[1/4] accumulo git commit: ACCUMULO-4528 Accumulo scripts improvements
Repository: accumulo Updated Branches: refs/heads/master e2247ead5 -> 6494a829b http://git-wip-us.apache.org/repos/asf/accumulo/blob/9a3cc5c4/docs/src/main/asciidoc/chapters/administration.txt -- diff --git a/docs/src/main/asciidoc/chapters/administration.txt b/docs/src/main/asciidoc/chapters/administration.txt index 1478543..f2ed57a 100644 --- a/docs/src/main/asciidoc/chapters/administration.txt +++ b/docs/src/main/asciidoc/chapters/administration.txt @@ -40,7 +40,7 @@ network bandwidth must be available between any two machines. In addition to needing access to ports associated with HDFS and ZooKeeper, Accumulo will use the following default ports. Please make sure that they are open, or change -their value in conf/accumulo-site.xml. +their value in accumulo-site.xml. .Accumulo default ports [width="75%",cols=">,^2,^2"] @@ -80,24 +80,15 @@ sufficient space: Repeat this step on each machine in your cluster. Typically, the same ++ is chosen for all machines in the cluster. -There are three scripts in the the `bin/` directory that are used to manage Accumulo: +There are four scripts in the `bin/` directory that are used to manage Accumulo: 1. `accumulo` - Runs Accumulo command-line tools and starts Accumulo processes 2. `accumulo-service` - Runs Accumulo processes as services 3. `accumulo-cluster` - Manages Accumulo cluster on a single node or several nodes +4. `accumulo-util` - Accumulo utilities for creating configuration, native libraries, etc. These scripts will be used in the remaining instructions to configure and run Accumulo. -Add the following to your `~/.bashrc` if you want to be able to execute these scripts -from any directory: - - export PATH=/path/to/accumulo-X.Y.Z/bin:$PATH - -Source your `~/.bashrc` for the changes to take effect and verify: - - source ~/.bashrc - which accumulo - === Dependencies Accumulo requires HDFS and ZooKeeper to be configured and running @@ -108,32 +99,37 @@ sync, which can cause problems with automatically timestamped data. 
=== Configuration -Accumulo is configured by editing several Shell and XML files found in -+$ACCUMULO_CONF_DIR+. The structure closely resembles Hadoop's configuration -files. +The Accumulo tarball contains a +conf/+ directory where Accumulo looks for configuration. If you +installed Accumulo using downstream packaging, the +conf/+ could be something else like +/etc/accumulo/+. -Logging is primarily controlled using the log4j configuration files, -+generic_logger.xml+ and +monitor_logger.xml+ (or their corresponding -+.properties+ version if the +.xml+ version is missing). The generic logger is -used for most server types, and is typically configured to send logs to the -monitor, as well as log files. The monitor logger is used by the monitor, and -is typically configured to log only errors the monitor itself generates, -rather than all the logs that it receives from other server types. +Before starting Accumulo, the configuration files +accumulo-env.sh+ and +accumulo-site.xml+ must exist in ++conf/+ and be properly configured. You can either copy these files from +conf/examples+ or run ++accumulo-util create-config+ to generate these files. If you are using +accumulo-cluster+ to launch +a cluster, the `conf/` directory must also contain hosts file for Accumulo services (i.e +gc+, +masters+, ++monitor+, +tservers+, +tracers+). You can either create these files manually or run ++accumulo-cluster create-config+. - Edit conf/accumulo-env.sh +Additional optional configuration files can be copied from `conf/examples` to `conf/`. For example, +logging is primarily controlled using the log4j configuration files, +generic_logger.xml+ and ++monitor_logger.xml+ (or their corresponding +.properties+ version if the +.xml+ version is missing). +The generic logger is used for most server types, and is typically configured to send logs to the +monitor, as well as log files. 
The monitor logger is used by the monitor, and is typically configured +to log only errors the monitor itself generates, rather than all the logs that it receives from other +server types. + + Configure accumulo-env.sh Accumulo needs to know where to find the software it depends on. Edit accumulo-env.sh and specify the following: -. Enter your system's Java home for +$JAVA_HOME+ . Enter the location of Hadoop for +$HADOOP_PREFIX+ -. Choose a location for Accumulo logs and enter it for +$ACCUMULO_LOG_DIR+ . Enter the location of ZooKeeper for +$ZOOKEEPER_HOME+ +. Optionally, choose a different location for Accumulo logs using +$ACCUMULO_LOG_DIR+ -By default Accumulo TabletServers are set to use 1GB of memory. You may change -this by altering the value of +$ACCUMULO_TSERVER_OPTS+. Note the syntax is that of -the Java JVM command line options. This value should be less than the physical -memory of the machines running TabletServers. +You
[4/4] accumulo git commit: Merge branch 'script-refactor'
Merge branch 'script-refactor' Project: http://git-wip-us.apache.org/repos/asf/accumulo/repo Commit: http://git-wip-us.apache.org/repos/asf/accumulo/commit/6494a829 Tree: http://git-wip-us.apache.org/repos/asf/accumulo/tree/6494a829 Diff: http://git-wip-us.apache.org/repos/asf/accumulo/diff/6494a829 Branch: refs/heads/master Commit: 6494a829b9560b3b38359641f25ecdcf3aac9a75 Parents: e2247ea 9a3cc5c Author: Mike WalchAuthored: Fri Feb 17 14:05:34 2017 -0500 Committer: Mike Walch Committed: Fri Feb 17 14:05:34 2017 -0500 -- INSTALL.md | 42 +- assemble/bin/accumulo | 610 +++-- assemble/bin/accumulo-cluster | 300 +++- assemble/bin/accumulo-service | 95 ++- assemble/bin/accumulo-util | 686 +++ assemble/conf/examples/gc | 16 - .../conf/examples/generic_logger.properties | 6 +- assemble/conf/examples/generic_logger.xml | 6 +- assemble/conf/examples/masters | 16 - assemble/conf/examples/monitor | 16 - .../conf/examples/templates/accumulo-env.sh | 64 ++ .../conf/examples/templates/accumulo-site.xml | 175 + assemble/conf/examples/tracers | 16 - assemble/conf/examples/tservers | 16 - assemble/contrib/bootstrap-hdfs.sh | 91 --- assemble/contrib/check-tservers | 199 -- assemble/contrib/gen-monitor-cert.sh| 85 --- assemble/contrib/tool.sh| 93 --- assemble/libexec/accumulo-watcher.sh| 141 assemble/libexec/cluster.sh | 325 - assemble/libexec/load-env.sh| 155 - assemble/libexec/service.sh | 239 --- assemble/libexec/templates/accumulo-env.sh | 90 --- assemble/libexec/templates/accumulo-site.xml| 175 - assemble/pom.xml| 7 +- assemble/src/main/assemblies/component.xml | 50 +- .../main/scripts/generate-example-configs.sh| 2 +- contrib/scripts/check-tservers.py | 199 ++ .../accumulo/core/conf/ConfigurationDocGen.java | 2 +- .../org/apache/accumulo/core/conf/Property.java | 2 +- .../main/asciidoc/chapters/administration.txt | 187 ++--- docs/src/main/asciidoc/chapters/clients.txt | 4 +- docs/src/main/asciidoc/chapters/kerberos.txt| 14 +- docs/src/main/asciidoc/chapters/replication.txt | 4 
+- docs/src/main/asciidoc/chapters/ssl.txt | 4 +- .../main/asciidoc/chapters/troubleshooting.txt | 7 +- .../apache/accumulo/server/init/Initialize.java | 2 +- .../java/org/apache/accumulo/start/Main.java| 2 - 38 files changed, 1691 insertions(+), 2452 deletions(-) -- http://git-wip-us.apache.org/repos/asf/accumulo/blob/6494a829/docs/src/main/asciidoc/chapters/administration.txt -- diff --cc docs/src/main/asciidoc/chapters/administration.txt index bfddb31,f2ed57a..ad6cf11 --- a/docs/src/main/asciidoc/chapters/administration.txt +++ b/docs/src/main/asciidoc/chapters/administration.txt @@@ -1178,24 -1129,25 +1129,16 @@@ are true interruptions to availability Several of these conditions become more common in VM environments, where they can be exacerbated by resource constraints and clock drift. - Accumulo includes a mechanism to limit the impact of the false positives known - as the <>. The watcher monitors Accumulo processes and will restart - them when they fail for certain reasons. The watcher can be configured within - the accumulo-env.sh file inside of Accumulo's configuration directory. We - recommend using the watcher to monitor Accumulo processes, as it will restore - the system to full capacity without administrator interaction after many of the - common failure modes. - Tested Versions -Another large consideration for Accumulo stability is to use versions of -software that have been tested together in a VM environment. Any cluster of -processes that have not been tested together are likely to expose running -conditions that vary from the environments individually tested in the various -components. For example, Accumulo's use of HDFS includes many short block -reads, which differs from the more common full file read used in most -map/reduce applications. We have found that certain versions of Accumulo and -Hadoop will include stability bugs that greatly affect overall stability. 
In -our testing, Accumulo 1.6.2, Hadoop 2.6.0, and Zookeeper 3.4.6 resulted in a -stable VM clusters that did not fail a month of testing, while Accumulo 1.6.1, -Hadoop 2.5.1, and Zookeeper 3.4.5 had a mean
[2/4] accumulo git commit: ACCUMULO-4528 Accumulo scripts improvements
http://git-wip-us.apache.org/repos/asf/accumulo/blob/9a3cc5c4/assemble/conf/examples/templates/accumulo-site.xml -- diff --git a/assemble/conf/examples/templates/accumulo-site.xml b/assemble/conf/examples/templates/accumulo-site.xml new file mode 100644 index 000..a1f4153 --- /dev/null +++ b/assemble/conf/examples/templates/accumulo-site.xml @@ -0,0 +1,175 @@ + + + + + + + +instance.volumes + +comma separated list of URIs for volumes. example: hdfs://localhost:9000/accumulo + + + +instance.zookeeper.host +localhost:2181 +comma separated list of zookeeper servers + + + +instance.secret +DEFAULT +A secret unique to a given instance that all servers must know in order to communicate with one another. + Change it before initialization. To + change it later use ./bin/accumulo org.apache.accumulo.server.util.ChangeSecret --old [oldpasswd] --new [newpasswd], + and then update this file. + + + + +tserver.memory.maps.max +${memMapMax} + + + +tserver.memory.maps.native.enabled +${nativeEnabled} + + + +tserver.cache.data.size +${cacheDataSize} + + + +tserver.cache.index.size +${cacheIndexSize} + + + +trace.token.property.password + +secret + + + + +instance.rpc.sasl.enabled +true + + + +general.kerberos.keytab +${keytab} + + + +general.kerberos.principal +${principal} + + + +trace.token.type + org.apache.accumulo.core.client.security.tokens.KerberosToken + + + +instance.security.authenticator + org.apache.accumulo.server.security.handler.KerberosAuthenticator + + + +instance.security.authorizor + org.apache.accumulo.server.security.handler.KerberosAuthorizor + + + +instance.security.permissionHandler + org.apache.accumulo.server.security.handler.KerberosPermissionHandler + + + + +trace.user +${traceUser} + + + +tserver.sort.buffer.size +${sortBufferSize} + + + +tserver.walog.max.size +${waLogMaxSize} + +${mvnProjBaseDir} + +general.classpaths + + + + $ACCUMULO_HOME/lib/accumulo-server.jar, + $ACCUMULO_HOME/lib/accumulo-core.jar, + $ACCUMULO_HOME/lib/accumulo-start.jar, + 
$ACCUMULO_HOME/lib/accumulo-fate.jar, + $ACCUMULO_HOME/lib/accumulo-proxy.jar, + $ACCUMULO_HOME/lib/[^.].*.jar, + + $ZOOKEEPER_HOME/zookeeper[^.].*.jar, + + $HADOOP_CONF_DIR, + + $HADOOP_PREFIX/share/hadoop/common/[^.].*.jar, + $HADOOP_PREFIX/share/hadoop/common/lib/(?!slf4j)[^.].*.jar, + $HADOOP_PREFIX/share/hadoop/hdfs/[^.].*.jar, + $HADOOP_PREFIX/share/hadoop/mapreduce/[^.].*.jar, + $HADOOP_PREFIX/share/hadoop/yarn/[^.].*.jar, + $HADOOP_PREFIX/share/hadoop/yarn/lib/jersey.*.jar, + + + /usr/lib/hadoop/[^.].*.jar, + /usr/lib/hadoop/lib/[^.].*.jar, + /usr/lib/hadoop-hdfs/[^.].*.jar, + /usr/lib/hadoop-mapreduce/[^.].*.jar, + /usr/lib/hadoop-yarn/[^.].*.jar, + /usr/lib/hadoop-yarn/lib/jersey.*.jar, + + + /usr/hdp/current/hadoop-client/[^.].*.jar, + /usr/hdp/current/hadoop-client/lib/(?!slf4j)[^.].*.jar, + /usr/hdp/current/hadoop-hdfs-client/[^.].*.jar, + /usr/hdp/current/hadoop-mapreduce-client/[^.].*.jar, + /usr/hdp/current/hadoop-yarn-client/[^.].*.jar, + /usr/hdp/current/hadoop-yarn-client/lib/jersey.*.jar, + /usr/hdp/current/hive-client/lib/hive-accumulo-handler.jar + + + /usr/iop/current/hadoop-client/[^.].*.jar, + /usr/iop/current/hadoop-client/lib/(?!slf4j)[^.].*.jar, + /usr/iop/current/hadoop-hdfs-client/[^.].*.jar, + /usr/iop/current/hadoop-mapreduce-client/[^.].*.jar, + /usr/iop/current/hadoop-yarn-client/[^.].*.jar, + /usr/iop/current/hadoop-yarn-client/lib/jersey.*.jar, + /usr/iop/current/hive-client/lib/hive-accumulo-handler.jar + + +Classpaths that accumulo checks for updates and class files. + + http://git-wip-us.apache.org/repos/asf/accumulo/blob/9a3cc5c4/assemble/conf/examples/tracers -- diff --git a/assemble/conf/examples/tracers b/assemble/conf/examples/tracers deleted file mode 100644 index 63fb8bb..000 --- a/assemble/conf/examples/tracers +++ /dev/null @@ -1,16 +0,0 @@ -# Licensed to the Apache Software Foundation (ASF) under one or more -# contributor license agreements. 
See the NOTICE file distributed with -# this work for additional information regarding copyright ownership. -# The ASF licenses this file to You under the Apache License, Version 2.0 -# (the "License"); you may not use this file except in compliance with -# the License. You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed
[2/3] accumulo-wikisearch git commit: Use hadoop-client dep instead of hadoop-common
Use hadoop-client dep instead of hadoop-common Project: http://git-wip-us.apache.org/repos/asf/accumulo-wikisearch/repo Commit: http://git-wip-us.apache.org/repos/asf/accumulo-wikisearch/commit/fb4af6c2 Tree: http://git-wip-us.apache.org/repos/asf/accumulo-wikisearch/tree/fb4af6c2 Diff: http://git-wip-us.apache.org/repos/asf/accumulo-wikisearch/diff/fb4af6c2 Branch: refs/heads/master Commit: fb4af6c2d50d061f33ae4341d37290b6b56bd1c4 Parents: eb573a5 Author: Mike MillerAuthored: Thu Feb 16 15:52:21 2017 -0500 Committer: Mike Miller Committed: Fri Feb 17 10:38:49 2017 -0500 -- pom.xml | 2 +- query/pom.xml | 14 ++ 2 files changed, 3 insertions(+), 13 deletions(-) -- http://git-wip-us.apache.org/repos/asf/accumulo-wikisearch/blob/fb4af6c2/pom.xml -- diff --git a/pom.xml b/pom.xml index 08e9dbb..d62928a 100644 --- a/pom.xml +++ b/pom.xml @@ -68,7 +68,7 @@ org.apache.hadoop - hadoop-common + hadoop-client ${version.hadoop} http://git-wip-us.apache.org/repos/asf/accumulo-wikisearch/blob/fb4af6c2/query/pom.xml -- diff --git a/query/pom.xml b/query/pom.xml index 76494eb..e022965 100644 --- a/query/pom.xml +++ b/query/pom.xml @@ -74,17 +74,7 @@ org.apache.hadoop - hadoop-common - - -com.sun.jersey -jersey-json - - -javax.servlet -servlet-api - - + hadoop-client javaee @@ -156,7 +146,7 @@ lib - commons-io,commons-configuration,commons-lang,commons-codec,protobuf-java,libthrift,zookeeper,hadoop-common,commons-jexl,guava,kryo,asm,minlog,reflectasm,wikisearch-ingest,accumulo-core,accumulo-fate,accumulo-trace,htrace-core + commons-io,commons-configuration,commons-lang,commons-codec,protobuf-java,libthrift,zookeeper,hadoop-client,commons-jexl,guava,kryo,asm,minlog,reflectasm,wikisearch-ingest,accumulo-core,accumulo-fate,accumulo-trace,htrace-core true
[1/3] accumulo-wikisearch git commit: Fixes to query for 1.8 Update
Repository: accumulo-wikisearch Updated Branches: refs/heads/master 074fa7729 -> e51ad6a2f Fixes to query for 1.8 Update Project: http://git-wip-us.apache.org/repos/asf/accumulo-wikisearch/repo Commit: http://git-wip-us.apache.org/repos/asf/accumulo-wikisearch/commit/eb573a51 Tree: http://git-wip-us.apache.org/repos/asf/accumulo-wikisearch/tree/eb573a51 Diff: http://git-wip-us.apache.org/repos/asf/accumulo-wikisearch/diff/eb573a51 Branch: refs/heads/master Commit: eb573a5188c10fc82ddf911f4a0ab892860335d1 Parents: 074fa77 Author: Mike MillerAuthored: Wed Jan 4 14:19:33 2017 -0500 Committer: Mike Miller Committed: Thu Feb 16 10:53:38 2017 -0500 -- .gitignore | 3 +- INSTALL.md | 14 +- pom.xml | 3 +- query-war/src/main/webapp/WEB-INF/web.xml | 10 -- query-war/src/main/webapp/ui.html | 131 +++ query-war/src/main/webapp/ui.jsp| 131 --- query/pom.xml | 29 +++- .../iterator/DefaultIteratorEnvironment.java| 57 ++-- .../src/main/resources/META-INF/ejb-jar.xml.uno | 62 + 9 files changed, 242 insertions(+), 198 deletions(-) -- http://git-wip-us.apache.org/repos/asf/accumulo-wikisearch/blob/eb573a51/.gitignore -- diff --git a/.gitignore b/.gitignore index 8a09ac0..9a97fb5 100644 --- a/.gitignore +++ b/.gitignore @@ -5,4 +5,5 @@ .project .settings/ .classpath - +wikipedia.xml +ejb-jar.xml http://git-wip-us.apache.org/repos/asf/accumulo-wikisearch/blob/eb573a51/INSTALL.md -- diff --git a/INSTALL.md b/INSTALL.md index 9a85105..f7cc175 100644 --- a/INSTALL.md +++ b/INSTALL.md @@ -49,9 +49,12 @@ Instructions for installing and running the Accumulo Wikisearch example. ### Prerequisites -1. The query software was tested using JBoss AS 6. Install this unless you feel like messing with the installation. - - NOTE: Ran into a [bug] that did not allow an EJB3.1 war file. The workaround is to separate the RESTEasy servlet -from the EJBs by creating an EJB jar and a WAR file. +1. The query software was tested using JBoss AS 6. 
Install the JBoss distro and follow the instructions below + to build the EJB jar and WAR file required. + * To stop the JBoss warnings about WSDescriptorDeployer and JMSDescriptorDeployer, these deployers can be +removed from `$JBOSS_HOME/server/default/deployers/jbossws.deployer/META-INF/stack-agnostic-jboss-beans.xml` +1. Ensure that you have successfully run `mvn clean install` at the Wikisearch top level to install the jars + into your local maven repo before building the query package. ### Instructions @@ -85,7 +88,7 @@ Instructions for installing and running the Accumulo Wikisearch example. 1. At this point you should be able to open a browser and view the page: -http://localhost:8080/accumulo-wikisearch/ui/ui.jsp +http://localhost:8080/accumulo-wikisearch/ui.html You can issue the queries using this user interface or via the following REST urls: @@ -98,6 +101,9 @@ Instructions for installing and running the Accumulo Wikisearch example. into the search box at ui.jsp, and the auths parameter is a comma-separated list of wikis that you want to search (i.e. enwiki,frwiki,dewiki, etc. Or you can use all) + - NOTE: Ran into a [bug] that did not allow an EJB3.1 war file. The workaround is to separate the RESTEasy servlet +from the EJBs by creating an EJB jar and a WAR file. 
+ [ejb-jar.xml.example]: query/src/main/resources/META-INF/ejb-jar.xml.example [dump-files]: http://dumps.wikimedia.org/backup-index.html [wikipedia.xml.example]: ingest/conf/wikipedia.xml.example http://git-wip-us.apache.org/repos/asf/accumulo-wikisearch/blob/eb573a51/pom.xml -- diff --git a/pom.xml b/pom.xml index bebc1cf..08e9dbb 100644 --- a/pom.xml +++ b/pom.xml @@ -45,6 +45,7 @@ 1.0.1.Final 11.0.2 2.6.4 +3.1.0-incubating 2.1.0.GA 4.11 1.04 @@ -67,7 +68,7 @@ org.apache.hadoop - hadoop-client + hadoop-common ${version.hadoop} http://git-wip-us.apache.org/repos/asf/accumulo-wikisearch/blob/eb573a51/query-war/src/main/webapp/WEB-INF/web.xml -- diff --git a/query-war/src/main/webapp/WEB-INF/web.xml b/query-war/src/main/webapp/WEB-INF/web.xml index a4ff03a..ffde45a 100644 --- a/query-war/src/main/webapp/WEB-INF/web.xml +++
[3/3] accumulo-wikisearch git commit: Fix to use proper Accumulo API
Fix to use proper Accumulo API Project: http://git-wip-us.apache.org/repos/asf/accumulo-wikisearch/repo Commit: http://git-wip-us.apache.org/repos/asf/accumulo-wikisearch/commit/e51ad6a2 Tree: http://git-wip-us.apache.org/repos/asf/accumulo-wikisearch/tree/e51ad6a2 Diff: http://git-wip-us.apache.org/repos/asf/accumulo-wikisearch/diff/e51ad6a2 Branch: refs/heads/master Commit: e51ad6a2f6a2f6437f627e6ec7d76f17d0378323 Parents: fb4af6c Author: Mike MillerAuthored: Fri Feb 17 12:27:58 2017 -0500 Committer: Mike Miller Committed: Fri Feb 17 12:27:58 2017 -0500 -- .../iterator/DefaultIteratorEnvironment.java| 45 1 file changed, 37 insertions(+), 8 deletions(-) -- http://git-wip-us.apache.org/repos/asf/accumulo-wikisearch/blob/e51ad6a2/query/src/main/java/org/apache/accumulo/examples/wikisearch/iterator/DefaultIteratorEnvironment.java -- diff --git a/query/src/main/java/org/apache/accumulo/examples/wikisearch/iterator/DefaultIteratorEnvironment.java b/query/src/main/java/org/apache/accumulo/examples/wikisearch/iterator/DefaultIteratorEnvironment.java index d37751e..6783efe 100644 --- a/query/src/main/java/org/apache/accumulo/examples/wikisearch/iterator/DefaultIteratorEnvironment.java +++ b/query/src/main/java/org/apache/accumulo/examples/wikisearch/iterator/DefaultIteratorEnvironment.java @@ -16,26 +16,25 @@ */ package org.apache.accumulo.examples.wikisearch.iterator; -import java.io.IOException; - -import org.apache.accumulo.core.client.impl.BaseIteratorEnvironment; import org.apache.accumulo.core.conf.AccumuloConfiguration; +import org.apache.accumulo.core.client.sample.SamplerConfiguration; import org.apache.accumulo.core.data.Key; import org.apache.accumulo.core.data.Value; +import org.apache.accumulo.core.iterators.IteratorEnvironment; import org.apache.accumulo.core.iterators.SortedKeyValueIterator; import org.apache.accumulo.core.iterators.system.MapFileIterator; import org.apache.accumulo.core.util.CachedConfiguration; import org.apache.hadoop.conf.Configuration; 
import org.apache.hadoop.fs.FileSystem; +import org.apache.accumulo.core.security.Authorizations; +import org.apache.accumulo.core.iterators.IteratorUtil.IteratorScope; + +import java.io.IOException; -public class DefaultIteratorEnvironment extends BaseIteratorEnvironment { +public class DefaultIteratorEnvironment implements IteratorEnvironment { AccumuloConfiguration conf; - public DefaultIteratorEnvironment(AccumuloConfiguration conf) { -this.conf = conf; - } - public DefaultIteratorEnvironment() { this.conf = AccumuloConfiguration.getDefaultConfiguration(); } @@ -56,4 +55,34 @@ public class DefaultIteratorEnvironment extends BaseIteratorEnvironment { public boolean isSamplingEnabled() { return false; } + + @Override + public IteratorScope getIteratorScope() { +throw new UnsupportedOperationException(); + } + + @Override + public boolean isFullMajorCompaction() { +throw new UnsupportedOperationException(); + } + + @Override + public void registerSideChannel(SortedKeyValueIterator iter) { +throw new UnsupportedOperationException(); + } + + @Override + public Authorizations getAuthorizations() { +throw new UnsupportedOperationException(); + } + + @Override + public SamplerConfiguration getSamplerConfiguration() { +throw new UnsupportedOperationException(); + } + + @Override + public IteratorEnvironment cloneWithSamplingEnabled() { +throw new UnsupportedOperationException(); + } }