http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/data/twm.adm ---------------------------------------------------------------------- diff --git a/docs/0.9.0/data/twm.adm b/docs/0.9.0/data/twm.adm new file mode 100644 index 0000000..fa764af --- /dev/null +++ b/docs/0.9.0/data/twm.adm @@ -0,0 +1,12 @@ +{"tweetid":"1","user":{"screen-name":"NathanGiesen@211","lang":"en","friends_count":39339,"statuses_count":473,"name":"Nathan Giesen","followers_count":49416},"sender-location":point("47.44,80.65"),"send-time":datetime("2008-04-26T10:10:00"),"referred-topics":{{"t-mobile","customization"}},"message-text":" love t-mobile its customization is good:)"} +{"tweetid":"2","user":{"screen-name":"ColineGeyer@63","lang":"en","friends_count":121,"statuses_count":362,"name":"Coline Geyer","followers_count":17159},"sender-location":point("32.84,67.14"),"send-time":datetime("2010-05-13T10:10:00"),"referred-topics":{{"verizon","shortcut-menu"}},"message-text":" like verizon its shortcut-menu is awesome:)"} +{"tweetid":"3","user":{"screen-name":"NathanGiesen@211","lang":"en","friends_count":39339,"statuses_count":473,"name":"Nathan Giesen","followers_count":49416},"sender-location":point("29.72,75.8"),"send-time":datetime("2006-11-04T10:10:00"),"referred-topics":{{"motorola","speed"}},"message-text":" like motorola the speed is good:)"} +{"tweetid":"4","user":{"screen-name":"NathanGiesen@211","lang":"en","friends_count":39339,"statuses_count":473,"name":"Nathan Giesen","followers_count":49416},"sender-location":point("39.28,70.48"),"send-time":datetime("2011-12-26T10:10:00"),"referred-topics":{{"sprint","voice-command"}},"message-text":" like sprint the voice-command is mind-blowing:)"} +{"tweetid":"5","user":{"screen-name":"NathanGiesen@211","lang":"en","friends_count":39339,"statuses_count":473,"name":"Nathan Giesen","followers_count":49416},"sender-location":point("40.09,92.69"),"send-time":datetime("2006-08-04T10:10:00"),"referred-topics":{{"motorola","speed"}},"message-text":" can't stand motorola its speed is terrible:("} +{"tweetid":"6","user":{"screen-name":"ColineGeyer@63","lang":"en","friends_count":121,"statuses_count":362,"name":"Coline Geyer","followers_count":17159},"sender-location":point("47.51,83.99"),"send-time":datetime("2010-05-07T10:10:00"),"referred-topics":{{"iphone","voice-clarity"}},"message-text":" like iphone the voice-clarity is good:)"} +{"tweetid":"7","user":{"screen-name":"ChangEwing_573","lang":"en","friends_count":182,"statuses_count":394,"name":"Chang Ewing","followers_count":32136},"sender-location":point("36.21,72.6"),"send-time":datetime("2011-08-25T10:10:00"),"referred-topics":{{"samsung","platform"}},"message-text":" like samsung the platform is good"} +{"tweetid":"8","user":{"screen-name":"NathanGiesen@211","lang":"en","friends_count":39339,"statuses_count":473,"name":"Nathan Giesen","followers_count":49416},"sender-location":point("46.05,93.34"),"send-time":datetime("2005-10-14T10:10:00"),"referred-topics":{{"t-mobile","shortcut-menu"}},"message-text":" like t-mobile the shortcut-menu is awesome:)"} +{"tweetid":"9","user":{"screen-name":"NathanGiesen@211","lang":"en","friends_count":39339,"statuses_count":473,"name":"Nathan Giesen","followers_count":49416},"sender-location":point("36.86,74.62"),"send-time":datetime("2012-07-21T10:10:00"),"referred-topics":{{"verizon","voicemail-service"}},"message-text":" love verizon its voicemail-service is awesome"} +{"tweetid":"10","user":{"screen-name":"ColineGeyer@63","lang":"en","friends_count":121,"statuses_count":362,"name":"Coline Geyer","followers_count":17159},"sender-location":point("29.15,76.53"),"send-time":datetime("2008-01-26T10:10:00"),"referred-topics":{{"verizon","voice-clarity"}},"message-text":" hate verizon its voice-clarity is OMG:("} +{"tweetid":"11","user":{"screen-name":"NilaMilliron_tw","lang":"en","friends_count":445,"statuses_count":164,"name":"Nila Milliron","followers_count":22649},"sender-location":point("37.59,68.42"),"send-time":datetime("2008-03-09T10:10:00"),"referred-topics":{{"iphone","platform"}},"message-text":" can't stand iphone its platform is terrible"} +{"tweetid":"12","user":{"screen-name":"OliJackson_512","lang":"en","friends_count":445,"statuses_count":164,"name":"Oli Jackson","followers_count":22649},"sender-location":point("24.82,94.63"),"send-time":datetime("2010-02-13T10:10:00"),"referred-topics":{{"samsung","voice-command"}},"message-text":" like samsung the voice-command is amazing:)"}
http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/data/twu.adm ---------------------------------------------------------------------- diff --git a/docs/0.9.0/data/twu.adm b/docs/0.9.0/data/twu.adm new file mode 100644 index 0000000..32a1917 --- /dev/null +++ b/docs/0.9.0/data/twu.adm @@ -0,0 +1,4 @@ +{"screen-name":"NathanGiesen@211","lang":"en","friends_count":18,"statuses_count":473,"name":"Nathan Giesen","followers_count":49416} +{"screen-name":"ColineGeyer@63","lang":"en","friends_count":121,"statuses_count":362,"name":"Coline Geyer","followers_count":17159} +{"screen-name":"NilaMilliron_tw","lang":"en","friends_count":445,"statuses_count":164,"name":"Nila Milliron","followers_count":22649} +{"screen-name":"ChangEwing_573","lang":"en","friends_count":182,"statuses_count":394,"name":"Chang Ewing","followers_count":32136} http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/datamodel.html ---------------------------------------------------------------------- diff --git a/docs/0.9.0/datamodel.html b/docs/0.9.0/datamodel.html new file mode 100644 index 0000000..e835a73 --- /dev/null +++ b/docs/0.9.0/datamodel.html @@ -0,0 +1,883 @@ +<!DOCTYPE html> +<!-- + | Generated by Apache Maven Doxia at 2017-01-24 + | Rendered using Apache Maven Fluido Skin 1.3.0 +--> +<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en"> + <head> + <meta charset="UTF-8" /> + <meta name="viewport" content="width=device-width, initial-scale=1.0" /> + <meta name="Date-Revision-yyyymmdd" content="20170124" /> + <meta http-equiv="Content-Language" content="en" /> + <title>AsterixDB – The Asterix Data Model (ADM)</title> + <link rel="stylesheet" href="./css/apache-maven-fluido-1.3.0.min.css" /> + <link rel="stylesheet" href="./css/site.css" /> + <link rel="stylesheet" href="./css/print.css" media="print" /> + + + <script type="text/javascript" src="./js/apache-maven-fluido-1.3.0.min.js"></script> + + + +<script>(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){ + (i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o), + m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m) + })(window,document,'script','//www.google-analytics.com/analytics.js','ga'); + + ga('create', 'UA-41536543-1', 'uci.edu'); + ga('send', 'pageview');</script> + + </head> + <body class="topBarDisabled"> + + + + + <div class="container-fluid"> + <div id="banner"> + <div class="pull-left"> + <a href="./" id="bannerLeft"> + <img src="images/asterixlogo.png" alt="AsterixDB"/> + </a> + </div> + <div class="pull-right"> </div> + <div class="clear"><hr/></div> + </div> + + <div id="breadcrumbs"> + <ul class="breadcrumb"> + + + <li id="publishDate">Last Published: 2017-01-24</li> + + + + <li id="projectVersion" class="pull-right">Version: 0.9.0</li> + + <li class="divider pull-right">|</li> + + <li class="pull-right"> <a href="index.html" title="Documentation Home"> + Documentation Home</a> + </li> + + </ul> + </div> + + + <div class="row-fluid"> + <div id="leftColumn" class="span3"> + <div class="well sidebar-nav"> + + + <ul class="nav nav-list"> + <li class="nav-header">Get Started - Installation</li> + + <li> + + <a href="ncservice.html" title="Option 1: using NCService"> + <i class="none"></i> + Option 1: using NCService</a> + </li> + + <li> + + <a href="install.html" title="Option 2: using Managix"> + <i class="none"></i> + Option 2: using Managix</a> + </li> + + <li> + + <a href="yarn.html" title="Option 3: using YARN"> + <i class="none"></i> + Option 3: using YARN</a> + </li> + <li class="nav-header">AsterixDB Primer</li> + + <li> + + <a href="sqlpp/primer-sqlpp.html" title="Option 1: using SQL++"> + <i class="none"></i> + Option 1: using SQL++</a> + </li> + + <li> + + <a href="aql/primer.html" title="Option 2: using AQL"> + <i class="none"></i> + Option 2: using AQL</a> + </li> + <li class="nav-header">Data Model</li> + + <li class="active"> + + <a href="#"><i class="none"></i>The Asterix Data Model</a> + </li> + <li class="nav-header">Queries - SQL++</li> + + <li> + + <a href="sqlpp/manual.html" title="The SQL++ Query Language"> + <i class="none"></i> + The SQL++ Query Language</a> + </li> + + <li> + + <a href="sqlpp/builtins.html" title="Builtin Functions"> + <i class="none"></i> + Builtin Functions</a> + </li> + <li class="nav-header">Queries - AQL</li> + + <li> + + <a href="aql/manual.html" title="The Asterix Query Language (AQL)"> + <i class="none"></i> + The Asterix Query Language (AQL)</a> + </li> + + <li> + + <a href="aql/builtins.html" title="Builtin Functions"> + <i class="none"></i> + Builtin Functions</a> + </li> + <li class="nav-header">Advanced Features</li> + + <li> + + <a href="aql/similarity.html" title="Support of Similarity Queries"> + <i class="none"></i> + Support of Similarity Queries</a> + </li> + + <li> + + <a href="aql/fulltext.html" title="Support of Full-text Queries"> + <i class="none"></i> + Support of Full-text Queries</a> + </li> + + <li> + + <a href="aql/externaldata.html" title="Accessing External Data"> + <i class="none"></i> + Accessing External Data</a> + </li> + + <li> + + <a href="feeds/tutorial.html" title="Support for Data Ingestion"> + <i class="none"></i> + Support for Data Ingestion</a> + </li> + + <li> + + <a href="udf.html" title="User Defined Functions"> + <i class="none"></i> + User Defined Functions</a> + </li> + + <li> + + <a href="aql/filters.html" title="Filter-Based LSM Index Acceleration"> + <i class="none"></i> + Filter-Based LSM Index Acceleration</a> + </li> + <li class="nav-header">API/SDK</li> + + <li> + + <a href="api.html" title="HTTP API"> + <i class="none"></i> + HTTP API</a> + </li> + </ul> + + + + <hr class="divider" /> + + <div id="poweredBy"> + <div class="clear"></div> + <div class="clear"></div> + <div class="clear"></div> + <a href="./" title="AsterixDB" class="builtBy"> + <img class="builtBy" alt="AsterixDB" src="images/asterixlogo.png" /> + </a> + </div> + </div> + </div> + + + <div id="bodyColumn" class="span9" > + + <!-- ! Licensed to the Apache Software Foundation (ASF) under one + ! or more contributor license agreements. See the NOTICE file + ! distributed with this work for additional information + ! regarding copyright ownership. The ASF licenses this file + ! to you under the Apache License, Version 2.0 (the + ! "License"); you may not use this file except in compliance + ! with the License. You may obtain a copy of the License at + ! + ! http://www.apache.org/licenses/LICENSE-2.0 + ! + ! Unless required by applicable law or agreed to in writing, + ! software distributed under the License is distributed on an + ! "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + ! KIND, either express or implied. See the License for the + ! specific language governing permissions and limitations + ! under the License. + ! --><h1>The Asterix Data Model (ADM)</h1> +<div class="section"> +<h2><a name="Table_of_Contents"></a><a name="toc" id="toc">Table of Contents</a></h2> + +<ul> + +<li><a href="#PrimitiveTypes">Primitive Types</a> + +<ul> + +<li><a href="#PrimitiveTypesBoolean">Boolean</a></li> + +<li><a href="#PrimitiveTypesInt">Tinyint / Smallint / Integer (Int) / Bigint</a></li> + +<li><a href="#PrimitiveTypesFloat">Float</a></li> + +<li><a href="#PrimitiveTypesDouble">Double (Double Precision)</a></li> + +<li><a href="#PrimitiveTypesString">String</a></li> + +<li><a href="#PrimitiveTypesBinary">Binary</a></li> + +<li><a href="#PrimitiveTypesPoint">Point</a></li> + +<li><a href="#PrimitiveTypesLine">Line</a></li> + +<li><a href="#PrimitiveTypesRectangle">Rectangle</a></li> + +<li><a href="#PrimitiveTypesCircle">Circle</a></li> + +<li><a href="#PrimitiveTypesPolygon">Polygon</a></li> + +<li><a href="#PrimitiveTypesDate">Date</a></li> + +<li><a href="#PrimitiveTypesTime">Time</a></li> + +<li><a href="#PrimitiveTypesDateTime">Datetime (Timestamp)</a></li> + +<li><a href="#PrimitiveTypesDuration">Duration/Year_month_duration/Day_time_duration</a></li> + +<li><a href="#PrimitiveTypesInterval">Interval</a></li> + +<li><a href="#PrimitiveTypesUUID">UUID</a></li> + </ul></li> + +<li><a href="#IncompleteInformationTypesTypes">Incomplete Information Types</a> + +<ul> + +<li><a href="#IncompleteInformationTypesNull">Null</a></li> + +<li><a href="#IncompleteInformationTypesMissing">Missing</a></li> + </ul></li> + +<li><a href="#DerivedTypes">Derived Types</a> + +<ul> + +<li><a href="#DerivedTypesObject">Object</a></li> + +<li><a href="#DerivedTypesArray">Array</a></li> + +<li><a href="#DerivedTypesMultiset">Multiset</a></li> + </ul></li> +</ul> +<p>An instance of Asterix data model (ADM) can be a <i><i>primitive type</i></i> (<tt>boolean</tt>, <tt>tinyint</tt>, <tt>smallint</tt>, <tt>integer</tt>, <tt>bigint</tt>, <tt>string</tt>, <tt>float</tt>, <tt>double</tt>, <tt>date</tt>, <tt>time</tt>, <tt>datetime</tt>, etc.), a <i><i>special type</i></i> (<tt>null</tt> or <tt>missing</tt>), or a <i><i>derived type</i></i>.</p> +<p>The type names are case-insensitive, e.g., both <tt>BIGINT</tt> and <tt>bigint</tt> are acceptable.</p></div> +<div class="section"> +<h2><a name="Primitive_Types"></a><a name="PrimitiveTypes" id="PrimitiveTypes">Primitive Types</a></h2> +<div class="section"> +<h3><a name="Boolean"></a><a name="PrimitiveTypesBoolean" id="PrimitiveTypesBoolean">Boolean</a></h3> +<p><tt>boolean</tt> data type can have one of the two values: <i><i>true</i></i> or <i><i>false</i></i>.</p> + +<ul> + +<li> +<p>Example:</p> + +<div class="source"> +<div class="source"> +<pre>{ "true": true, "false": false }; +</pre></div></div></li> +</ul> + +<ul> + +<li> +<p>The expected result is:</p> + +<div class="source"> +<div class="source"> +<pre>{ "true": true, "false": false } +</pre></div></div></li> +</ul></div> +<div class="section"> +<h3><a name="Tinyint__Smallint__Integer_Int__Bigint"></a><a name="PrimitiveTypesInt" id="PrimitiveTypesInt">Tinyint / Smallint / Integer (Int) / Bigint</a></h3> +<p>Integer types using 8, 16, 32, or 64 bits. The ranges of these types are:</p> + +<ul> + +<li><tt>tinyint</tt>: -127 to 127</li> + +<li><tt>smallint</tt>: -32767 to 32767</li> + +<li><tt>integer</tt>: -2147483647 to 2147483647</li> + +<li><tt>bigint</tt>: -9223372036854775808 to 9223372036854775807</li> +</ul> +<p><tt>int</tt> is an abbreviated alias for integer.</p> + +<ul> + +<li> +<p>Example:</p> + +<div class="source"> +<div class="source"> +<pre>{ "tinyint": tiny("125"), "smallint": smallint("32765"), "integer": 294967295, "bigint": bigint("1700000000000000000")}; +</pre></div></div></li> +</ul> + +<ul> + +<li> +<p>The expected result is:</p> + +<div class="source"> +<div class="source"> +<pre>{ "tinyint": 125, "smallint": 32765, "integer": 294967295, "bigint": 17000000 } +</pre></div></div></li> +</ul></div> +<div class="section"> +<h3><a name="Float"></a><a name="PrimitiveTypesFloat" id="PrimitiveTypesFloat">Float</a></h3> +<p><tt>float</tt> represents approximate numeric data values using 4 bytes. The range of a float value can be from 2^(-149) to (2-2^(-23)·2^(127) for both positive and negative. Beyond these ranges will get <tt>INF</tt> or <tt>-INF</tt>.</p> + +<ul> + +<li> +<p>Example:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": float("NaN"), "v2": float("INF"), "v3": float("-INF"), "v4": float("-2013.5") }; +</pre></div></div></li> +</ul> + +<ul> + +<li> +<p>The expected result is:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": NaN, "v2": Infinity, "v3": -Infinity, "v4": -2013.5 } +</pre></div></div></li> +</ul></div> +<div class="section"> +<h3><a name="Double_double_precision"></a><a name="PrimitiveTypesDouble" id="PrimitiveTypesDouble">Double (double precision)</a></h3> +<p><tt>double</tt> represents approximate numeric data values using 8 bytes. The range of a double value can be from (2^(-1022)) to (2-2^(-52))·2^(1023) for both positive and negative. Beyond these ranges will get <tt>INF</tt> or <tt>-INF</tt>.</p> + +<ul> + +<li> +<p>Example:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": double("NaN"), "v2": double("INF"), "v3": double("-INF"), "v4": "-2013.593823748327284" }; +</pre></div></div></li> +</ul> + +<ul> + +<li> +<p>The expected result is:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": NaN, "v2": Infinity, "v3": -Infinity, "v4": -2013.5938237483274 } +</pre></div></div></li> +</ul> +<p><tt>Double precision</tt> is an alias of <tt>double</tt>.</p></div> +<div class="section"> +<h3><a name="String"></a><a name="PrimitiveTypesString" id="PrimitiveTypesString">String</a></h3> +<p><tt>string</tt> represents a sequence of characters. The total length of the sequence can be up to 2,147,483,648.</p> + +<ul> + +<li> +<p>Example:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": string("This is a string."), "v2": string("\"This is a quoted string\"") }; +</pre></div></div></li> +</ul> + +<ul> + +<li> +<p>The expected result is:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": "This is a string.", "v2": "\"This is a quoted string\"" } +</pre></div></div></li> +</ul></div> +<div class="section"> +<h3><a name="Binary"></a><a name="PrimitiveTypesBinary" id="PrimitiveTypesBinary">Binary</a></h3> +<p><tt>binary</tt> represents a sequence of bytes. It can be constructed from a <tt>hex</tt> or a <tt>base64</tt> string sequence. The total length of the byte sequence can be up to 2,147,483,648.</p> + +<ul> + +<li> +<p>Example:</p> + +<div class="source"> +<div class="source"> +<pre>{ + "hex1" : hex("ABCDEF0123456789"), + "hex2": hex("abcdef0123456789"), + "base64_1" : base64("0123456789qwertyui+/"), + "base64_2" : base64('QXN0ZXJpeA==') +}; +</pre></div></div></li> + +<li> +<p>The default output format is in <tt>hex</tt> format. Thus, the expected result is:</p> + +<div class="source"> +<div class="source"> +<pre>{ + "hex1": hex("ABCDEF0123456789"), + "hex2": hex("ABCDEF0123456789"), + "base64_1": hex("D35DB7E39EBBF3DAB07ABB72BA2FBF"), + "base64_2": hex("41737465726978") +} +</pre></div></div></li> +</ul></div> +<div class="section"> +<h3><a name="Point"></a><a name="PrimitiveTypesPoint" id="PrimitiveTypesPoint">Point</a></h3> +<p><tt>point</tt> is the fundamental two-dimensional building block for spatial types. It consists of two <tt>double</tt> coordinates x and y.</p> + +<ul> + +<li> +<p>Example:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": point("80.10d, -10E5"), "v2": point("5.10E-10d, -10E5") }; +</pre></div></div></li> +</ul> + +<ul> + +<li> +<p>The expected result is:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": point("80.1,-1000000.0"), "v2": point("5.1E-10,-1000000.0") } +</pre></div></div></li> +</ul></div> +<div class="section"> +<h3><a name="Line"></a><a name="PrimitiveTypesLine" id="PrimitiveTypesLine">Line</a></h3> +<p><tt>line</tt> consists of two points that represent the start and the end points of a line segment.</p> + +<ul> + +<li> +<p>Example:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": line("10.1234,11.1e-1 +10.2E-2,-11.22"), "v2": line("0.1234,-1.00e-10 +10.5E-2,-01.02") }; +</pre></div></div></li> +</ul> + +<ul> + +<li> +<p>The expected result is:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": line("10.1234,1.11 0.102,-11.22"), "v2": line("0.1234,-1.0E-10 0.105,-1.02") } +</pre></div></div></li> +</ul></div> +<div class="section"> +<h3><a name="Rectangle"></a><a name="PrimitiveTypesRectangle" id="PrimitiveTypesRectangle">Rectangle</a></h3> +<p><tt>rectangle</tt> consists of two points that represent the <i><i>bottom left</i></i> and <i><i>upper right</i></i> corners of a rectangle.</p> + +<ul> + +<li> +<p>Example:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": rectangle("5.1,11.8 87.6,15.6548"), "v2": rectangle("0.1234,-1.00e-10 5.5487,0.48765") }; +</pre></div></div></li> +</ul> + +<ul> + +<li> +<p>The expected result is:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": rectangle("5.1,11.8 87.6,15.6548"), "v2": rectangle("0.1234,-1.0E-10 5.5487,0.48765") } +</pre></div></div></li> +</ul></div> +<div class="section"> +<h3><a name="Circle"></a><a name="PrimitiveTypesCircle" id="PrimitiveTypesCircle">Circle</a></h3> +<p><tt>circle</tt> consists of one point that represents the center of the circle and a radius of type <tt>double</tt>.</p> + +<ul> + +<li> +<p>Example:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": circle("10.1234,11.1e-1 +10.2E-2"), "v2": circle("0.1234,-1.00e-10 +10.5E-2") }; +</pre></div></div></li> +</ul> + +<ul> + +<li> +<p>The expected result is:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": circle("10.1234,1.11 0.102"), "v2": circle("0.1234,-1.0E-10 0.105") } +</pre></div></div></li> +</ul></div> +<div class="section"> +<h3><a name="Polygon"></a><a name="PrimitiveTypesPolygon" id="PrimitiveTypesPolygon">Polygon</a></h3> +<p><tt>polygon</tt> consists of <i><i>n</i></i> points that represent the vertices of a <i><i>simple closed</i></i> polygon.</p> + +<ul> + +<li> +<p>Example:</p> + +<div class="source"> +<div class="source"> +<pre>{ + "v1": polygon("-1.2,+1.3e2 -2.14E+5,2.15 -3.5e+2,03.6 -4.6E-3,+4.81"), + "v2": polygon("-1.0,+10.5e2 -02.15E+50,2.5 -1.0,+3.3e3 -2.50E+05,20.15 +3.5e+2,03.6 -4.60E-3,+4.75 -2,+1.0e2 -2.00E+5,20.10 30.5,03.25 -4.33E-3,+4.75") +}; +</pre></div></div></li> +</ul> + +<ul> + +<li> +<p>The expected result is:</p> + +<div class="source"> +<div class="source"> +<pre>{ + "v1": polygon("-1.2,130.0 -214000.0,2.15 -350.0,3.6 -0.0046,4.81"), + "v2": polygon("-1.0,1050.0 -2.15E50,2.5 -1.0,3300.0 -250000.0,20.15 350.0,3.6 -0.0046,4.75 -2.0,100.0 -200000.0,20.1 30.5,3.25 -0.00433,4.75") } +} +</pre></div></div></li> +</ul></div> +<div class="section"> +<h3><a name="Date"></a><a name="PrimitiveTypesDate" id="PrimitiveTypesDate">Date</a></h3> +<p><tt>date</tt> represents a time point along the Gregorian calendar system specified by the year, month and day. ASTERIX supports the date from <tt>-9999-01-01</tt> to <tt>9999-12-31</tt>.</p> +<p>A date value can be represented in two formats, extended format and basic format.</p> + +<ul> + +<li>Extended format is represented as <tt>[-]yyyy-mm-dd</tt> for <tt>year-month-day</tt>. Each field should be padded if there are less digits than the format specified.</li> + +<li>Basic format is in the format of <tt>[-]yyyymmdd</tt>.</li> + +<li> +<p>Example:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": date("2013-01-01"), "v2": date("-19700101") }; +</pre></div></div></li> +</ul> + +<ul> + +<li> +<p>The expected result is:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": date("2013-01-01"), "v2": date("-1970-01-01") } +</pre></div></div></li> +</ul></div> +<div class="section"> +<h3><a name="Time"></a><a name="PrimitiveTypesTime" id="PrimitiveTypesTime">Time</a></h3> +<p><tt>time</tt> type describes the time within the range of a day. It is represented by three fields: hour, minute and second. Millisecond field is optional as the fraction of the second field. Its extended format is as <tt>hh:mm:ss[.mmm]</tt> and the basic format is <tt>hhmmss[mmm]</tt>. The value domain is from <tt>00:00:00.000</tt> to <tt>23:59:59.999</tt>.</p> +<p>Timezone field is optional for a time value. Timezone is represented as <tt>[+|-]hh:mm</tt> for extended format or <tt>[+|-]hhmm</tt> for basic format. Note that the sign designators cannot be omitted. <tt>Z</tt> can also be used to represent the UTC local time. If no timezone information is given, it is UTC by default.</p> + +<ul> + +<li> +<p>Example:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": time("12:12:12.039Z"), "v2": time("000000000-0800") }; +</pre></div></div></li> +</ul> + +<ul> + +<li> +<p>The expected result is:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": time("12:12:12.039Z"), "v2": time("08:00:00.000Z") } +</pre></div></div></li> +</ul></div> +<div class="section"> +<h3><a name="Datetime_Timestamp"></a><a name="PrimitiveTypesDateTime" id="PrimitiveTypesDateTime">Datetime (Timestamp)</a></h3> +<p>A <tt>datetime</tt> value is a combination of an <tt>date</tt> and <tt>time</tt>, representing a fixed time point along the Gregorian calendar system. The value is among <tt>-9999-01-01 00:00:00.000</tt> and <tt>9999-12-31 23:59:59.999</tt>.</p> +<p>A <tt>datetime</tt> value is represented as a combination of the representation of its <tt>date</tt> part and <tt>time</tt> part, separated by a separator <tt>T</tt>. Either extended or basic format can be used, and the two parts should be the same format.</p> +<p>Millisecond field and timezone field are optional, as specified in the <tt>time</tt> type.</p> + +<ul> + +<li> +<p>Example:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": datetime("2013-01-01T12:12:12.039Z"), "v2": datetime("-19700101T000000000-0800") }; +</pre></div></div></li> +</ul> + +<ul> + +<li> +<p>The expected result is:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": datetime("2013-01-01T12:12:12.039Z"), "v2": datetime("-1970-01-01T08:00:00.000Z") } +</pre></div></div></li> +</ul> +<p><tt>timestamp</tt> is an alias of <tt>datetime</tt>.</p></div> +<div class="section"> +<h3><a name="DurationYear_month_durationDay_time_duration"></a><a name="PrimitiveTypesDuration" id="PrimitiveTypesDuration">Duration/Year_month_duration/Day_time_duration</a></h3> +<p><tt>duration</tt> represents a duration of time. A duration value is specified by integers on at least one of the following fields: year, month, day, hour, minute, second, and millisecond.</p> +<p>A duration value is in the format of <tt>[-]PnYnMnDTnHnMn.mmmS</tt>. The millisecond part (as the fraction of the second field) is optional, and when no millisecond field is used, the decimal point should also be absent.</p> +<p>Negative durations are also supported for the arithmetic operations between time instance types (<tt>date</tt>, <tt>time</tt> and <tt>datetime</tt>), and is used to roll the time back for the given duration. For example <tt>date("2012-01-01") + duration("-P3D")</tt> will return <tt>date("2011-12-29")</tt>.</p> +<p>There are also two sub-duration types, namely <tt>year_month_duration</tt> and <tt>day_time_duration</tt>. <tt>year_month_duration</tt> represents only the years and months of a duration, while <tt>day_time_duration</tt> represents only the day to millisecond fields. Different from the <tt>duration</tt> type, both these two subtypes are totally ordered, so they can be used for comparison and index construction.</p> +<p>Note that a canonical representation of the duration is always returned, regardless whether the duration is in the canonical representation or not from the user’s input. More information about canonical representation can be found from <a class="externalLink" href="http://www.w3.org/TR/xpath-functions/#canonical-dayTimeDuration">XPath dayTimeDuration Canonical Representation</a> and <a class="externalLink" href="http://www.w3.org/TR/xpath-functions/#canonical-yearMonthDuration">yearMonthDuration Canonical Representation</a>.</p> + +<ul> + +<li> +<p>Example:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": duration("P100Y12MT12M"), "v2": duration("-PT20.943S") }; +</pre></div></div></li> +</ul> + +<ul> + +<li> +<p>The expected result is:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": duration("P101YT12M"), "v2": duration("-PT20.943S") } +</pre></div></div></li> +</ul></div> +<div class="section"> +<h3><a name="Interval"></a><a name="PrimitiveTypesInterval" id="PrimitiveTypesInterval">Interval</a></h3> +<p><tt>interval</tt> represents inclusive-exclusive ranges of time. It is defined by two time point values with the same temporal type(<tt>date</tt>, <tt>time</tt> or <tt>datetime</tt>).</p> + +<ul> + +<li> +<p>Example:</p> + +<div class="source"> +<div class="source"> +<pre>{ + "v1": interval(date("2013-01-01"), date("20130505")), + "v2": interval(time("00:01:01"), time("213901049+0800")), + "v3": interval(datetime("2013-01-01T00:01:01"), datetime("20130505T213901049+0800")) +}; +</pre></div></div></li> +</ul> + +<ul> + +<li> +<p>The expected result is:</p> + +<div class="source"> +<div class="source"> +<pre>{ + "v1": interval(date("2013-01-01"), date("2013-05-05")), + "v2": interval(time("00:01:01.000Z"), time("13:39:01.049Z")), + "v3": interval(datetime("2013-01-01T00:01:01.000Z"), datetime("2013-05-05T13:39:01.049Z")) +} +</pre></div></div></li> +</ul></div> +<div class="section"> +<h3><a name="UUID"></a><a name="PrimitiveTypesUUID" id="PrimitiveTypesUUID">UUID</a></h3> +<p><tt>uuid</tt> represents a UUID value, which stands for Universally unique identifier. It is defined by a canonical format using hexadecimal text with inserted hyphen characters. (E.g.: 5a28ce1e-6a74-4201-9e8f-683256e5706f). This type is generally used to store auto-generated primary key values.</p> + +<ul> + +<li> +<p>Example:</p> + +<div class="source"> +<div class="source"> +<pre>return { "v1":uuid("5c848e5c-6b6a-498f-8452-8847a2957421") } +</pre></div></div></li> +</ul> + +<ul> + +<li> +<p>The expected result is:</p> + +<div class="source"> +<div class="source"> +<pre>{ "v1": uuid("5c848e5c-6b6a-498f-8452-8847a2957421") } +</pre></div></div></li> +</ul></div></div> +<div class="section"> +<h2><a name="Incomplete_Information_Types"></a><a name="IncompleteInformationTypes" id="IncompleteInformationTypes">Incomplete Information Types</a></h2> +<div class="section"> +<h3><a name="Null"></a><a name="IncompleteInformationTypesNull" id="IncompleteInformationTypesNull">Null</a></h3> +<p><tt>null</tt> is a special value that is often used to represent an unknown value. For example, a user might not be able to know the value of a field and let it be <tt>null</tt>.</p> + +<ul> + +<li> +<p>Example:</p> + +<div class="source"> +<div class="source"> +<pre>{ "field": null }; +</pre></div></div></li> +</ul> + +<ul> + +<li> +<p>The expected result is:</p> + +<div class="source"> +<div class="source"> +<pre>{ "field": null } +</pre></div></div></li> +</ul></div> +<div class="section"> +<h3><a name="Missing"></a><a name="IncompleteInformationTypesMissing" id="IncompleteInformationTypesMissing">Missing</a></h3> +<p><tt>missing</tt> represents a missing name-value pair in a object. If the referenced field does not exist, an empty result value is returned by the query.</p> +<p>As neither the data model nor the system enforces homogeneity for datasets or collections, items in a dataset or collection can be of heterogeneous types and so a field can be present in one object and <tt>missing</tt> in another.</p> + +<ul> + +<li> +<p>Example:</p> + +<div class="source"> +<div class="source"> +<pre>{ "field": missing }; +</pre></div></div></li> +</ul> + +<ul> + +<li> +<p>The expected result is:</p> + +<div class="source"> +<div class="source"> +<pre>{ } +</pre></div></div></li> +</ul> +<p>Since a field with value <tt>missing</tt> means the field is absent, we get an empty object.</p></div></div> +<div class="section"> +<h2><a name="Derived_Types"></a><a name="DerivedTypes" id="DerivedTypes">Derived Types</a></h2> +<div class="section"> +<h3><a name="Object"></a><a name="DerivedTypesObject" id="DerivedTypesObject">Object</a></h3> +<p>A <tt>object</tt> contains a set of fields, where each field is described by its name and type. A object type is either open or closed. Open objects can contain fields that are not part of the type definition, while closed objects cannot. Syntactically, object constructors are surrounded by curly braces “{…}”.</p> +<p>An example would be</p> + +<div class="source"> +<div class="source"> +<pre> { "id": 213508, "name": "Alice Bob" } +</pre></div></div></div> +<div class="section"> +<h3><a name="Array"></a><a name="DerivedTypesArray" id="DerivedTypesArray">Array</a></h3> +<p>An <tt>array</tt> is a container that holds a fixed number of values. Array constructors are denoted by brackets: “[…]”.</p> +<p>An example would be</p> + +<div class="source"> +<div class="source"> +<pre> ["alice", 123, "bob", null] +</pre></div></div></div> +<div class="section"> +<h3><a name="Multiset"></a><a name="DerivedTypesMultiset" id="DerivedTypesMultiset">Multiset</a></h3> +<p>A <tt>multiset</tt> is a generalization of the concept of a set that, unlike a set, allows multiple instances of the multiset’s elements. Multiset constructors are denoted by two opening curly braces followed by data and two closing curly braces, like “{{…}}”.</p> +<p>An example would be</p> + +<div class="source"> +<div class="source"> +<pre> {{"hello", 9328, "world", [1, 2, null]}} +</pre></div></div></div></div> + </div> + </div> + </div> + + <hr/> + + <footer> + <div class="container-fluid"> + <div class="row span12">Copyright © 2017 + <a href="https://www.apache.org/">The Apache Software Foundation</a>. + All Rights Reserved. + + </div> + + <?xml version="1.0" encoding="UTF-8"?> +<div class="row-fluid">Apache AsterixDB, AsterixDB, Apache, the Apache + feather logo, and the Apache AsterixDB project logo are either + registered trademarks or trademarks of The Apache Software + Foundation in the United States and other countries. + All other marks mentioned may be trademarks or registered + trademarks of their respective owners.</div> + + + </div> + </footer> + </body> +</html> http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/feeds/tutorial.html ---------------------------------------------------------------------- diff --git a/docs/0.9.0/feeds/tutorial.html b/docs/0.9.0/feeds/tutorial.html new file mode 100644 index 0000000..337391a --- /dev/null +++ b/docs/0.9.0/feeds/tutorial.html @@ -0,0 +1,442 @@ +<!DOCTYPE html> +<!-- + | Generated by Apache Maven Doxia at 2017-01-24 + | Rendered using Apache Maven Fluido Skin 1.3.0 +--> +<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en"> + <head> + <meta charset="UTF-8" /> + <meta name="viewport" content="width=device-width, initial-scale=1.0" /> + <meta name="Date-Revision-yyyymmdd" content="20170124" /> + <meta http-equiv="Content-Language" content="en" /> + <title>AsterixDB – Support for Data Ingestion in AsterixDB</title> + <link rel="stylesheet" href="../css/apache-maven-fluido-1.3.0.min.css" /> + <link rel="stylesheet" href="../css/site.css" /> + <link rel="stylesheet" href="../css/print.css" media="print" /> + + + <script type="text/javascript" src="../js/apache-maven-fluido-1.3.0.min.js"></script> + + + +<script>(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){ + (i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o), + m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m) + })(window,document,'script','//www.google-analytics.com/analytics.js','ga'); + + ga('create', 'UA-41536543-1', 'uci.edu'); + ga('send', 'pageview');</script> + + </head> + <body class="topBarDisabled"> + + + + + <div class="container-fluid"> + <div id="banner"> + <div class="pull-left"> + <a href=".././" id="bannerLeft"> + <img src="../images/asterixlogo.png" alt="AsterixDB"/> + </a> + </div> + <div class="pull-right"> </div> + <div class="clear"><hr/></div> + </div> + + <div id="breadcrumbs"> + <ul class="breadcrumb"> + + + <li id="publishDate">Last Published: 2017-01-24</li> + + + + <li id="projectVersion" class="pull-right">Version: 0.9.0</li> + + <li class="divider pull-right">|</li> + + <li class="pull-right"> <a href="../index.html" title="Documentation Home"> + Documentation Home</a> + </li> + + </ul> + </div> + + + <div class="row-fluid"> + <div id="leftColumn" class="span3"> + <div class="well sidebar-nav"> + + + <ul class="nav nav-list"> + <li class="nav-header">Get Started - Installation</li> + + <li> + + <a href="../ncservice.html" title="Option 1: using NCService"> + <i class="none"></i> + Option 1: using NCService</a> + </li> + + <li> + + <a href="../install.html" title="Option 2: using Managix"> + <i class="none"></i> + Option 2: using Managix</a> + </li> + + <li> + + <a href="../yarn.html" title="Option 3: using YARN"> + <i class="none"></i> + Option 3: using YARN</a> + </li> + <li class="nav-header">AsterixDB Primer</li> + + <li> + + <a href="../sqlpp/primer-sqlpp.html" title="Option 1: using SQL++"> + <i class="none"></i> + Option 1: using SQL++</a> + </li> + + <li> + + <a href="../aql/primer.html" title="Option 2: using AQL"> + <i class="none"></i> + Option 2: using AQL</a> + </li> + <li class="nav-header">Data Model</li> + + <li> + + <a href="../datamodel.html" title="The Asterix Data Model"> + <i class="none"></i> + The Asterix Data Model</a> + </li> + <li class="nav-header">Queries - SQL++</li> + + <li> + + <a href="../sqlpp/manual.html" title="The SQL++ Query Language"> + <i class="none"></i> + The SQL++ Query Language</a> + </li> + + <li> + + <a href="../sqlpp/builtins.html" title="Builtin Functions"> + <i class="none"></i> + Builtin Functions</a> + </li> + <li class="nav-header">Queries - AQL</li> + + <li> + + <a href="../aql/manual.html" title="The Asterix Query Language (AQL)"> + <i class="none"></i> + The Asterix Query Language (AQL)</a> + </li> + + <li> + + <a href="../aql/builtins.html" title="Builtin Functions"> + <i class="none"></i> + Builtin Functions</a> + </li> + <li class="nav-header">Advanced Features</li> + + <li> + + <a href="../aql/similarity.html" title="Support of Similarity Queries"> + <i class="none"></i> + Support of Similarity Queries</a> + </li> + + <li> + + <a href="../aql/fulltext.html" title="Support of Full-text Queries"> + <i class="none"></i> + Support of Full-text Queries</a> + </li> + + <li> + + <a href="../aql/externaldata.html" title="Accessing External Data"> + <i class="none"></i> + Accessing External Data</a> + </li> + + <li class="active"> + + <a href="#"><i class="none"></i>Support for Data Ingestion</a> + </li> + + <li> + + <a href="../udf.html" title="User Defined Functions"> + <i class="none"></i> + User Defined Functions</a> + </li> + + <li> + + <a href="../aql/filters.html" title="Filter-Based LSM Index Acceleration"> + <i class="none"></i> + Filter-Based LSM Index Acceleration</a> + </li> + <li class="nav-header">API/SDK</li> + + <li> + + <a href="../api.html" title="HTTP API"> + <i class="none"></i> + HTTP API</a> + </li> + </ul> + + + + <hr class="divider" /> + + <div id="poweredBy"> + <div class="clear"></div> + <div class="clear"></div> + <div class="clear"></div> + <a href=".././" title="AsterixDB" class="builtBy"> + <img class="builtBy" alt="AsterixDB" src="../images/asterixlogo.png" /> + </a> + </div> + </div> + </div> + + + <div id="bodyColumn" class="span9" > + + <!-- ! Licensed to the Apache Software Foundation (ASF) under one + ! or more contributor license agreements. See the NOTICE file + ! distributed with this work for additional information + ! regarding copyright ownership. The ASF licenses this file + ! to you under the Apache License, Version 2.0 (the + ! "License"); you may not use this file except in compliance + ! with the License. You may obtain a copy of the License at + ! + ! http://www.apache.org/licenses/LICENSE-2.0 + ! + ! Unless required by applicable law or agreed to in writing, + ! software distributed under the License is distributed on an + ! "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + ! KIND, either express or implied. See the License for the + ! specific language governing permissions and limitations + ! under the License. + ! --><h1>Support for Data Ingestion in AsterixDB</h1> +<div class="section"> +<h2><a name="Table_of_Contents"></a><a name="atoc" id="#toc">Table of Contents</a></h2> + +<ul> + +<li><a href="#Introduction">Introduction</a></li> + +<li><a href="#FeedAdaptors">Feed Adaptors</a></li> + +<li><a href="#FeedPolicies">Feed Policies</a></li> +</ul></div> +<div class="section"> +<h2><a name="Introduction">Introduction</a></h2> +<p>In this document, we describe the support for data ingestion in AsterixDB. Data feeds are a new mechanism for having continuous data arrive into a BDMS from external sources and incrementally populate a persisted dataset and associated indexes. We add a new BDMS architectural component, called a data feed, that makes a Big Data system the caretaker for functionality that used to live outside, and we show how it improves users’ lives and system performance.</p></div> +<div class="section"> +<h2><a name="Feed_Adaptors"></a><a name="FeedAdaptors">Feed Adaptors</a></h2> +<p>The functionality of establishing a connection with a data source and receiving, parsing and translating its data into ADM objects (for storage inside AsterixDB) is contained in a feed adaptor. A feed adaptor is an implementation of an interface and its details are specific to a given data source. An adaptor may optionally be given parameters to configure its runtime behavior. Depending upon the data transfer protocol/APIs offered by the data source, a feed adaptor may operate in a push or a pull mode. Push mode involves just one initial request by the adaptor to the data source for setting up the connection. Once a connection is authorized, the data source “pushes” data to the adaptor without any subsequent requests by the adaptor. In contrast, when operating in a pull mode, the adaptor makes a separate request each time to receive data. AsterixDB currently provides built-in adaptors for several popular data sources such as Twitter, CNN, and RSS feeds. AsterixDB ad ditionally provides a generic socket-based adaptor that can be used to ingest data that is directed at a prescribed socket.</p> +<p>In this tutorial, we shall describe building two example data ingestion pipelines that cover the popular scenario of ingesting data from (a) Twitter and (b) RSS Feed source.</p> +<div class="section"> +<div class="section"> +<h4><a name="Ingesting_Twitter_Stream"></a>Ingesting Twitter Stream</h4> +<p>We shall use the built-in push-based Twitter adaptor. As a pre-requisite, we must define a Tweet using the AsterixDB Data Model (ADM) and the AsterixDB Query Language (AQL). Given below are the type definition in AQL that create a Tweet datatype which is representative of a real tweet as obtained from Twitter.</p> + +<div class="source"> +<div class="source"> +<pre> create dataverse feeds; + use dataverse feeds; + + create type TwitterUser as closed { + screen_name: string, + lang: string, + friends_count: int32, + statuses_count: int32 + }; + + create type Tweet as open { + id: int64, + user: TwitterUser + } + + create dataset Tweets (Tweet) + primary key id; +</pre></div></div> +<p>We also create a dataset that we shall use to persist the tweets in AsterixDB. Next we make use of the <tt>create feed</tt> AQL statement to define our example data feed.</p> +<div class="section"> +<h5><a name="Using_the_push_twitter_feed_adapter"></a>Using the “push_twitter” feed adapter</h5> +<p>The “push_twitter” adaptor requires setting up an application account with Twitter. To retrieve tweets, Twitter requires registering an application with Twitter. Registration involves providing a name and a brief description for the application. Each application has an associated OAuth authentication credential that includes OAuth keys and tokens. Accessing the Twitter API requires providing the following. 1. Consumer Key (API Key) 2. Consumer Secret (API Secret) 3. Access Token 4. Access Token Secret</p> +<p>The “push_twitter” adaptor takes as configuration the above mentioned parameters. End users are required to obtain the above authentication credentials prior to using the “push_twitter” adaptor. For further information on obtaining OAuth keys and tokens and registering an application with Twitter, please visit <a class="externalLink" href="http://apps.twitter.com">http://apps.twitter.com</a></p> +<p>Given below is an example AQL statement that creates a feed called “TwitterFeed” by using the “push_twitter” adaptor.</p> + +<div class="source"> +<div class="source"> +<pre> use dataverse feeds; + + create feed TwitterFeed if not exists using "push_twitter" + (("type-name"="Tweet"), + ("format"="twitter-status"), + ("consumer.key"="************"), + ("consumer.secret"="**************"), + ("access.token"="**********"), + ("access.token.secret"="*************")); +</pre></div></div> +<p>It is required that the above authentication parameters are provided valid values. Note that the <tt>create feed</tt> statement does not initiate the flow of data from Twitter into our AsterixDB instance. Instead, the <tt>create feed</tt> statement only results in registering the feed with AsterixDB. The flow of data along a feed is initiated when it is connected to a target dataset using the connect feed statement (which we shall revisit later).</p></div></div> +<div class="section"> +<h4><a name="Lifecycle_of_a_Feed"></a>Lifecycle of a Feed</h4> +<p>A feed is a logical artifact that is brought to life (i.e., its data flow is initiated) only when it is connected to a dataset using the <tt>connect +feed</tt> AQL statement. Subsequent to a <tt>connect feed</tt> statement, the feed is said to be in the connected state. Multiple feeds can simultaneously be connected to a dataset such that the contents of the dataset represent the union of the connected feeds. In a supported but unlikely scenario, one feed may also be simultaneously connected to different target datasets. Note that connecting a secondary feed does not require the parent feed (or any ancestor feed) to be in the connected state; the order in which feeds are connected to their respective datasets is not important. Furthermore, additional (secondary) feeds can be added to an existing hierarchy and connected to a dataset at any time without impeding/interrupting the flow of data along a connected ancestor feed.</p> + +<div class="source"> +<div class="source"> +<pre> use dataverse feeds; + + connect feed TwitterFeed to dataset Tweets; +</pre></div></div> +<p>The <tt>connect feed</tt> statement above directs AsterixDB to persist the <tt>TwitterFeed</tt> feed in the <tt>Tweets</tt> dataset. If it is required (by the high-level application) to also retain the raw tweets obtained from Twitter, the end user may additionally choose to connect TwitterFeed to a different dataset.</p> +<p>Let the feed run for a minute, then run the following query to see the latest tweets that are stored into the data set.</p> + +<div class="source"> +<div class="source"> +<pre> use dataverse feeds; + + for $i in dataset Tweets limit 10 return $i; +</pre></div></div> +<p>The flow of data from a feed into a dataset can be terminated explicitly by use of the <tt>disconnect feed</tt> statement. Disconnecting a feed from a particular dataset does not interrupt the flow of data from the feed to any other dataset(s), nor does it impact other connected feeds in the lineage.</p> + +<div class="source"> +<div class="source"> +<pre> use dataverse feeds; + + disconnect feed TwitterFeed from dataset Tweets; +</pre></div></div></div> +<div class="section"> +<h4><a name="Ingesting_an_RSS_Feed"></a>Ingesting an RSS Feed</h4> +<p>RSS (Rich Site Summary), originally RDF Site Summary and often called Really Simple Syndication, uses a family of standard web feed formats to publish frequently updated information: blog entries, news headlines, audio, video. An RSS document (called “feed”, “web feed”, or “channel”) includes full or summarized text, and metadata, like publishing date and author’s name. RSS feeds enable publishers to syndicate data automatically.</p> +<div class="section"> +<h5><a name="Using_the_rss_feed_feed_adapter"></a>Using the “rss_feed” feed adapter</h5> +<p>AsterixDB provides a built-in feed adaptor that allows retrieving data given a collection of RSS end point URLs. As observed in the case of ingesting tweets, it is required to model an RSS data item using AQL.</p> + +<div class="source"> +<div class="source"> +<pre> use dataverse feeds; + + create type Rss if not exists as open { + id: string, + title: string, + description: string, + link: string + }; + + create dataset RssDataset (Rss) + primary key id; +</pre></div></div> +<p>Next, we define an RSS feed using our built-in adaptor “rss_feed”.</p> + +<div class="source"> +<div class="source"> +<pre> use dataverse feeds; + + create feed my_feed using + rss_feed ( + ("type-name"="Rss"), + ("format"="rss"), + ("url"="http://rss.cnn.com/rss/edition.rss") + ); +</pre></div></div> +<p>In the above definition, the configuration parameter “url” can be a comma-separated list that reflects a collection of RSS URLs, where each URL corresponds to an RSS endpoint or a RSS feed. The “rss_adaptor” retrieves data from each of the specified RSS URLs (comma separated values) in parallel.</p> +<p>The following statements connect the feed into the <tt>RssDataset</tt>:</p> + +<div class="source"> +<div class="source"> +<pre> use dataverse feeds; + + connect feed my_feed to dataset RssDataset; +</pre></div></div> +<p>The following statements show the latest data from the data set, and disconnect the feed from the data set.</p> + +<div class="source"> +<div class="source"> +<pre> use dataverse feeds; + + for $i in dataset RssDataset limit 10 return $i; + + disconnect feed my_feed from dataset RssDataset; +</pre></div></div> +<p>AsterixDB also allows multiple feeds to be connected to form a cascade network to process data.</p></div></div></div></div> +<div class="section"> +<h2><a name="Policies_for_Feed_Ingestion"></a><a name="FeedPolicies">Policies for Feed Ingestion</a></h2> +<p>Multiple feeds may be concurrently operational on an AsterixDB cluster, each competing for resources (CPU cycles, network bandwidth, disk IO) to maintain pace with their respective data sources. As a data management system, AsterixDB is able to manage a set of concurrent feeds and make dynamic decisions related to the allocation of resources, resolving resource bottlenecks and the handling of failures. Each feed has its own set of constraints, influenced largely by the nature of its data source and the applications that intend to consume and process the ingested data. Consider an application that intends to discover the trending topics on Twitter by analyzing tweets that are being processed. Losing a few tweets may be acceptable. In contrast, when ingesting from a data source that provides a click-stream of ad clicks, losing data would translate to a loss of revenue for an application that tracks revenue by charging advertisers per click.</p> +<p>AsterixDB allows a data feed to have an associated ingestion policy that is expressed as a collection of parameters and associated values. An ingestion policy dictates the runtime behavior of the feed in response to resource bottlenecks and failures. AsterixDB provides a list of policy parameters that help customize the system’s runtime behavior when handling excess objects. AsterixDB provides a set of built-in policies, each constructed by setting appropriate value(s) for the policy parameter(s) from the table below.</p> +<div class="section"> +<div class="section"> +<h4><a name="Policy_Parameters"></a>Policy Parameters</h4> + +<ul> + +<li> +<p><i>excess.records.spill</i>: Set to true if objects that cannot be processed by an operator for lack of resources (referred to as excess objects hereafter) should be persisted to the local disk for deferred processing. (Default: false)</p></li> + +<li> +<p><i>excess.records.discard</i>: Set to true if excess objects should be discarded. (Default: false)</p></li> + +<li> +<p><i>excess.records.throttle</i>: Set to true if rate of arrival of objects is required to be reduced in an adaptive manner to prevent having any excess objects (Default: false)</p></li> + +<li> +<p><i>excess.records.elastic</i>: Set to true if the system should attempt to resolve resource bottlenecks by re-structuring and/or rescheduling the feed ingestion pipeline. (Default: false)</p></li> + +<li> +<p><i>recover.soft.failure</i>: Set to true if the feed must attempt to survive any runtime exception. A false value permits an early termination of a feed in such an event. (Default: true)</p></li> + +<li> +<p><i>recover.soft.failure</i>: Set to true if the feed must attempt to survive a hardware failures (loss of AsterixDB node(s)). A false value permits the early termination of a feed in the event of a hardware failure (Default: false)</p></li> +</ul> +<p>Note that the end user may choose to form a custom policy. For example, it is possible in AsterixDB to create a custom policy that spills excess objects to disk and subsequently resorts to throttling if the spillage crosses a configured threshold. In all cases, the desired ingestion policy is specified as part of the <tt>connect feed</tt> statement or else the “Basic” policy will be chosen as the default. It is worth noting that a feed can be connected to a dataset at any time, which is independent from other related feeds in the hierarchy.</p> + +<div class="source"> +<div class="source"> +<pre> use dataverse feeds; + + connect feed TwitterFeed to dataset Tweets + using policy Basic ; +</pre></div></div></div></div></div> + </div> + </div> + </div> + + <hr/> + + <footer> + <div class="container-fluid"> + <div class="row span12">Copyright © 2017 + <a href="https://www.apache.org/">The Apache Software Foundation</a>. + All Rights Reserved. + + </div> + + <?xml version="1.0" encoding="UTF-8"?> +<div class="row-fluid">Apache AsterixDB, AsterixDB, Apache, the Apache + feather logo, and the Apache AsterixDB project logo are either + registered trademarks or trademarks of The Apache Software + Foundation in the United States and other countries. + All other marks mentioned may be trademarks or registered + trademarks of their respective owners.</div> + + + </div> + </footer> + </body> +</html> http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/AsterixCluster.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/AsterixCluster.png b/docs/0.9.0/images/AsterixCluster.png new file mode 100644 index 0000000..a16ee26 Binary files /dev/null and b/docs/0.9.0/images/AsterixCluster.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/accessories-text-editor.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/accessories-text-editor.png b/docs/0.9.0/images/accessories-text-editor.png new file mode 100644 index 0000000..abc3366 Binary files /dev/null and b/docs/0.9.0/images/accessories-text-editor.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/add.gif ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/add.gif b/docs/0.9.0/images/add.gif new file mode 100644 index 0000000..1cb3dbf Binary files /dev/null and b/docs/0.9.0/images/add.gif differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/apache-maven-project-2.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/apache-maven-project-2.png b/docs/0.9.0/images/apache-maven-project-2.png new file mode 100644 index 0000000..6c096ec Binary files /dev/null and b/docs/0.9.0/images/apache-maven-project-2.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/application-certificate.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/application-certificate.png b/docs/0.9.0/images/application-certificate.png new file mode 100644 index 0000000..cc6aff6 Binary files /dev/null and b/docs/0.9.0/images/application-certificate.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/asf_logo_wide.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/asf_logo_wide.png b/docs/0.9.0/images/asf_logo_wide.png new file mode 100644 index 0000000..56a4369 Binary files /dev/null and b/docs/0.9.0/images/asf_logo_wide.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/asterix_webui.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/asterix_webui.png b/docs/0.9.0/images/asterix_webui.png new file mode 100644 index 0000000..27522c4 Binary files /dev/null and b/docs/0.9.0/images/asterix_webui.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/asterixlogo.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/asterixlogo.png b/docs/0.9.0/images/asterixlogo.png new file mode 100644 index 0000000..45cd64f Binary files /dev/null and b/docs/0.9.0/images/asterixlogo.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/contact-new.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/contact-new.png b/docs/0.9.0/images/contact-new.png new file mode 100644 index 0000000..ebc4316 Binary files /dev/null and b/docs/0.9.0/images/contact-new.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/document-properties.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/document-properties.png b/docs/0.9.0/images/document-properties.png new file mode 100644 index 0000000..34c2409 Binary files /dev/null and b/docs/0.9.0/images/document-properties.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/drive-harddisk.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/drive-harddisk.png b/docs/0.9.0/images/drive-harddisk.png new file mode 100644 index 0000000..d7ce475 Binary files /dev/null and b/docs/0.9.0/images/drive-harddisk.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/egg-logo.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/egg-logo.png b/docs/0.9.0/images/egg-logo.png new file mode 100644 index 0000000..c04e70d Binary files /dev/null and b/docs/0.9.0/images/egg-logo.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/fix.gif ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/fix.gif b/docs/0.9.0/images/fix.gif new file mode 100644 index 0000000..b7eb3dc Binary files /dev/null and b/docs/0.9.0/images/fix.gif differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/hyrax_ts.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/hyrax_ts.png b/docs/0.9.0/images/hyrax_ts.png new file mode 100644 index 0000000..001c788 Binary files /dev/null and b/docs/0.9.0/images/hyrax_ts.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/icon_error_sml.gif ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/icon_error_sml.gif b/docs/0.9.0/images/icon_error_sml.gif new file mode 100644 index 0000000..12e9a01 Binary files /dev/null and b/docs/0.9.0/images/icon_error_sml.gif differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/icon_help_sml.gif ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/icon_help_sml.gif b/docs/0.9.0/images/icon_help_sml.gif new file mode 100644 index 0000000..aaf20e6 Binary files /dev/null and b/docs/0.9.0/images/icon_help_sml.gif differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/icon_info_sml.gif ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/icon_info_sml.gif b/docs/0.9.0/images/icon_info_sml.gif new file mode 100644 index 0000000..b776326 Binary files /dev/null and b/docs/0.9.0/images/icon_info_sml.gif differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/icon_success_sml.gif ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/icon_success_sml.gif b/docs/0.9.0/images/icon_success_sml.gif new file mode 100644 index 0000000..0a19527 Binary files /dev/null and b/docs/0.9.0/images/icon_success_sml.gif differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/icon_warning_sml.gif ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/icon_warning_sml.gif b/docs/0.9.0/images/icon_warning_sml.gif new file mode 100644 index 0000000..ac6ad6a Binary files /dev/null and b/docs/0.9.0/images/icon_warning_sml.gif differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/image-x-generic.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/image-x-generic.png b/docs/0.9.0/images/image-x-generic.png new file mode 100644 index 0000000..ab49efb Binary files /dev/null and b/docs/0.9.0/images/image-x-generic.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/internet-web-browser.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/internet-web-browser.png b/docs/0.9.0/images/internet-web-browser.png new file mode 100644 index 0000000..307d6ac Binary files /dev/null and b/docs/0.9.0/images/internet-web-browser.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/logos/build-by-maven-black.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/logos/build-by-maven-black.png b/docs/0.9.0/images/logos/build-by-maven-black.png new file mode 100644 index 0000000..919fd0f Binary files /dev/null and b/docs/0.9.0/images/logos/build-by-maven-black.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/logos/build-by-maven-white.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/logos/build-by-maven-white.png b/docs/0.9.0/images/logos/build-by-maven-white.png new file mode 100644 index 0000000..7d44c9c Binary files /dev/null and b/docs/0.9.0/images/logos/build-by-maven-white.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/logos/maven-feather.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/logos/maven-feather.png b/docs/0.9.0/images/logos/maven-feather.png new file mode 100644 index 0000000..b5ada83 Binary files /dev/null and b/docs/0.9.0/images/logos/maven-feather.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/network-server.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/network-server.png b/docs/0.9.0/images/network-server.png new file mode 100644 index 0000000..1d12e19 Binary files /dev/null and b/docs/0.9.0/images/network-server.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/package-x-generic.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/package-x-generic.png b/docs/0.9.0/images/package-x-generic.png new file mode 100644 index 0000000..8b7e9e6 Binary files /dev/null and b/docs/0.9.0/images/package-x-generic.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/profiles/pre-release.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/profiles/pre-release.png b/docs/0.9.0/images/profiles/pre-release.png new file mode 100644 index 0000000..d448e85 Binary files /dev/null and b/docs/0.9.0/images/profiles/pre-release.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/profiles/retired.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/profiles/retired.png b/docs/0.9.0/images/profiles/retired.png new file mode 100644 index 0000000..f89f6a2 Binary files /dev/null and b/docs/0.9.0/images/profiles/retired.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/profiles/sandbox.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/profiles/sandbox.png b/docs/0.9.0/images/profiles/sandbox.png new file mode 100644 index 0000000..f88b362 Binary files /dev/null and b/docs/0.9.0/images/profiles/sandbox.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/remove.gif ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/remove.gif b/docs/0.9.0/images/remove.gif new file mode 100644 index 0000000..fc65631 Binary files /dev/null and b/docs/0.9.0/images/remove.gif differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/rss.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/rss.png b/docs/0.9.0/images/rss.png new file mode 100644 index 0000000..a9850ee Binary files /dev/null and b/docs/0.9.0/images/rss.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/running_inst.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/running_inst.png b/docs/0.9.0/images/running_inst.png new file mode 100644 index 0000000..66eb03a Binary files /dev/null and b/docs/0.9.0/images/running_inst.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/update.gif ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/update.gif b/docs/0.9.0/images/update.gif new file mode 100644 index 0000000..b2a6d0b Binary files /dev/null and b/docs/0.9.0/images/update.gif differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/window-new.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/window-new.png b/docs/0.9.0/images/window-new.png new file mode 100644 index 0000000..0e12ef9 Binary files /dev/null and b/docs/0.9.0/images/window-new.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/images/yarn_clust.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/images/yarn_clust.png b/docs/0.9.0/images/yarn_clust.png new file mode 100644 index 0000000..5e386bc Binary files /dev/null and b/docs/0.9.0/images/yarn_clust.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/img/glyphicons-halflings-white.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/img/glyphicons-halflings-white.png b/docs/0.9.0/img/glyphicons-halflings-white.png new file mode 100644 index 0000000..3bf6484 Binary files /dev/null and b/docs/0.9.0/img/glyphicons-halflings-white.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/img/glyphicons-halflings.png ---------------------------------------------------------------------- diff --git a/docs/0.9.0/img/glyphicons-halflings.png b/docs/0.9.0/img/glyphicons-halflings.png new file mode 100644 index 0000000..a996999 Binary files /dev/null and b/docs/0.9.0/img/glyphicons-halflings.png differ http://git-wip-us.apache.org/repos/asf/asterixdb-site/blob/bf2c56b0/docs/0.9.0/index.html ---------------------------------------------------------------------- diff --git a/docs/0.9.0/index.html b/docs/0.9.0/index.html new file mode 100644 index 0000000..ef83927 --- /dev/null +++ b/docs/0.9.0/index.html @@ -0,0 +1,284 @@ +<!DOCTYPE html> +<!-- + | Generated by Apache Maven Doxia at 2017-01-24 + | Rendered using Apache Maven Fluido Skin 1.3.0 +--> +<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en"> + <head> + <meta charset="UTF-8" /> + <meta name="viewport" content="width=device-width, initial-scale=1.0" /> + <meta name="Date-Revision-yyyymmdd" content="20170124" /> + <meta http-equiv="Content-Language" content="en" /> + <title>AsterixDB – AsterixDB</title> + <link rel="stylesheet" href="./css/apache-maven-fluido-1.3.0.min.css" /> + <link rel="stylesheet" href="./css/site.css" /> + <link rel="stylesheet" href="./css/print.css" media="print" /> + + + <script type="text/javascript" src="./js/apache-maven-fluido-1.3.0.min.js"></script> + + + +<script>(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){ + (i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o), + m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m) + })(window,document,'script','//www.google-analytics.com/analytics.js','ga'); + + ga('create', 'UA-41536543-1', 'uci.edu'); + ga('send', 'pageview');</script> + + </head> + <body class="topBarDisabled"> + + + + + <div class="container-fluid"> + <div id="banner"> + <div class="pull-left"> + <a href="./" id="bannerLeft"> + <img src="images/asterixlogo.png" alt="AsterixDB"/> + </a> + </div> + <div class="pull-right"> </div> + <div class="clear"><hr/></div> + </div> + + <div id="breadcrumbs"> + <ul class="breadcrumb"> + + + <li id="publishDate">Last Published: 2017-01-24</li> + + + + <li id="projectVersion" class="pull-right">Version: 0.9.0</li> + + <li class="divider pull-right">|</li> + + <li class="pull-right"> <a href="index.html" title="Documentation Home"> + Documentation Home</a> + </li> + + </ul> + </div> + + + <div class="row-fluid"> + <div id="leftColumn" class="span3"> + <div class="well sidebar-nav"> + + + <ul class="nav nav-list"> + <li class="nav-header">Get Started - Installation</li> + + <li> + + <a href="ncservice.html" title="Option 1: using NCService"> + <i class="none"></i> + Option 1: using NCService</a> + </li> + + <li> + + <a href="install.html" title="Option 2: using Managix"> + <i class="none"></i> + Option 2: using Managix</a> + </li> + + <li> + + <a href="yarn.html" title="Option 3: using YARN"> + <i class="none"></i> + Option 3: using YARN</a> + </li> + <li class="nav-header">AsterixDB Primer</li> + + <li> + + <a href="sqlpp/primer-sqlpp.html" title="Option 1: using SQL++"> + <i class="none"></i> + Option 1: using SQL++</a> + </li> + + <li> + + <a href="aql/primer.html" title="Option 2: using AQL"> + <i class="none"></i> + Option 2: using AQL</a> + </li> + <li class="nav-header">Data Model</li> + + <li> + + <a href="datamodel.html" title="The Asterix Data Model"> + <i class="none"></i> + The Asterix Data Model</a> + </li> + <li class="nav-header">Queries - SQL++</li> + + <li> + + <a href="sqlpp/manual.html" title="The SQL++ Query Language"> + <i class="none"></i> + The SQL++ Query Language</a> + </li> + + <li> + + <a href="sqlpp/builtins.html" title="Builtin Functions"> + <i class="none"></i> + Builtin Functions</a> + </li> + <li class="nav-header">Queries - AQL</li> + + <li> + + <a href="aql/manual.html" title="The Asterix Query Language (AQL)"> + <i class="none"></i> + The Asterix Query Language (AQL)</a> + </li> + + <li> + + <a href="aql/builtins.html" title="Builtin Functions"> + <i class="none"></i> + Builtin Functions</a> + </li> + <li class="nav-header">Advanced Features</li> + + <li> + + <a href="aql/similarity.html" title="Support of Similarity Queries"> + <i class="none"></i> + Support of Similarity Queries</a> + </li> + + <li> + + <a href="aql/fulltext.html" title="Support of Full-text Queries"> + <i class="none"></i> + Support of Full-text Queries</a> + </li> + + <li> + + <a href="aql/externaldata.html" title="Accessing External Data"> + <i class="none"></i> + Accessing External Data</a> + </li> + + <li> + + <a href="feeds/tutorial.html" title="Support for Data Ingestion"> + <i class="none"></i> + Support for Data Ingestion</a> + </li> + + <li> + + <a href="udf.html" title="User Defined Functions"> + <i class="none"></i> + User Defined Functions</a> + </li> + + <li> + + <a href="aql/filters.html" title="Filter-Based LSM Index Acceleration"> + <i class="none"></i> + Filter-Based LSM Index Acceleration</a> + </li> + <li class="nav-header">API/SDK</li> + + <li> + + <a href="api.html" title="HTTP API"> + <i class="none"></i> + HTTP API</a> + </li> + </ul> + + + + <hr class="divider" /> + + <div id="poweredBy"> + <div class="clear"></div> + <div class="clear"></div> + <div class="clear"></div> + <a href="./" title="AsterixDB" class="builtBy"> + <img class="builtBy" alt="AsterixDB" src="images/asterixlogo.png" /> + </a> + </div> + </div> + </div> + + + <div id="bodyColumn" class="span9" > + + <!-- ! Licensed to the Apache Software Foundation (ASF) under one + ! or more contributor license agreements. See the NOTICE file + ! distributed with this work for additional information + ! regarding copyright ownership. The ASF licenses this file + ! to you under the Apache License, Version 2.0 (the + ! "License"); you may not use this file except in compliance + ! with the License. You may obtain a copy of the License at + ! + ! http://www.apache.org/licenses/LICENSE-2.0 + ! + ! Unless required by applicable law or agreed to in writing, + ! software distributed under the License is distributed on an + ! "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + ! KIND, either express or implied. See the License for the + ! specific language governing permissions and limitations + ! under the License. + ! --><h1>AsterixDB</h1> +<p>AsterixDB is a BDMS (Big Data Management System) with a rich feature set that sets it apart from other Big Data platforms. Its feature set makes it well-suited to modern needs such as web data warehousing and social data storage and analysis. AsterixDB has:</p> + +<ul> + +<li>A semistructured NoSQL style data model (ADM) resulting from extending JSON with object database ideas</li> + +<li>Two expressive and declarative query languages (SQL++ and AQL) that support a broad range of queries and analysis over semistructured data</li> + +<li>A parallel runtime query execution engine, Apache Hyracks, that has been scale-tested on up to 1000+ cores and 500+ disks</li> + +<li>Partitioned LSM-based data storage and indexing to support efficient ingestion and management of semistructured data</li> + +<li>Support for query access to externally stored data (e.g., data in HDFS) as well as to data stored natively by AsterixDB</li> + +<li>A rich set of primitive data types, including spatial and temporal data in addition to integer, floating point, and textual data</li> + +<li>Secondary indexing options that include B+ trees, R trees, and inverted keyword (exact and fuzzy) index types</li> + +<li>Support for fuzzy and spatial queries as well as for more traditional parametric queries</li> + +<li>Basic transactional (concurrency and recovery) capabilities akin to those of a NoSQL store</li> +</ul> + </div> + </div> + </div> + + <hr/> + + <footer> + <div class="container-fluid"> + <div class="row span12">Copyright © 2017 + <a href="https://www.apache.org/">The Apache Software Foundation</a>. + All Rights Reserved. + + </div> + + <?xml version="1.0" encoding="UTF-8"?> +<div class="row-fluid">Apache AsterixDB, AsterixDB, Apache, the Apache + feather logo, and the Apache AsterixDB project logo are either + registered trademarks or trademarks of The Apache Software + Foundation in the United States and other countries. + All other marks mentioned may be trademarks or registered + trademarks of their respective owners.</div> + + + </div> + </footer> + </body> +</html>