Added: datafu/site/docs/spark/2.1.0/datafu/spark/SparkDFUtilsBridge.html
URL: 
http://svn.apache.org/viewvc/datafu/site/docs/spark/2.1.0/datafu/spark/SparkDFUtilsBridge.html?rev=1925323&view=auto
==============================================================================
--- datafu/site/docs/spark/2.1.0/datafu/spark/SparkDFUtilsBridge.html (added)
+++ datafu/site/docs/spark/2.1.0/datafu/spark/SparkDFUtilsBridge.html Tue Apr 
29 18:54:44 2025
@@ -0,0 +1,810 @@
+<!DOCTYPE html >
+<html>
+        <head>
+          <meta http-equiv="X-UA-Compatible" content="IE=edge" />
+          <meta name="viewport" content="width=device-width, 
initial-scale=1.0, maximum-scale=1.0, user-scalable=no" />
+          <title>datafu-spark 2.1.0 API  - 
datafu.spark.SparkDFUtilsBridge</title>
+          <meta name="description" content="datafu - spark 2.1.0 API - 
datafu.spark.SparkDFUtilsBridge" />
+          <meta name="keywords" content="datafu spark 2.1.0 API 
datafu.spark.SparkDFUtilsBridge" />
+          <meta http-equiv="content-type" content="text/html; charset=UTF-8" />
+          
+      
+      <link href="../../lib/index.css" media="screen" type="text/css" 
rel="stylesheet" />
+      <link href="../../lib/template.css" media="screen" type="text/css" 
rel="stylesheet" />
+      <link href="../../lib/diagrams.css" media="screen" type="text/css" 
rel="stylesheet" id="diagrams-css" />
+      <script type="text/javascript" src="../../lib/jquery.min.js"></script>
+      <script type="text/javascript" 
src="../../lib/jquery.panzoom.min.js"></script>
+      <script type="text/javascript" 
src="../../lib/jquery.mousewheel.min.js"></script>
+      <script type="text/javascript" src="../../lib/index.js"></script>
+      <script type="text/javascript" src="../../index.js"></script>
+      <script type="text/javascript" src="../../lib/scheduler.js"></script>
+      <script type="text/javascript" src="../../lib/template.js"></script>
+      
+      <script type="text/javascript">
+        /* this variable can be used by the JS to determine the path to the 
root document */
+        var toRoot = '../../';
+      </script>
+    
+        </head>
+        <body>
+      <div id="search">
+        <span id="doc-title">datafu-spark 2.1.0 API<span 
id="doc-version"></span></span>
+        <span class="close-results"><span class="left">&lt;</span> Back</span>
+        <div id="textfilter">
+          <span class="input">
+            <input autocapitalize="none" placeholder="Search" id="index-input" 
type="text" accesskey="/" />
+            <i class="clear material-icons"></i>
+            <i id="search-icon" class="material-icons"></i>
+          </span>
+        </div>
+    </div>
+      <div id="search-results">
+        <div id="search-progress">
+          <div id="progress-fill"></div>
+        </div>
+        <div id="results-content">
+          <div id="entity-results"></div>
+          <div id="member-results"></div>
+        </div>
+      </div>
+      <div id="content-scroll-container" style="-webkit-overflow-scrolling: 
touch;">
+        <div id="content-container" style="-webkit-overflow-scrolling: touch;">
+          <div id="subpackage-spacer">
+            <div id="packages">
+              <h1>Packages</h1>
+              <ul>
+                <li name="_root_.root" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="_root_"></a><a id="root:_root_"></a>
+      <span class="permalink">
+      <a href="../../index.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">package</span>
+      </span>
+      <span class="symbol">
+        <a title="" href="../../index.html"><span class="name">root</span></a>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd><a href="../../index.html" class="extype" 
name="_root_">root</a></dd></dl></div>
+    </li><li name="_root_.datafu" visbl="pub" class="indented1 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="datafu"></a><a id="datafu:datafu"></a>
+      <span class="permalink">
+      <a href="../../datafu/index.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">package</span>
+      </span>
+      <span class="symbol">
+        <a title="" href="../index.html"><span class="name">datafu</span></a>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd><a href="../../index.html" class="extype" 
name="_root_">root</a></dd></dl></div>
+    </li><li name="datafu.spark" visbl="pub" class="indented2 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="spark"></a><a id="spark:spark"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/index.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">package</span>
+      </span>
+      <span class="symbol">
+        <a title="" href="index.html"><span class="name">spark</span></a>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd><a href="../index.html" class="extype" 
name="datafu">datafu</a></dd></dl></div>
+    </li><li class="current-entities indented2">
+                        <span class="separator"></span>
+                        <a class="object" href="Aggregators$.html" title="This 
file contains UDAFs which extend the Aggregator class."></a>
+                        <a href="Aggregators$.html" title="This file contains 
UDAFs which extend the Aggregator class.">Aggregators</a>
+                      </li><li class="current-entities indented2">
+                        <span class="separator"></span>
+                        <a class="class" href="CoreBridgeDirectory.html" 
title="Contains all python files needed by the bridge itself"></a>
+                        <a href="CoreBridgeDirectory.html" title="Contains all 
python files needed by the bridge itself">CoreBridgeDirectory</a>
+                      </li><li class="current-entities indented2">
+                        <span class="separator"></span>
+                        <a class="object" href="DataFrameOps$.html" 
title="implicit class to enable easier usage e.g:"></a>
+                        <a href="DataFrameOps$.html" title="implicit class to 
enable easier usage e.g:">DataFrameOps</a>
+                      </li><li class="current-entities indented2">
+                        <span class="separator"></span>
+                        <a class="object" href="PythonPathsManager$.html" 
title="There are two phases of resolving python files path:"></a>
+                        <a href="PythonPathsManager$.html" title="There are 
two phases of resolving python files path:">PythonPathsManager</a>
+                      </li><li class="current-entities indented2">
+                        <span class="separator"></span>
+                        <a class="class" href="PythonResource.html" 
title="Represents a resource that needs to be added to PYTHONPATH used by 
ScalaPythonBridge."></a>
+                        <a href="PythonResource.html" title="Represents a 
resource that needs to be added to PYTHONPATH used by 
ScalaPythonBridge.">PythonResource</a>
+                      </li><li class="current-entities indented2">
+                        <span class="separator"></span>
+                        <a class="object" href="ResourceCloning$.html" 
title="Utility for extracting resource from a jar and copy it to a temporary 
location"></a>
+                        <a href="ResourceCloning$.html" title="Utility for 
extracting resource from a jar and copy it to a temporary 
location">ResourceCloning</a>
+                      </li><li class="current-entities indented2">
+                        <span class="separator"></span>
+                        <a class="object" href="ScalaPythonBridge$.html" 
title="Do not instantiate this class! Use the companion object instead."></a>
+                        <a href="ScalaPythonBridge$.html" title="Do not 
instantiate this class! Use the companion object instead.">ScalaPythonBridge</a>
+                      </li><li class="current-entities indented2">
+                        <span class="separator"></span>
+                        <a class="class" href="ScalaPythonBridgeRunner.html" 
title="this class lets the user invoke PySpark code from scala example 
usage:"></a>
+                        <a href="ScalaPythonBridgeRunner.html" title="this 
class lets the user invoke PySpark code from scala example 
usage:">ScalaPythonBridgeRunner</a>
+                      </li><li class="current-entities indented2">
+                        <span class="separator"></span>
+                        <a class="object" href="SparkDFUtils$.html" 
title=""></a>
+                        <a href="SparkDFUtils$.html" title="">SparkDFUtils</a>
+                      </li><li class="current-entities indented2">
+                        <span class="separator"></span>
+                        <a class="class" href="" title="class definition so we 
could expose this functionality in PySpark"></a>
+                        <a href="" title="class definition so we could expose 
this functionality in PySpark">SparkDFUtilsBridge</a>
+                      </li>
+              </ul>
+            </div>
+          </div>
+          <div id="content">
+            <body class="class type">
+      <div id="definition">
+        <div class="big-circle class">c</div>
+        <p id="owner"><a href="../index.html" class="extype" 
name="datafu">datafu</a>.<a href="index.html" class="extype" 
name="datafu.spark">spark</a></p>
+        <h1>SparkDFUtilsBridge<span class="permalink">
+      <a href="../../datafu/spark/SparkDFUtilsBridge.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span></h1>
+        <h3><span class="morelinks"></span></h3>
+      </div>
+
+      <h4 id="signature" class="signature">
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">class</span>
+      </span>
+      <span class="symbol">
+        <span class="name">SparkDFUtilsBridge</span><span class="result"> 
extends <span class="extype" name="scala.AnyRef">AnyRef</span></span>
+      </span>
+      </h4>
+
+      
+          <div id="comment" class="fullcommenttop"><div class="comment 
cmt"><p>class definition so we could expose this functionality in PySpark
+</p></div><div class="toggleContainer block">
+          <span class="toggle">
+            Linear Supertypes
+          </span>
+          <div class="superTypes hiddenContent"><span class="extype" 
name="scala.AnyRef">AnyRef</span>, <span class="extype" 
name="scala.Any">Any</span></div>
+        </div></div>
+        
+
+      <div id="mbrsel">
+        <div class="toggle"></div>
+        <div id="memberfilter">
+          <i class="material-icons arrow"></i>
+          <span class="input">
+            <input id="mbrsel-input" placeholder="Filter all members" 
type="text" accesskey="/" />
+          </span>
+          <i class="clear material-icons"></i>
+        </div>
+        <div id="filterby">
+          <div id="order">
+            <span class="filtertype">Ordering</span>
+            <ol>
+              
+              <li class="alpha in"><span>Alphabetic</span></li>
+              <li class="inherit out"><span>By Inheritance</span></li>
+            </ol>
+          </div>
+          <div class="ancestors">
+                  <span class="filtertype">Inherited<br />
+                  </span>
+                  <ol id="linearization">
+                    <li class="in" 
name="datafu.spark.SparkDFUtilsBridge"><span>SparkDFUtilsBridge</span></li><li 
class="in" name="scala.AnyRef"><span>AnyRef</span></li><li class="in" 
name="scala.Any"><span>Any</span></li>
+                  </ol>
+                </div><div class="ancestors">
+              <span class="filtertype"></span>
+              <ol>
+                <li class="hideall out"><span>Hide All</span></li>
+                <li class="showall in"><span>Show All</span></li>
+              </ol>
+            </div>
+          <div id="visbl">
+              <span class="filtertype">Visibility</span>
+              <ol><li class="public in"><span>Public</span></li><li class="all 
out"><span>All</span></li></ol>
+            </div>
+        </div>
+      </div>
+
+      <div id="template">
+        <div id="allMembers">
+        <div id="constructors" class="members">
+              <h3>Instance Constructors</h3>
+              <ol><li name="datafu.spark.SparkDFUtilsBridge#&lt;init&gt;" 
visbl="pub" class="indented0 " data-isabs="false" fullComment="no" 
group="Ungrouped">
+      <a id="&lt;init&gt;():datafu.spark.SparkDFUtilsBridge"></a><a 
id="&lt;init&gt;:SparkDFUtilsBridge"></a>
+      <span class="permalink">
+      <a 
href="../../datafu/spark/SparkDFUtilsBridge.html#&lt;init&gt;():datafu.spark.SparkDFUtilsBridge"
 title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">new</span>
+      </span>
+      <span class="symbol">
+        <span class="name">SparkDFUtilsBridge</span><span 
class="params">()</span>
+      </span>
+      
+      
+    </li></ol>
+            </div>
+
+        
+
+        
+
+        <div class="values members">
+              <h3>Value Members</h3>
+              <ol>
+                <li name="scala.AnyRef#!=" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="!=(x$1:Any):Boolean"></a><a id="!=(Any):Boolean"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/SparkDFUtilsBridge.html#!=(x$1:Any):Boolean" 
title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier">final </span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span title="gt4s: $bang$eq" class="name">!=</span><span 
class="params">(<span name="arg0">arg0: <span class="extype" 
name="scala.Any">Any</span></span>)</span><span class="result">: <span 
class="extype" name="scala.Boolean">Boolean</span></span>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd>AnyRef → Any</dd></dl></div>
+    </li><li name="scala.AnyRef###" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="##():Int"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/SparkDFUtilsBridge.html###():Int" 
title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier">final </span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span title="gt4s: $hash$hash" class="name">##</span><span 
class="params">()</span><span class="result">: <span class="extype" 
name="scala.Int">Int</span></span>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd>AnyRef → Any</dd></dl></div>
+    </li><li name="scala.AnyRef#==" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="==(x$1:Any):Boolean"></a><a id="==(Any):Boolean"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/SparkDFUtilsBridge.html#==(x$1:Any):Boolean" 
title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier">final </span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span title="gt4s: $eq$eq" class="name">==</span><span 
class="params">(<span name="arg0">arg0: <span class="extype" 
name="scala.Any">Any</span></span>)</span><span class="result">: <span 
class="extype" name="scala.Boolean">Boolean</span></span>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd>AnyRef → Any</dd></dl></div>
+    </li><li name="scala.Any#asInstanceOf" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="asInstanceOf[T0]:T0"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/SparkDFUtilsBridge.html#asInstanceOf[T0]:T0" 
title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier">final </span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">asInstanceOf</span><span class="tparams">[<span 
name="T0">T0</span>]</span><span class="result">: <span class="extype" 
name="scala.Any.asInstanceOf.T0">T0</span></span>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd>Any</dd></dl></div>
+    </li><li name="datafu.spark.SparkDFUtilsBridge#broadcastJoinSkewed" 
visbl="pub" class="indented0 " data-isabs="false" fullComment="no" 
group="Ungrouped">
+      <a 
id="broadcastJoinSkewed(notSkewed:org.apache.spark.sql.DataFrame,skewed:org.apache.spark.sql.DataFrame,joinCol:String,numRowsToBroadcast:Int,filterCnt:Long,joinType:String):org.apache.spark.sql.DataFrame"></a><a
 
id="broadcastJoinSkewed(DataFrame,DataFrame,String,Int,Long,String):DataFrame"></a>
+      <span class="permalink">
+      <a 
href="../../datafu/spark/SparkDFUtilsBridge.html#broadcastJoinSkewed(notSkewed:org.apache.spark.sql.DataFrame,skewed:org.apache.spark.sql.DataFrame,joinCol:String,numRowsToBroadcast:Int,filterCnt:Long,joinType:String):org.apache.spark.sql.DataFrame"
 title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">broadcastJoinSkewed</span><span 
class="params">(<span name="notSkewed">notSkewed: <a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>, 
<span name="skewed">skewed: <a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>, 
<span name="joinCol">joinCol: <span class="extype" 
name="scala.Predef.String">String</span></span>, <span 
name="numRowsToBroadcast">numRowsToBroadcast: <span class="extype" 
name="scala.Int">Int</span></span>, <span name="filterCnt">filterCnt: <span 
class="extype" name="scala.Long">Long</span></span>, <span 
name="joinType">joinType: <span class="extype" 
name="scala.Predef.String">String</span></span>)</span><span class="result">: 
<a href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]" class="extmbr" 
name="org.apache.spark.sql.DataFrame">DataFrame</a></span>
+      </span>
+      
+      
+    </li><li name="datafu.spark.SparkDFUtilsBridge#changeSchema" visbl="pub" 
class="indented0 " data-isabs="false" fullComment="no" group="Ungrouped">
+      <a 
id="changeSchema(df:org.apache.spark.sql.DataFrame,newScheme:java.util.List[String]):org.apache.spark.sql.DataFrame"></a><a
 id="changeSchema(DataFrame,List[String]):DataFrame"></a>
+      <span class="permalink">
+      <a 
href="../../datafu/spark/SparkDFUtilsBridge.html#changeSchema(df:org.apache.spark.sql.DataFrame,newScheme:java.util.List[String]):org.apache.spark.sql.DataFrame"
 title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">changeSchema</span><span class="params">(<span 
name="df">df: <a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>, 
<span name="newScheme">newScheme: <span class="extype" 
name="java.util.List">List</span>[<span class="extype" 
name="scala.Predef.String">String</span>]</span>)</span><span class="result">: 
<a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>
+      </span>
+      
+      
+    </li><li name="scala.AnyRef#clone" visbl="prt" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="clone():Object"></a><a id="clone():AnyRef"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/SparkDFUtilsBridge.html#clone():Object" 
title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">clone</span><span class="params">()</span><span 
class="result">: <span class="extype" name="scala.AnyRef">AnyRef</span></span>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> 
<dt>Attributes</dt><dd>protected[<span class="extype" 
name="java.lang">lang</span>] </dd><dt>Definition 
Classes</dt><dd>AnyRef</dd><dt>Annotations</dt><dd>
+                <span class="name">@throws</span><span class="args">(<span>
+      
+      <span class="defval" 
name="classOf[java.lang.CloneNotSupportedException]">...</span>
+    </span>)</span>
+              
+                <span class="name">@native</span><span class="args">()</span>
+              
+        </dd></dl></div>
+    </li><li name="datafu.spark.SparkDFUtilsBridge#dedupByAllExcept" 
visbl="pub" class="indented0 " data-isabs="false" fullComment="no" 
group="Ungrouped">
+      <a 
id="dedupByAllExcept(df:org.apache.spark.sql.DataFrame,ignoredColumn:String):org.apache.spark.sql.DataFrame"></a><a
 id="dedupByAllExcept(DataFrame,String):DataFrame"></a>
+      <span class="permalink">
+      <a 
href="../../datafu/spark/SparkDFUtilsBridge.html#dedupByAllExcept(df:org.apache.spark.sql.DataFrame,ignoredColumn:String):org.apache.spark.sql.DataFrame"
 title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">dedupByAllExcept</span><span class="params">(<span 
name="df">df: <a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>, 
<span name="ignoredColumn">ignoredColumn: <span class="extype" 
name="scala.Predef.String">String</span></span>)</span><span class="result">: 
<a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>
+      </span>
+      
+      
+    </li><li name="datafu.spark.SparkDFUtilsBridge#dedupRandomN" visbl="pub" 
class="indented0 " data-isabs="false" fullComment="no" group="Ungrouped">
+      <a 
id="dedupRandomN(df:org.apache.spark.sql.DataFrame,groupCol:org.apache.spark.sql.Column,maxSize:Int):org.apache.spark.sql.DataFrame"></a><a
 id="dedupRandomN(DataFrame,Column,Int):DataFrame"></a>
+      <span class="permalink">
+      <a 
href="../../datafu/spark/SparkDFUtilsBridge.html#dedupRandomN(df:org.apache.spark.sql.DataFrame,groupCol:org.apache.spark.sql.Column,maxSize:Int):org.apache.spark.sql.DataFrame"
 title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">dedupRandomN</span><span class="params">(<span 
name="df">df: <a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>, 
<span name="groupCol">groupCol: <span class="extype" 
name="org.apache.spark.sql.Column">Column</span></span>, <span 
name="maxSize">maxSize: <span class="extype" 
name="scala.Int">Int</span></span>)</span><span class="result">: <a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>
+      </span>
+      
+      
+    </li><li name="datafu.spark.SparkDFUtilsBridge#dedupTopN" visbl="pub" 
class="indented0 " data-isabs="false" fullComment="no" group="Ungrouped">
+      <a 
id="dedupTopN(df:org.apache.spark.sql.DataFrame,n:Int,groupCol:org.apache.spark.sql.Column,orderCols:java.util.List[org.apache.spark.sql.Column]):org.apache.spark.sql.DataFrame"></a><a
 id="dedupTopN(DataFrame,Int,Column,List[Column]):DataFrame"></a>
+      <span class="permalink">
+      <a 
href="../../datafu/spark/SparkDFUtilsBridge.html#dedupTopN(df:org.apache.spark.sql.DataFrame,n:Int,groupCol:org.apache.spark.sql.Column,orderCols:java.util.List[org.apache.spark.sql.Column]):org.apache.spark.sql.DataFrame"
 title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">dedupTopN</span><span class="params">(<span 
name="df">df: <a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>, 
<span name="n">n: <span class="extype" name="scala.Int">Int</span></span>, 
<span name="groupCol">groupCol: <span class="extype" 
name="org.apache.spark.sql.Column">Column</span></span>, <span 
name="orderCols">orderCols: <span class="extype" 
name="java.util.List">List</span>[<span class="extype" 
name="org.apache.spark.sql.Column">Column</span>]</span>)</span><span 
class="result">: <a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>
+      </span>
+      
+      
+    </li><li name="datafu.spark.SparkDFUtilsBridge#dedupWithCombiner" 
visbl="pub" class="indented0 " data-isabs="false" fullComment="no" 
group="Ungrouped">
+      <a 
id="dedupWithCombiner(df:org.apache.spark.sql.DataFrame,groupCol:java.util.List[org.apache.spark.sql.Column],orderByCol:java.util.List[org.apache.spark.sql.Column],desc:Boolean,columnsFilter:java.util.List[String],columnsFilterKeep:Boolean):org.apache.spark.sql.DataFrame"></a><a
 
id="dedupWithCombiner(DataFrame,List[Column],List[Column],Boolean,List[String],Boolean):DataFrame"></a>
+      <span class="permalink">
+      <a 
href="../../datafu/spark/SparkDFUtilsBridge.html#dedupWithCombiner(df:org.apache.spark.sql.DataFrame,groupCol:java.util.List[org.apache.spark.sql.Column],orderByCol:java.util.List[org.apache.spark.sql.Column],desc:Boolean,columnsFilter:java.util.List[String],columnsFilterKeep:Boolean):org.apache.spark.sql.DataFrame"
 title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">dedupWithCombiner</span><span class="params">(<span 
name="df">df: <a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>, 
<span name="groupCol">groupCol: <span class="extype" 
name="java.util.List">List</span>[<span class="extype" 
name="org.apache.spark.sql.Column">Column</span>]</span>, <span 
name="orderByCol">orderByCol: <span class="extype" 
name="java.util.List">List</span>[<span class="extype" 
name="org.apache.spark.sql.Column">Column</span>]</span>, <span 
name="desc">desc: <span class="extype" 
name="scala.Boolean">Boolean</span></span>, <span 
name="columnsFilter">columnsFilter: <span class="extype" 
name="java.util.List">List</span>[<span class="extype" 
name="scala.Predef.String">String</span>]</span>, <span 
name="columnsFilterKeep">columnsFilterKeep: <span class="extype" 
name="scala.Boolean">Boolean</span></span>)</span><span 
class="result">: <a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>
+      </span>
+      
+      
+    </li><li name="datafu.spark.SparkDFUtilsBridge#dedupWithOrder" visbl="pub" 
class="indented0 " data-isabs="false" fullComment="no" group="Ungrouped">
+      <a 
id="dedupWithOrder(df:org.apache.spark.sql.DataFrame,groupCol:org.apache.spark.sql.Column,orderCols:java.util.List[org.apache.spark.sql.Column]):org.apache.spark.sql.DataFrame"></a><a
 id="dedupWithOrder(DataFrame,Column,List[Column]):DataFrame"></a>
+      <span class="permalink">
+      <a 
href="../../datafu/spark/SparkDFUtilsBridge.html#dedupWithOrder(df:org.apache.spark.sql.DataFrame,groupCol:org.apache.spark.sql.Column,orderCols:java.util.List[org.apache.spark.sql.Column]):org.apache.spark.sql.DataFrame"
 title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">dedupWithOrder</span><span class="params">(<span 
name="df">df: <a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>, 
<span name="groupCol">groupCol: <span class="extype" 
name="org.apache.spark.sql.Column">Column</span></span>, <span 
name="orderCols">orderCols: <span class="extype" 
name="java.util.List">List</span>[<span class="extype" 
name="org.apache.spark.sql.Column">Column</span>]</span>)</span><span 
class="result">: <a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>
+      </span>
+      
+      
+    </li><li name="scala.AnyRef#eq" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="eq(x$1:AnyRef):Boolean"></a><a id="eq(AnyRef):Boolean"></a>
+      <span class="permalink">
+      <a 
href="../../datafu/spark/SparkDFUtilsBridge.html#eq(x$1:AnyRef):Boolean" 
title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier">final </span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">eq</span><span class="params">(<span 
name="arg0">arg0: <span class="extype" 
name="scala.AnyRef">AnyRef</span></span>)</span><span class="result">: <span 
class="extype" name="scala.Boolean">Boolean</span></span>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd>AnyRef</dd></dl></div>
+    </li><li name="scala.AnyRef#equals" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="equals(x$1:Any):Boolean"></a><a id="equals(Any):Boolean"></a>
+      <span class="permalink">
+      <a 
href="../../datafu/spark/SparkDFUtilsBridge.html#equals(x$1:Any):Boolean" 
title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">equals</span><span class="params">(<span 
name="arg0">arg0: <span class="extype" 
name="scala.Any">Any</span></span>)</span><span class="result">: <span 
class="extype" name="scala.Boolean">Boolean</span></span>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd>AnyRef → Any</dd></dl></div>
+    </li><li name="datafu.spark.SparkDFUtilsBridge#explodeArray" visbl="pub" 
class="indented0 " data-isabs="false" fullComment="no" group="Ungrouped">
+      <a 
id="explodeArray(df:org.apache.spark.sql.DataFrame,arrayCol:org.apache.spark.sql.Column,alias:String):org.apache.spark.sql.DataFrame"></a><a
 id="explodeArray(DataFrame,Column,String):DataFrame"></a>
+      <span class="permalink">
+      <a 
href="../../datafu/spark/SparkDFUtilsBridge.html#explodeArray(df:org.apache.spark.sql.DataFrame,arrayCol:org.apache.spark.sql.Column,alias:String):org.apache.spark.sql.DataFrame"
 title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">explodeArray</span><span class="params">(<span 
name="df">df: <a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>, 
<span name="arrayCol">arrayCol: <span class="extype" 
name="org.apache.spark.sql.Column">Column</span></span>, <span 
name="alias">alias: <span class="extype" 
name="scala.Predef.String">String</span></span>)</span><span class="result">: 
<a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>
+      </span>
+      
+      
+    </li><li name="scala.AnyRef#finalize" visbl="prt" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="finalize():Unit"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/SparkDFUtilsBridge.html#finalize():Unit" 
title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">finalize</span><span class="params">()</span><span 
class="result">: <span class="extype" name="scala.Unit">Unit</span></span>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> 
<dt>Attributes</dt><dd>protected[<span class="extype" 
name="java.lang">lang</span>] </dd><dt>Definition 
Classes</dt><dd>AnyRef</dd><dt>Annotations</dt><dd>
+                <span class="name">@throws</span><span class="args">(<span>
+      
+      <span class="symbol">classOf[java.lang.Throwable]</span>
+    </span>)</span>
+              
+        </dd></dl></div>
+    </li><li name="scala.AnyRef#getClass" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="getClass():Class[_]"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/SparkDFUtilsBridge.html#getClass():Class[_]" 
title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier">final </span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">getClass</span><span class="params">()</span><span 
class="result">: <span class="extype" 
name="java.lang.Class">Class</span>[_]</span>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd>AnyRef → Any</dd><dt>Annotations</dt><dd>
+                <span class="name">@native</span><span class="args">()</span>
+              
+        </dd></dl></div>
+    </li><li name="scala.AnyRef#hashCode" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="hashCode():Int"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/SparkDFUtilsBridge.html#hashCode():Int" 
title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">hashCode</span><span class="params">()</span><span 
class="result">: <span class="extype" name="scala.Int">Int</span></span>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd>AnyRef → Any</dd><dt>Annotations</dt><dd>
+                <span class="name">@native</span><span class="args">()</span>
+              
+        </dd></dl></div>
+    </li><li name="scala.Any#isInstanceOf" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="isInstanceOf[T0]:Boolean"></a>
+      <span class="permalink">
+      <a 
href="../../datafu/spark/SparkDFUtilsBridge.html#isInstanceOf[T0]:Boolean" 
title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier">final </span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">isInstanceOf</span><span class="tparams">[<span 
name="T0">T0</span>]</span><span class="result">: <span class="extype" 
name="scala.Boolean">Boolean</span></span>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd>Any</dd></dl></div>
+    </li><li name="datafu.spark.SparkDFUtilsBridge#joinSkewed" visbl="pub" 
class="indented0 " data-isabs="false" fullComment="no" group="Ungrouped">
+      <a 
id="joinSkewed(dfLeft:org.apache.spark.sql.DataFrame,dfRight:org.apache.spark.sql.DataFrame,joinExprs:org.apache.spark.sql.Column,numShards:Int,joinType:String):org.apache.spark.sql.DataFrame"></a><a
 id="joinSkewed(DataFrame,DataFrame,Column,Int,String):DataFrame"></a>
+      <span class="permalink">
+      <a 
href="../../datafu/spark/SparkDFUtilsBridge.html#joinSkewed(dfLeft:org.apache.spark.sql.DataFrame,dfRight:org.apache.spark.sql.DataFrame,joinExprs:org.apache.spark.sql.Column,numShards:Int,joinType:String):org.apache.spark.sql.DataFrame"
 title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">joinSkewed</span><span class="params">(<span 
name="dfLeft">dfLeft: <a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>, 
<span name="dfRight">dfRight: <a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>, 
<span name="joinExprs">joinExprs: <span class="extype" 
name="org.apache.spark.sql.Column">Column</span></span>, <span 
name="numShards">numShards: <span class="extype" 
name="scala.Int">Int</span></span>, <span name="joinType">joinType: <span 
class="extype" name="scala.Predef.String">String</span></span>)</span><span 
class="result">: <a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>
+      </span>
+      
+      
+    </li><li name="datafu.spark.SparkDFUtilsBridge#joinWithRange" visbl="pub" 
class="indented0 " data-isabs="false" fullComment="no" group="Ungrouped">
+      <a 
id="joinWithRange(dfSingle:org.apache.spark.sql.DataFrame,colSingle:String,dfRange:org.apache.spark.sql.DataFrame,colRangeStart:String,colRangeEnd:String,DECREASE_FACTOR:Long):org.apache.spark.sql.DataFrame"></a><a
 
id="joinWithRange(DataFrame,String,DataFrame,String,String,Long):DataFrame"></a>
+      <span class="permalink">
+      <a 
href="../../datafu/spark/SparkDFUtilsBridge.html#joinWithRange(dfSingle:org.apache.spark.sql.DataFrame,colSingle:String,dfRange:org.apache.spark.sql.DataFrame,colRangeStart:String,colRangeEnd:String,DECREASE_FACTOR:Long):org.apache.spark.sql.DataFrame"
 title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">joinWithRange</span><span class="params">(<span 
name="dfSingle">dfSingle: <a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>, 
<span name="colSingle">colSingle: <span class="extype" 
name="scala.Predef.String">String</span></span>, <span name="dfRange">dfRange: 
<a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>, 
<span name="colRangeStart">colRangeStart: <span class="extype" 
name="scala.Predef.String">String</span></span>, <span 
name="colRangeEnd">colRangeEnd: <span class="extype" 
name="scala.Predef.String">String</span></span>, <span 
name="DECREASE_FACTOR">DECREASE_FACTOR: <span class="extype" 
name="scala.Long">Long</span></span>)</span><span class="result">: <a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>
+      </span>
+      
+      
+    </li><li name="datafu.spark.SparkDFUtilsBridge#joinWithRangeAndDedup" 
visbl="pub" class="indented0 " data-isabs="false" fullComment="no" 
group="Ungrouped">
+      <a 
id="joinWithRangeAndDedup(dfSingle:org.apache.spark.sql.DataFrame,colSingle:String,dfRange:org.apache.spark.sql.DataFrame,colRangeStart:String,colRangeEnd:String,DECREASE_FACTOR:Long,dedupSmallRange:Boolean):org.apache.spark.sql.DataFrame"></a><a
 
id="joinWithRangeAndDedup(DataFrame,String,DataFrame,String,String,Long,Boolean):DataFrame"></a>
+      <span class="permalink">
+      <a 
href="../../datafu/spark/SparkDFUtilsBridge.html#joinWithRangeAndDedup(dfSingle:org.apache.spark.sql.DataFrame,colSingle:String,dfRange:org.apache.spark.sql.DataFrame,colRangeStart:String,colRangeEnd:String,DECREASE_FACTOR:Long,dedupSmallRange:Boolean):org.apache.spark.sql.DataFrame"
 title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">joinWithRangeAndDedup</span><span 
class="params">(<span name="dfSingle">dfSingle: <a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>, 
<span name="colSingle">colSingle: <span class="extype" 
name="scala.Predef.String">String</span></span>, <span name="dfRange">dfRange: 
<a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>, 
<span name="colRangeStart">colRangeStart: <span class="extype" 
name="scala.Predef.String">String</span></span>, <span 
name="colRangeEnd">colRangeEnd: <span class="extype" 
name="scala.Predef.String">String</span></span>, <span 
name="DECREASE_FACTOR">DECREASE_FACTOR: <span class="extype" 
name="scala.Long">Long</span></span>, <span 
name="dedupSmallRange">dedupSmallRange: <span 
class="extype" name="scala.Boolean">Boolean</span></span>)</span><span 
class="result">: <a 
href="../../org/apache/spark/sql/index.html#DataFrame=org.apache.spark.sql.Dataset[org.apache.spark.sql.Row]"
 class="extmbr" name="org.apache.spark.sql.DataFrame">DataFrame</a></span>
+      </span>
+      
+      
+    </li><li name="scala.AnyRef#ne" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="ne(x$1:AnyRef):Boolean"></a><a id="ne(AnyRef):Boolean"></a>
+      <span class="permalink">
+      <a 
href="../../datafu/spark/SparkDFUtilsBridge.html#ne(x$1:AnyRef):Boolean" 
title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier">final </span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">ne</span><span class="params">(<span 
name="arg0">arg0: <span class="extype" 
name="scala.AnyRef">AnyRef</span></span>)</span><span class="result">: <span 
class="extype" name="scala.Boolean">Boolean</span></span>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd>AnyRef</dd></dl></div>
+    </li><li name="scala.AnyRef#notify" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="notify():Unit"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/SparkDFUtilsBridge.html#notify():Unit" 
title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier">final </span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">notify</span><span class="params">()</span><span 
class="result">: <span class="extype" name="scala.Unit">Unit</span></span>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd>AnyRef</dd><dt>Annotations</dt><dd>
+                <span class="name">@native</span><span class="args">()</span>
+              
+        </dd></dl></div>
+    </li><li name="scala.AnyRef#notifyAll" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="notifyAll():Unit"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/SparkDFUtilsBridge.html#notifyAll():Unit" 
title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier">final </span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">notifyAll</span><span class="params">()</span><span 
class="result">: <span class="extype" name="scala.Unit">Unit</span></span>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd>AnyRef</dd><dt>Annotations</dt><dd>
+                <span class="name">@native</span><span class="args">()</span>
+              
+        </dd></dl></div>
+    </li><li name="scala.AnyRef#synchronized" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="synchronized[T0](x$1:=&gt;T0):T0"></a><a 
id="synchronized[T0](⇒T0):T0"></a>
+      <span class="permalink">
+      <a 
href="../../datafu/spark/SparkDFUtilsBridge.html#synchronized[T0](x$1:=&gt;T0):T0"
 title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier">final </span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">synchronized</span><span class="tparams">[<span 
name="T0">T0</span>]</span><span class="params">(<span name="arg0">arg0: ⇒ 
<span class="extype" 
name="java.lang.AnyRef.synchronized.T0">T0</span></span>)</span><span 
class="result">: <span class="extype" 
name="java.lang.AnyRef.synchronized.T0">T0</span></span>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd>AnyRef</dd></dl></div>
+    </li><li name="scala.AnyRef#toString" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="toString():String"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/SparkDFUtilsBridge.html#toString():String" 
title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">toString</span><span class="params">()</span><span 
class="result">: <span class="extype" 
name="java.lang.String">String</span></span>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd>AnyRef → Any</dd></dl></div>
+    </li><li name="scala.AnyRef#wait" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="wait():Unit"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/SparkDFUtilsBridge.html#wait():Unit" 
title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier">final </span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">wait</span><span class="params">()</span><span 
class="result">: <span class="extype" name="scala.Unit">Unit</span></span>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd>AnyRef</dd><dt>Annotations</dt><dd>
+                <span class="name">@throws</span><span class="args">(<span>
+      
+      <span class="defval" 
name="classOf[java.lang.InterruptedException]">...</span>
+    </span>)</span>
+              
+        </dd></dl></div>
+    </li><li name="scala.AnyRef#wait" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="wait(x$1:Long,x$2:Int):Unit"></a><a id="wait(Long,Int):Unit"></a>
+      <span class="permalink">
+      <a 
href="../../datafu/spark/SparkDFUtilsBridge.html#wait(x$1:Long,x$2:Int):Unit" 
title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier">final </span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">wait</span><span class="params">(<span 
name="arg0">arg0: <span class="extype" name="scala.Long">Long</span></span>, 
<span name="arg1">arg1: <span class="extype" 
name="scala.Int">Int</span></span>)</span><span class="result">: <span 
class="extype" name="scala.Unit">Unit</span></span>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd>AnyRef</dd><dt>Annotations</dt><dd>
+                <span class="name">@throws</span><span class="args">(<span>
+      
+      <span class="defval" 
name="classOf[java.lang.InterruptedException]">...</span>
+    </span>)</span>
+              
+        </dd></dl></div>
+    </li><li name="scala.AnyRef#wait" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="wait(x$1:Long):Unit"></a><a id="wait(Long):Unit"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/SparkDFUtilsBridge.html#wait(x$1:Long):Unit" 
title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier">final </span>
+        <span class="kind">def</span>
+      </span>
+      <span class="symbol">
+        <span class="name">wait</span><span class="params">(<span 
name="arg0">arg0: <span class="extype" 
name="scala.Long">Long</span></span>)</span><span class="result">: <span 
class="extype" name="scala.Unit">Unit</span></span>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd>AnyRef</dd><dt>Annotations</dt><dd>
+                <span class="name">@throws</span><span class="args">(<span>
+      
+      <span class="defval" 
name="classOf[java.lang.InterruptedException]">...</span>
+    </span>)</span>
+              
+                <span class="name">@native</span><span class="args">()</span>
+              
+        </dd></dl></div>
+    </li>
+              </ol>
+            </div>
+
+        
+
+        
+        </div>
+
+        <div id="inheritedMembers">
+        <div class="parent" name="scala.AnyRef">
+              <h3>Inherited from <span class="extype" 
name="scala.AnyRef">AnyRef</span></h3>
+            </div><div class="parent" name="scala.Any">
+              <h3>Inherited from <span class="extype" 
name="scala.Any">Any</span></h3>
+            </div>
+        
+        </div>
+
+        <div id="groupedMembers">
+        <div class="group" name="Ungrouped">
+              <h3>Ungrouped</h3>
+              
+            </div>
+        </div>
+
+      </div>
+
+      <div id="tooltip"></div>
+
+      <div id="footer">  </div>
+    </body>
+          </div>
+        </div>
+      </div>
+    </body>
+      </html>

Added: datafu/site/docs/spark/2.1.0/datafu/spark/index.html
URL: 
http://svn.apache.org/viewvc/datafu/site/docs/spark/2.1.0/datafu/spark/index.html?rev=1925323&view=auto
==============================================================================
--- datafu/site/docs/spark/2.1.0/datafu/spark/index.html (added)
+++ datafu/site/docs/spark/2.1.0/datafu/spark/index.html Tue Apr 29 18:54:44 
2025
@@ -0,0 +1,433 @@
+<!DOCTYPE html >
+<html>
+        <head>
+          <meta http-equiv="X-UA-Compatible" content="IE=edge" />
+          <meta name="viewport" content="width=device-width, 
initial-scale=1.0, maximum-scale=1.0, user-scalable=no" />
+          <title>datafu-spark 2.1.0 API  - datafu.spark</title>
+          <meta name="description" content="datafu - spark 2.1.0 API - 
datafu.spark" />
+          <meta name="keywords" content="datafu spark 2.1.0 API datafu.spark" 
/>
+          <meta http-equiv="content-type" content="text/html; charset=UTF-8" />
+          
+      
+      <link href="../../lib/index.css" media="screen" type="text/css" 
rel="stylesheet" />
+      <link href="../../lib/template.css" media="screen" type="text/css" 
rel="stylesheet" />
+      <link href="../../lib/diagrams.css" media="screen" type="text/css" 
rel="stylesheet" id="diagrams-css" />
+      <script type="text/javascript" src="../../lib/jquery.min.js"></script>
+      <script type="text/javascript" 
src="../../lib/jquery.panzoom.min.js"></script>
+      <script type="text/javascript" 
src="../../lib/jquery.mousewheel.min.js"></script>
+      <script type="text/javascript" src="../../lib/index.js"></script>
+      <script type="text/javascript" src="../../index.js"></script>
+      <script type="text/javascript" src="../../lib/scheduler.js"></script>
+      <script type="text/javascript" src="../../lib/template.js"></script>
+      
+      <script type="text/javascript">
+        /* this variable can be used by the JS to determine the path to the 
root document */
+        var toRoot = '../../';
+      </script>
+    
+        </head>
+        <body>
+      <div id="search">
+        <span id="doc-title">datafu-spark 2.1.0 API<span 
id="doc-version"></span></span>
+        <span class="close-results"><span class="left">&lt;</span> Back</span>
+        <div id="textfilter">
+          <span class="input">
+            <input autocapitalize="none" placeholder="Search" id="index-input" 
type="text" accesskey="/" />
+            <i class="clear material-icons"></i>
+            <i id="search-icon" class="material-icons"></i>
+          </span>
+        </div>
+    </div>
+      <div id="search-results">
+        <div id="search-progress">
+          <div id="progress-fill"></div>
+        </div>
+        <div id="results-content">
+          <div id="entity-results"></div>
+          <div id="member-results"></div>
+        </div>
+      </div>
+      <div id="content-scroll-container" style="-webkit-overflow-scrolling: 
touch;">
+        <div id="content-container" style="-webkit-overflow-scrolling: touch;">
+          <div id="subpackage-spacer">
+            <div id="packages">
+              <h1>Packages</h1>
+              <ul>
+                <li name="_root_.root" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="_root_"></a><a id="root:_root_"></a>
+      <span class="permalink">
+      <a href="../../index.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">package</span>
+      </span>
+      <span class="symbol">
+        <a title="" href="../../index.html"><span class="name">root</span></a>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd><a href="../../index.html" class="extype" 
name="_root_">root</a></dd></dl></div>
+    </li><li name="_root_.datafu" visbl="pub" class="indented1 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="datafu"></a><a id="datafu:datafu"></a>
+      <span class="permalink">
+      <a href="../../datafu/index.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">package</span>
+      </span>
+      <span class="symbol">
+        <a title="" href="../index.html"><span class="name">datafu</span></a>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd><a href="../../index.html" class="extype" 
name="_root_">root</a></dd></dl></div>
+    </li><li name="datafu.spark" visbl="pub" class="indented2 current" 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="spark"></a><a id="spark:spark"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/index.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">package</span>
+      </span>
+      <span class="symbol">
+        <span class="name">spark</span>
+      </span>
+      
+      <div class="fullcomment"><dl class="attributes block"> <dt>Definition 
Classes</dt><dd><a href="../index.html" class="extype" 
name="datafu">datafu</a></dd></dl></div>
+    </li><li class="current-entities indented2">
+                        <span class="separator"></span>
+                        <a class="object" href="Aggregators$.html" title="This 
file contains UDAFs which extend the Aggregator class."></a>
+                        <a href="Aggregators$.html" title="This file contains 
UDAFs which extend the Aggregator class.">Aggregators</a>
+                      </li><li class="current-entities indented2">
+                        <span class="separator"></span>
+                        <a class="class" href="CoreBridgeDirectory.html" 
title="Contains all python files needed by the bridge itself"></a>
+                        <a href="CoreBridgeDirectory.html" title="Contains all 
python files needed by the bridge itself">CoreBridgeDirectory</a>
+                      </li><li class="current-entities indented2">
+                        <span class="separator"></span>
+                        <a class="object" href="DataFrameOps$.html" 
title="implicit class to enable easier usage e.g:"></a>
+                        <a href="DataFrameOps$.html" title="implicit class to 
enable easier usage e.g:">DataFrameOps</a>
+                      </li><li class="current-entities indented2">
+                        <span class="separator"></span>
+                        <a class="object" href="PythonPathsManager$.html" 
title="There are two phases of resolving python files path:"></a>
+                        <a href="PythonPathsManager$.html" title="There are 
two phases of resolving python files path:">PythonPathsManager</a>
+                      </li><li class="current-entities indented2">
+                        <span class="separator"></span>
+                        <a class="class" href="PythonResource.html" 
title="Represents a resource that needs to be added to PYTHONPATH used by 
ScalaPythonBridge."></a>
+                        <a href="PythonResource.html" title="Represents a 
resource that needs to be added to PYTHONPATH used by 
ScalaPythonBridge.">PythonResource</a>
+                      </li><li class="current-entities indented2">
+                        <span class="separator"></span>
+                        <a class="object" href="ResourceCloning$.html" 
title="Utility for extracting resource from a jar and copy it to a temporary 
location"></a>
+                        <a href="ResourceCloning$.html" title="Utility for 
extracting resource from a jar and copy it to a temporary 
location">ResourceCloning</a>
+                      </li><li class="current-entities indented2">
+                        <span class="separator"></span>
+                        <a class="object" href="ScalaPythonBridge$.html" 
title="Do not instantiate this class! Use the companion object instead."></a>
+                        <a href="ScalaPythonBridge$.html" title="Do not 
instantiate this class! Use the companion object instead.">ScalaPythonBridge</a>
+                      </li><li class="current-entities indented2">
+                        <span class="separator"></span>
+                        <a class="class" href="ScalaPythonBridgeRunner.html" 
title="this class let's the user invoke PySpark code from scala example 
usage:"></a>
+                        <a href="ScalaPythonBridgeRunner.html" title="this 
class lets the user invoke PySpark code from scala example 
usage:">ScalaPythonBridgeRunner</a>
+                      </li><li class="current-entities indented2">
+                        <span class="separator"></span>
+                        <a class="object" href="SparkDFUtils$.html" 
title=""></a>
+                        <a href="SparkDFUtils$.html" title="">SparkDFUtils</a>
+                      </li><li class="current-entities indented2">
+                        <span class="separator"></span>
+                        <a class="class" href="SparkDFUtilsBridge.html" 
title="class definition so we could expose this functionality in PySpark"></a>
+                        <a href="SparkDFUtilsBridge.html" title="class 
definition so we could expose this functionality in 
PySpark">SparkDFUtilsBridge</a>
+                      </li>
+              </ul>
+            </div>
+          </div>
+          <div id="content">
+            <body class="package value">
+      <div id="definition">
+        <div class="big-circle package">p</div>
+        <p id="owner"><a href="../index.html" class="extype" 
name="datafu">datafu</a></p>
+        <h1>spark<span class="permalink">
+      <a href="../../datafu/spark/index.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span></h1>
+        
+      </div>
+
+      <h4 id="signature" class="signature">
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">package</span>
+      </span>
+      <span class="symbol">
+        <span class="name">spark</span>
+      </span>
+      </h4>
+
+      
+          <div id="comment" class="fullcommenttop"></div>
+        
+
+      <div id="mbrsel">
+        <div class="toggle"></div>
+        <div id="memberfilter">
+          <i class="material-icons arrow"></i>
+          <span class="input">
+            <input id="mbrsel-input" placeholder="Filter all members" 
type="text" accesskey="/" />
+          </span>
+          <i class="clear material-icons"></i>
+        </div>
+        <div id="filterby">
+          <div id="order">
+            <span class="filtertype">Ordering</span>
+            <ol>
+              
+              <li class="alpha in"><span>Alphabetic</span></li>
+              
+            </ol>
+          </div>
+          
+          <div id="visbl">
+              <span class="filtertype">Visibility</span>
+              <ol><li class="public in"><span>Public</span></li><li class="all 
out"><span>All</span></li></ol>
+            </div>
+        </div>
+      </div>
+
+      <div id="template">
+        <div id="allMembers">
+        
+
+        <div id="types" class="types members">
+              <h3>Type Members</h3>
+              <ol><li name="datafu.spark.CoreBridgeDirectory" visbl="pub" 
class="indented0 " data-isabs="false" fullComment="no" group="Ungrouped">
+      <a id="CoreBridgeDirectoryextendsPythonResource"></a><a 
id="CoreBridgeDirectory:CoreBridgeDirectory"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/CoreBridgeDirectory.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">class</span>
+      </span>
+      <span class="symbol">
+        <a title="Contains all python files needed by the bridge itself" 
href="CoreBridgeDirectory.html"><span 
class="name">CoreBridgeDirectory</span></a><span class="result"> extends <a 
href="PythonResource.html" class="extype" 
name="datafu.spark.PythonResource">PythonResource</a></span>
+      </span>
+      
+      <p class="shortcomment cmt">Contains all python files needed by the 
bridge itself
+</p>
+    </li><li name="datafu.spark.PythonResource" visbl="pub" class="indented0 " 
data-isabs="true" fullComment="yes" group="Ungrouped">
+      <a id="PythonResourceextendsAnyRef"></a><a 
id="PythonResource:PythonResource"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/PythonResource.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier">abstract </span>
+        <span class="kind">class</span>
+      </span>
+      <span class="symbol">
+        <a title="Represents a resource that needs to be added to PYTHONPATH 
used by ScalaPythonBridge." href="PythonResource.html"><span 
class="name">PythonResource</span></a><span class="result"> extends <span 
class="extype" name="scala.AnyRef">AnyRef</span></span>
+      </span>
+      
+      <p class="shortcomment cmt">Represents a resource that needs to be added 
to PYTHONPATH used by ScalaPythonBridge.</p><div class="fullcomment"><div 
class="comment cmt"><p>Represents a resource that needs to be added to 
PYTHONPATH used by ScalaPythonBridge.</p><p>To ensure your python resources 
(modules, files, etc.) are properly added to the bridge,
+do the following:
+1)  Put all the resource under some root directory with a unique name x, and 
make sure path/to/x
+is visible to the class loader (usually just use src/main/resources/x).
+2)  Extend this class like this:
+class MyResource extends PythonResource(&quot;x&quot;)
+This assumes x is under src/main/resources/x
+3)  (since we use ServiceLoader) Add a file to your jar/project:
+META-INF/services/datafu.spark.PythonResource
+with a single line containing the full name (including package) of 
MyResource.</p><p>This process involves scanning the entire jar and copying 
files from the jar to some temporary
+location, so if your jar is really big consider putting the resources in a 
smaller jar.
+</p></div></div>
+    </li><li name="datafu.spark.ScalaPythonBridgeRunner" visbl="pub" 
class="indented0 " data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="ScalaPythonBridgeRunnerextendsProductwithSerializable"></a><a 
id="ScalaPythonBridgeRunner:ScalaPythonBridgeRunner"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/ScalaPythonBridgeRunner.html" 
title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">case class</span>
+      </span>
+      <span class="symbol">
+        <a title="this class lets the user invoke PySpark code from scala 
example usage:" href="ScalaPythonBridgeRunner.html"><span 
class="name">ScalaPythonBridgeRunner</span></a><span class="params">(<span 
name="extraPath">extraPath: <span class="extype" 
name="scala.Predef.String">String</span> = <span 
class="symbol">&quot;&quot;</span></span>)</span><span class="result"> extends 
<span class="extype" name="scala.Product">Product</span> with <span 
class="extype" name="scala.Serializable">Serializable</span></span>
+      </span>
+      
+      <p class="shortcomment cmt">this class lets the user invoke PySpark 
code from scala
+example usage:</p><div class="fullcomment"><div class="comment cmt"><p>this 
class lets the user invoke PySpark code from scala
+example usage:</p><p>val runner = ScalaPythonBridgeRunner()
+runner.runPythonFile(&quot;my_package/my_pyspark_logic.py&quot;)</p></div></div>
+    </li><li name="datafu.spark.SparkDFUtilsBridge" visbl="pub" 
class="indented0 " data-isabs="false" fullComment="no" group="Ungrouped">
+      <a id="SparkDFUtilsBridgeextendsAnyRef"></a><a 
id="SparkDFUtilsBridge:SparkDFUtilsBridge"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/SparkDFUtilsBridge.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">class</span>
+      </span>
+      <span class="symbol">
+        <a title="class definition so we could expose this functionality in 
PySpark" href="SparkDFUtilsBridge.html"><span 
class="name">SparkDFUtilsBridge</span></a><span class="result"> extends <span 
class="extype" name="scala.AnyRef">AnyRef</span></span>
+      </span>
+      
+      <p class="shortcomment cmt">class definition so we could expose this 
functionality in PySpark
+</p>
+    </li></ol>
+            </div>
+
+        
+
+        <div class="values members">
+              <h3>Value Members</h3>
+              <ol>
+                <li name="datafu.spark.Aggregators" visbl="pub" 
class="indented0 " data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="Aggregators"></a><a id="Aggregators:Aggregators"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/Aggregators$.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">object</span>
+      </span>
+      <span class="symbol">
+        <a title="This file contains UDAFs which extend the Aggregator class." 
href="Aggregators$.html"><span class="name">Aggregators</span></a>
+      </span>
+      
+      <p class="shortcomment cmt">This file contains UDAFs which extend the 
Aggregator class.</p><div class="fullcomment"><div class="comment cmt"><p>This 
file contains UDAFs which extend the Aggregator class.
+They were migrated from previous implementations which used 
UserDefinedAggregateFunction</p><p>The implementations below reuse the 
intermediate buffer in the merge function
+( see 
https://stackoverflow.com/questions/77713959/can-you-reuse-one-of-the-buffers-in-the-merge-method-of-spark-aggregators
 )
+</p></div></div>
+    </li><li name="datafu.spark.DataFrameOps" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="DataFrameOps"></a><a id="DataFrameOps:DataFrameOps"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/DataFrameOps$.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">object</span>
+      </span>
+      <span class="symbol">
+        <a title="implicit class to enable easier usage e.g:" 
href="DataFrameOps$.html"><span class="name">DataFrameOps</span></a>
+      </span>
+      
+      <p class="shortcomment cmt">implicit class to enable easier usage 
e.g:</p><div class="fullcomment"><div class="comment cmt"><p>implicit class to 
enable easier usage e.g:</p><p>df.dedup(..)</p><p>instead 
of:</p><p>SparkDFUtils.dedup(...)</p></div></div>
+    </li><li name="datafu.spark.PythonPathsManager" visbl="pub" 
class="indented0 " data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="PythonPathsManager"></a><a 
id="PythonPathsManager:PythonPathsManager"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/PythonPathsManager$.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">object</span>
+      </span>
+      <span class="symbol">
+        <a title="There are two phases of resolving python files path:" 
href="PythonPathsManager$.html"><span class="name">PythonPathsManager</span></a>
+      </span>
+      
+      <p class="shortcomment cmt">There are two phases of resolving python 
files path:</p><div class="fullcomment"><div class="comment cmt"><p>There are 
two phases of resolving python files path:</p><p>1) When launching spark:
+  the files need to be added to spark.executorEnv.PYTHONPATH</p><p>2) When 
executing python file via bridge:
+  the files need to be added to the process PYTHONPATH.
+  This is different than the previous phase because
+  this python process is spawned by datafu-spark, not by spark, and always on 
the driver.
+</p></div></div>
+    </li><li name="datafu.spark.ResourceCloning" visbl="pub" class="indented0 
" data-isabs="false" fullComment="no" group="Ungrouped">
+      <a id="ResourceCloning"></a><a id="ResourceCloning:ResourceCloning"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/ResourceCloning$.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">object</span>
+      </span>
+      <span class="symbol">
+        <a title="Utility for extracting resource from a jar and copy it to a 
temporary location" href="ResourceCloning$.html"><span 
class="name">ResourceCloning</span></a>
+      </span>
+      
+      <p class="shortcomment cmt">Utility for extracting a resource from a jar 
and copying it to a temporary location
+</p>
+    </li><li name="datafu.spark.ScalaPythonBridge" visbl="pub" 
class="indented0 " data-isabs="false" fullComment="yes" group="Ungrouped">
+      <a id="ScalaPythonBridge"></a><a 
id="ScalaPythonBridge:ScalaPythonBridge"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/ScalaPythonBridge$.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">object</span>
+      </span>
+      <span class="symbol">
+        <a title="Do not instantiate this class! Use the companion object 
instead." href="ScalaPythonBridge$.html"><span 
class="name">ScalaPythonBridge</span></a>
+      </span>
+      
+      <p class="shortcomment cmt">Do not instantiate this class! Use the 
companion object instead.</p><div class="fullcomment"><div class="comment 
cmt"><p>Do not instantiate this class! Use the companion object instead.
+This class should only be used by python
+</p></div></div>
+    </li><li name="datafu.spark.SparkDFUtils" visbl="pub" class="indented0 " 
data-isabs="false" fullComment="no" group="Ungrouped">
+      <a id="SparkDFUtils"></a><a id="SparkDFUtils:SparkDFUtils"></a>
+      <span class="permalink">
+      <a href="../../datafu/spark/SparkDFUtils$.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">object</span>
+      </span>
+      <span class="symbol">
+        <a title="" href="SparkDFUtils$.html"><span 
class="name">SparkDFUtils</span></a>
+      </span>
+      
+      
+    </li>
+              </ol>
+            </div>
+
+        
+
+        
+        </div>
+
+        <div id="inheritedMembers">
+        
+        
+        </div>
+
+        <div id="groupedMembers">
+        <div class="group" name="Ungrouped">
+              <h3>Ungrouped</h3>
+              
+            </div>
+        </div>
+
+      </div>
+
+      <div id="tooltip"></div>
+
+      <div id="footer">  </div>
+    </body>
+          </div>
+        </div>
+      </div>
+    </body>
+      </html>

Added: datafu/site/docs/spark/2.1.0/index.html
URL: 
http://svn.apache.org/viewvc/datafu/site/docs/spark/2.1.0/index.html?rev=1925323&view=auto
==============================================================================
--- datafu/site/docs/spark/2.1.0/index.html (added)
+++ datafu/site/docs/spark/2.1.0/index.html Tue Apr 29 18:54:44 2025
@@ -0,0 +1,174 @@
+<!DOCTYPE html >
+<html>
+        <head>
+          <meta http-equiv="X-UA-Compatible" content="IE=edge" />
+          <meta name="viewport" content="width=device-width, 
initial-scale=1.0, maximum-scale=1.0, user-scalable=no" />
+          <title>datafu-spark 2.1.0 API </title>
+          <meta name="description" content="datafu - spark 2.1.0 API " />
+          <meta name="keywords" content="datafu spark 2.1.0 API " />
+          <meta http-equiv="content-type" content="text/html; charset=UTF-8" />
+          
+      
+      <link href="lib/index.css" media="screen" type="text/css" 
rel="stylesheet" />
+      <link href="lib/template.css" media="screen" type="text/css" 
rel="stylesheet" />
+      <link href="lib/diagrams.css" media="screen" type="text/css" 
rel="stylesheet" id="diagrams-css" />
+      <script type="text/javascript" src="lib/jquery.min.js"></script>
+      <script type="text/javascript" src="lib/jquery.panzoom.min.js"></script>
+      <script type="text/javascript" 
src="lib/jquery.mousewheel.min.js"></script>
+      <script type="text/javascript" src="lib/index.js"></script>
+      <script type="text/javascript" src="index.js"></script>
+      <script type="text/javascript" src="lib/scheduler.js"></script>
+      <script type="text/javascript" src="lib/template.js"></script>
+      
+      <script type="text/javascript">
+        /* this variable can be used by the JS to determine the path to the 
root document */
+        var toRoot = '';
+      </script>
+    
+        </head>
+        <body>
+      <div id="search">
+        <span id="doc-title">datafu-spark 2.1.0 API<span 
id="doc-version"></span></span>
+        <span class="close-results"><span class="left">&lt;</span> Back</span>
+        <div id="textfilter">
+          <span class="input">
+            <input autocapitalize="none" placeholder="Search" id="index-input" 
type="text" accesskey="/" />
+            <i class="clear material-icons"></i>
+            <i id="search-icon" class="material-icons"></i>
+          </span>
+        </div>
+    </div>
+      <div id="search-results">
+        <div id="search-progress">
+          <div id="progress-fill"></div>
+        </div>
+        <div id="results-content">
+          <div id="entity-results"></div>
+          <div id="member-results"></div>
+        </div>
+      </div>
+      <div id="content-scroll-container" style="-webkit-overflow-scrolling: 
touch;">
+        <div id="content-container" style="-webkit-overflow-scrolling: touch;">
+          <div id="subpackage-spacer">
+            <div id="packages">
+              <h1>Packages</h1>
+              <ul>
+                <li name="_root_.root" visbl="pub" class="indented0 current" 
data-isabs="false" fullComment="no" group="Ungrouped">
+      <a id="_root_"></a><a id="root:_root_"></a>
+      <span class="permalink">
+      <a href="index.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">package</span>
+      </span>
+      <span class="symbol">
+        <span class="name">root</span>
+      </span>
+      
+      
+    </li><li name="_root_.datafu" visbl="pub" class="indented1 " 
data-isabs="false" fullComment="no" group="Ungrouped">
+      <a id="datafu"></a><a id="datafu:datafu"></a>
+      <span class="permalink">
+      <a href="datafu/index.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">package</span>
+      </span>
+      <span class="symbol">
+        <a title="" href="datafu/index.html"><span 
class="name">datafu</span></a>
+      </span>
+      
+      
+    </li><li name="_root_.org" visbl="pub" class="indented1 " 
data-isabs="false" fullComment="no" group="Ungrouped">
+      <a id="org"></a><a id="org:org"></a>
+      <span class="permalink">
+      <a href="org/index.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span>
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">package</span>
+      </span>
+      <span class="symbol">
+        <a title="" href="org/index.html"><span class="name">org</span></a>
+      </span>
+      
+      
+    </li>
+              </ul>
+            </div>
+          </div>
+          <div id="content">
+            <body class="package value">
+      <div id="definition">
+        <div class="big-circle package">p</div>
+        
+        <h1>root package<span class="permalink">
+      <a href="index.html" title="Permalink">
+        <i class="material-icons"></i>
+      </a>
+    </span></h1>
+        
+      </div>
+
+      <h4 id="signature" class="signature">
+      <span class="modifier_kind">
+        <span class="modifier"></span>
+        <span class="kind">package</span>
+      </span>
+      <span class="symbol">
+        <span class="name">root</span>
+      </span>
+      </h4>
+
+      
+          <div id="comment" class="fullcommenttop"></div>
+        
+
+      
+
+      <div id="template">
+        <div id="allMembers">
+        
+
+        
+
+        
+
+        
+
+        
+
+        
+        </div>
+
+        <div id="inheritedMembers">
+        
+        
+        </div>
+
+        <div id="groupedMembers">
+        <div class="group" name="Ungrouped">
+              <h3>Ungrouped</h3>
+              
+            </div>
+        </div>
+
+      </div>
+
+      <div id="tooltip"></div>
+
+      <div id="footer">  </div>
+    </body>
+          </div>
+        </div>
+      </div>
+    </body>
+      </html>

Added: datafu/site/docs/spark/2.1.0/index.js
URL: 
http://svn.apache.org/viewvc/datafu/site/docs/spark/2.1.0/index.js?rev=1925323&view=auto
==============================================================================
--- datafu/site/docs/spark/2.1.0/index.js (added)
+++ datafu/site/docs/spark/2.1.0/index.js Tue Apr 29 18:54:44 2025
@@ -0,0 +1 @@

[... 3 lines stripped ...]
Added: datafu/site/docs/spark/2.1.0/lib/MaterialIcons-Regular.eot
URL: 
http://svn.apache.org/viewvc/datafu/site/docs/spark/2.1.0/lib/MaterialIcons-Regular.eot?rev=1925323&view=auto
==============================================================================
Binary file - no diff available.

Propchange: datafu/site/docs/spark/2.1.0/lib/MaterialIcons-Regular.eot
------------------------------------------------------------------------------
    svn:mime-type = application/octet-stream

Added: datafu/site/docs/spark/2.1.0/lib/MaterialIcons-Regular.ttf
URL: 
http://svn.apache.org/viewvc/datafu/site/docs/spark/2.1.0/lib/MaterialIcons-Regular.ttf?rev=1925323&view=auto
==============================================================================
Binary file - no diff available.

Propchange: datafu/site/docs/spark/2.1.0/lib/MaterialIcons-Regular.ttf
------------------------------------------------------------------------------
    svn:mime-type = application/octet-stream

Added: datafu/site/docs/spark/2.1.0/lib/MaterialIcons-Regular.woff
URL: 
http://svn.apache.org/viewvc/datafu/site/docs/spark/2.1.0/lib/MaterialIcons-Regular.woff?rev=1925323&view=auto
==============================================================================
Binary file - no diff available.

Propchange: datafu/site/docs/spark/2.1.0/lib/MaterialIcons-Regular.woff
------------------------------------------------------------------------------
    svn:mime-type = application/octet-stream

Added: datafu/site/docs/spark/2.1.0/lib/abstract_type.svg
URL: 
http://svn.apache.org/viewvc/datafu/site/docs/spark/2.1.0/lib/abstract_type.svg?rev=1925323&view=auto
==============================================================================
--- datafu/site/docs/spark/2.1.0/lib/abstract_type.svg (added)
+++ datafu/site/docs/spark/2.1.0/lib/abstract_type.svg Tue Apr 29 18:54:44 2025
@@ -0,0 +1,54 @@
+<svg xmlns="http://www.w3.org/2000/svg" 
xmlns:xlink="http://www.w3.org/1999/xlink" width="72px" height="72px" 
viewBox="0 0 72 72" version="1.1">
+  <defs>
+    <filter x="-50%" y="-50%" width="200%" height="200%" 
filterUnits="objectBoundingBox" id="filter-1">
+      <feOffset dx="0" dy="4" in="SourceAlpha" result="shadowOffsetOuter1"/>
+      <feGaussianBlur stdDeviation="2" in="shadowOffsetOuter1" 
result="shadowBlurOuter1"/>
+      <feColorMatrix values="0 0 0 0 0   0 0 0 0 0   0 0 0 0 0  0 0 0 0.14 0" 
in="shadowBlurOuter1" type="matrix" result="shadowMatrixOuter1"/>
+      <feMerge>
+        <feMergeNode in="shadowMatrixOuter1"/>
+        <feMergeNode in="SourceGraphic"/>
+      </feMerge>
+    </filter>
+    <circle id="path-2" cx="32" cy="32" r="32"/>
+    <filter x="-50%" y="-50%" width="200%" height="200%" 
filterUnits="objectBoundingBox" id="filter-4">
+      <feOffset dx="0" dy="4" in="SourceAlpha" result="shadowOffsetOuter1"/>
+      <feGaussianBlur stdDeviation="2" in="shadowOffsetOuter1" 
result="shadowBlurOuter1"/>
+      <feColorMatrix values="0 0 0 0 0   0 0 0 0 0   0 0 0 0 0  0 0 0 0.14 0" 
in="shadowBlurOuter1" type="matrix" result="shadowMatrixOuter1"/>
+      <feOffset dx="0" dy="1" in="SourceAlpha" result="shadowOffsetInner1"/>
+      <feGaussianBlur stdDeviation="0" in="shadowOffsetInner1" 
result="shadowBlurInner1"/>
+      <feComposite in="shadowBlurInner1" in2="SourceAlpha" 
operator="arithmetic" k2="-1" k3="1" result="shadowInnerInner1"/>
+      <feColorMatrix values="0 0 0 0 1   0 0 0 0 1   0 0 0 0 1  0 0 0 0.14 0" 
in="shadowInnerInner1" type="matrix" result="shadowMatrixInner1"/>
+      <feOffset dx="0" dy="-1" in="SourceAlpha" result="shadowOffsetInner2"/>
+      <feGaussianBlur stdDeviation="0" in="shadowOffsetInner2" 
result="shadowBlurInner2"/>
+      <feComposite in="shadowBlurInner2" in2="SourceAlpha" 
operator="arithmetic" k2="-1" k3="1" result="shadowInnerInner2"/>
+      <feColorMatrix values="0 0 0 0 0   0 0 0 0 0   0 0 0 0 0  0 0 0 0.14 0" 
in="shadowInnerInner2" type="matrix" result="shadowMatrixInner2"/>
+      <feMerge>
+        <feMergeNode in="shadowMatrixOuter1"/>
+        <feMergeNode in="SourceGraphic"/>
+        <feMergeNode in="shadowMatrixInner1"/>
+        <feMergeNode in="shadowMatrixInner2"/>
+      </feMerge>
+    </filter>
+    <path id="path-5" d="M32 61C49.673112 61 64 48.0162577 64 32 64 15.9837423 
49.673112 3 32 3 14.326888 3 0 15.9837423 0 32 0 48.0162577 14.326888 61 32 
61Z"/>
+  </defs>
+  <g id="Page-1" stroke="none" stroke-width="1" fill="none" 
fill-rule="evenodd">
+    <g id="Artboard-1" transform="translate(-298.000000, -91.000000)">
+      <g id="BG" transform="translate(302.000000, 91.000000)">
+        <g id="Icon">
+          <mask id="mask-3" fill="white">
+            <use xlink:href="#path-2"/>
+          </mask>
+          <use id="Mask" fill="#6C7A89" filter="url(#filter-1)" 
xlink:href="#path-2"/>
+          <mask id="mask-6" fill="white">
+            <use xlink:href="#path-5"/>
+          </mask>
+          <text id="a" mask="url(#mask-6)" font-family="Open Sans, Helvetica 
Neue, Sans-serif" font-size="40" font-weight="normal" fill="#FFFFFF">
+            <tspan x="21" y="43">
+              a
+            </tspan>
+          </text>
+        </g>
+      </g>
+    </g>
+  </g>
+</svg>



Reply via email to