http://git-wip-us.apache.org/repos/asf/spark-website/blob/52917ac4/site/docs/2.4.0/api/R/columnfunctions.html ---------------------------------------------------------------------- diff --git a/site/docs/2.4.0/api/R/columnfunctions.html b/site/docs/2.4.0/api/R/columnfunctions.html new file mode 100644 index 0000000..6c05dfd --- /dev/null +++ b/site/docs/2.4.0/api/R/columnfunctions.html @@ -0,0 +1,55 @@ +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"><html xmlns="http://www.w3.org/1999/xhtml"><head><title>R: A set of operations working with SparkDataFrame columns</title> +<meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> +<link rel="stylesheet" type="text/css" href="R.css" /> +</head><body> + +<table width="100%" summary="page for asc {SparkR}"><tr><td>asc {SparkR}</td><td style="text-align: right;">R Documentation</td></tr></table> + +<h2>A set of operations working with SparkDataFrame columns</h2> + +<h3>Description</h3> + +<p>A set of operations working with SparkDataFrame columns +</p> + + +<h3>Usage</h3> + +<pre> +asc(x) + +contains(x, ...) + +desc(x) + +getField(x, ...) + +getItem(x, ...) + +isNaN(x) + +isNull(x) + +isNotNull(x) + +like(x, ...) + +rlike(x, ...) +</pre> + + +<h3>Arguments</h3> + +<table summary="R argblock"> +<tr valign="top"><td><code>x</code></td> +<td> +<p>a Column object.</p> +</td></tr> +<tr valign="top"><td><code>...</code></td> +<td> +<p>additional argument(s).</p> +</td></tr> +</table> + +<hr /><div style="text-align: center;">[Package <em>SparkR</em> version 2.4.0 <a href="00Index.html">Index</a>]</div> +</body></html>
http://git-wip-us.apache.org/repos/asf/spark-website/blob/52917ac4/site/docs/2.4.0/api/R/columns.html ---------------------------------------------------------------------- diff --git a/site/docs/2.4.0/api/R/columns.html b/site/docs/2.4.0/api/R/columns.html new file mode 100644 index 0000000..35a8660 --- /dev/null +++ b/site/docs/2.4.0/api/R/columns.html @@ -0,0 +1,145 @@ +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"><html xmlns="http://www.w3.org/1999/xhtml"><head><title>R: Column Names of SparkDataFrame</title> +<meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> +<link rel="stylesheet" type="text/css" href="R.css" /> + +<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/styles/github.min.css"> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/highlight.min.js"></script> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/languages/r.min.js"></script> +<script>hljs.initHighlightingOnLoad();</script> +</head><body> + +<table width="100%" summary="page for colnames {SparkR}"><tr><td>colnames {SparkR}</td><td style="text-align: right;">R Documentation</td></tr></table> + +<h2>Column Names of SparkDataFrame</h2> + +<h3>Description</h3> + +<p>Return a vector of column names. 
+</p> + + +<h3>Usage</h3> + +<pre> +colnames(x, do.NULL = TRUE, prefix = "col") + +colnames(x) <- value + +columns(x) + +## S4 method for signature 'SparkDataFrame' +columns(x) + +## S4 method for signature 'SparkDataFrame' +names(x) + +## S4 replacement method for signature 'SparkDataFrame' +names(x) <- value + +## S4 method for signature 'SparkDataFrame' +colnames(x) + +## S4 replacement method for signature 'SparkDataFrame' +colnames(x) <- value +</pre> + + +<h3>Arguments</h3> + +<table summary="R argblock"> +<tr valign="top"><td><code>x</code></td> +<td> +<p>a SparkDataFrame.</p> +</td></tr> +<tr valign="top"><td><code>do.NULL</code></td> +<td> +<p>currently not used.</p> +</td></tr> +<tr valign="top"><td><code>prefix</code></td> +<td> +<p>currently not used.</p> +</td></tr> +<tr valign="top"><td><code>value</code></td> +<td> +<p>a character vector. Must have the same length as the number +of columns to be renamed.</p> +</td></tr> +</table> + + +<h3>Note</h3> + +<p>columns since 1.4.0 +</p> +<p>names since 1.5.0 +</p> +<p>names<- since 1.5.0 +</p> +<p>colnames since 1.6.0 +</p> +<p>colnames<- since 1.6.0 +</p> + + +<h3>See Also</h3> + +<p>Other SparkDataFrame functions: <code><a href="SparkDataFrame.html">SparkDataFrame-class</a></code>, +<code><a href="summarize.html">agg</a></code>, <code><a href="alias.html">alias</a></code>, +<code><a href="arrange.html">arrange</a></code>, <code><a href="as.data.frame.html">as.data.frame</a></code>, +<code><a href="attach.html">attach,SparkDataFrame-method</a></code>, +<code><a href="broadcast.html">broadcast</a></code>, <code><a href="cache.html">cache</a></code>, +<code><a href="checkpoint.html">checkpoint</a></code>, <code><a href="coalesce.html">coalesce</a></code>, +<code><a href="collect.html">collect</a></code>, <code><a href="coltypes.html">coltypes</a></code>, +<code><a href="createOrReplaceTempView.html">createOrReplaceTempView</a></code>, +<code><a href="crossJoin.html">crossJoin</a></code>, <code><a 
href="cube.html">cube</a></code>, +<code><a href="dapplyCollect.html">dapplyCollect</a></code>, <code><a href="dapply.html">dapply</a></code>, +<code><a href="describe.html">describe</a></code>, <code><a href="dim.html">dim</a></code>, +<code><a href="distinct.html">distinct</a></code>, <code><a href="dropDuplicates.html">dropDuplicates</a></code>, +<code><a href="nafunctions.html">dropna</a></code>, <code><a href="drop.html">drop</a></code>, +<code><a href="dtypes.html">dtypes</a></code>, <code><a href="exceptAll.html">exceptAll</a></code>, +<code><a href="except.html">except</a></code>, <code><a href="explain.html">explain</a></code>, +<code><a href="filter.html">filter</a></code>, <code><a href="first.html">first</a></code>, +<code><a href="gapplyCollect.html">gapplyCollect</a></code>, <code><a href="gapply.html">gapply</a></code>, +<code><a href="getNumPartitions.html">getNumPartitions</a></code>, <code><a href="groupBy.html">group_by</a></code>, +<code><a href="head.html">head</a></code>, <code><a href="hint.html">hint</a></code>, +<code><a href="histogram.html">histogram</a></code>, <code><a href="insertInto.html">insertInto</a></code>, +<code><a href="intersectAll.html">intersectAll</a></code>, <code><a href="intersect.html">intersect</a></code>, +<code><a href="isLocal.html">isLocal</a></code>, <code><a href="isStreaming.html">isStreaming</a></code>, +<code><a href="join.html">join</a></code>, <code><a href="limit.html">limit</a></code>, +<code><a href="localCheckpoint.html">localCheckpoint</a></code>, <code><a href="merge.html">merge</a></code>, +<code><a href="mutate.html">mutate</a></code>, <code><a href="ncol.html">ncol</a></code>, +<code><a href="nrow.html">nrow</a></code>, <code><a href="persist.html">persist</a></code>, +<code><a href="printSchema.html">printSchema</a></code>, <code><a href="randomSplit.html">randomSplit</a></code>, +<code><a href="rbind.html">rbind</a></code>, <code><a href="rename.html">rename</a></code>, +<code><a 
href="repartitionByRange.html">repartitionByRange</a></code>, +<code><a href="repartition.html">repartition</a></code>, <code><a href="rollup.html">rollup</a></code>, +<code><a href="sample.html">sample</a></code>, <code><a href="saveAsTable.html">saveAsTable</a></code>, +<code><a href="schema.html">schema</a></code>, <code><a href="selectExpr.html">selectExpr</a></code>, +<code><a href="select.html">select</a></code>, <code><a href="showDF.html">showDF</a></code>, +<code><a href="show.html">show</a></code>, <code><a href="storageLevel.html">storageLevel</a></code>, +<code><a href="str.html">str</a></code>, <code><a href="subset.html">subset</a></code>, +<code><a href="summary.html">summary</a></code>, <code><a href="take.html">take</a></code>, +<code><a href="toJSON.html">toJSON</a></code>, <code><a href="unionByName.html">unionByName</a></code>, +<code><a href="union.html">union</a></code>, <code><a href="unpersist.html">unpersist</a></code>, +<code><a href="withColumn.html">withColumn</a></code>, <code><a href="withWatermark.html">withWatermark</a></code>, +<code><a href="with.html">with</a></code>, <code><a href="write.df.html">write.df</a></code>, +<code><a href="write.jdbc.html">write.jdbc</a></code>, <code><a href="write.json.html">write.json</a></code>, +<code><a href="write.orc.html">write.orc</a></code>, <code><a href="write.parquet.html">write.parquet</a></code>, +<code><a href="write.stream.html">write.stream</a></code>, <code><a href="write.text.html">write.text</a></code> +</p> + + +<h3>Examples</h3> + +<pre><code class="r">## Not run: +##D sparkR.session() +##D path <- "path/to/file.json" +##D df <- read.json(path) +##D columns(df) +##D colnames(df) +## End(Not run) +</code></pre> + + +<hr /><div style="text-align: center;">[Package <em>SparkR</em> version 2.4.0 <a href="00Index.html">Index</a>]</div> +</body></html> http://git-wip-us.apache.org/repos/asf/spark-website/blob/52917ac4/site/docs/2.4.0/api/R/corr.html 
---------------------------------------------------------------------- diff --git a/site/docs/2.4.0/api/R/corr.html b/site/docs/2.4.0/api/R/corr.html new file mode 100644 index 0000000..798e543 --- /dev/null +++ b/site/docs/2.4.0/api/R/corr.html @@ -0,0 +1,110 @@ +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"><html xmlns="http://www.w3.org/1999/xhtml"><head><title>R: corr</title> +<meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> +<link rel="stylesheet" type="text/css" href="R.css" /> + +<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/styles/github.min.css"> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/highlight.min.js"></script> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/languages/r.min.js"></script> +<script>hljs.initHighlightingOnLoad();</script> +</head><body> + +<table width="100%" summary="page for corr {SparkR}"><tr><td>corr {SparkR}</td><td style="text-align: right;">R Documentation</td></tr></table> + +<h2>corr</h2> + +<h3>Description</h3> + +<p>Computes the Pearson Correlation Coefficient for two Columns. +</p> + + +<h3>Usage</h3> + +<pre> +corr(x, ...) + +## S4 method for signature 'Column' +corr(x, col2) + +## S4 method for signature 'SparkDataFrame' +corr(x, colName1, colName2, + method = "pearson") +</pre> + + +<h3>Arguments</h3> + +<table summary="R argblock"> +<tr valign="top"><td><code>x</code></td> +<td> +<p>a Column or a SparkDataFrame.</p> +</td></tr> +<tr valign="top"><td><code>...</code></td> +<td> +<p>additional argument(s). If <code>x</code> is a Column, a Column +should be provided. 
If <code>x</code> is a SparkDataFrame, two column names should +be provided.</p> +</td></tr> +<tr valign="top"><td><code>col2</code></td> +<td> +<p>a (second) Column.</p> +</td></tr> +<tr valign="top"><td><code>colName1</code></td> +<td> +<p>the name of the first column</p> +</td></tr> +<tr valign="top"><td><code>colName2</code></td> +<td> +<p>the name of the second column</p> +</td></tr> +<tr valign="top"><td><code>method</code></td> +<td> +<p>Optional. A character specifying the method for calculating the correlation. +only "pearson" is allowed now.</p> +</td></tr> +</table> + + +<h3>Value</h3> + +<p>The Pearson Correlation Coefficient as a Double. +</p> + + +<h3>Note</h3> + +<p>corr since 1.6.0 +</p> +<p>corr since 1.6.0 +</p> + + +<h3>See Also</h3> + +<p>Other aggregate functions: <code><a href="avg.html">avg</a></code>, +<code><a href="column_aggregate_functions.html">column_aggregate_functions</a></code>, +<code><a href="count.html">count</a></code>, <code><a href="cov.html">cov</a></code>, +<code><a href="first.html">first</a></code>, <code><a href="last.html">last</a></code> +</p> +<p>Other stat functions: <code><a href="approxQuantile.html">approxQuantile</a></code>, +<code><a href="cov.html">cov</a></code>, <code><a href="crosstab.html">crosstab</a></code>, +<code><a href="freqItems.html">freqItems</a></code>, <code><a href="sampleBy.html">sampleBy</a></code> +</p> + + +<h3>Examples</h3> + +<pre><code class="r">## Not run: +##D df <- createDataFrame(cbind(model = rownames(mtcars), mtcars)) +##D head(select(df, corr(df$mpg, df$hp))) +## End(Not run) + +## Not run: +##D corr(df, "mpg", "hp") +##D corr(df, "mpg", "hp", method = "pearson") +## End(Not run) +</code></pre> + + +<hr /><div style="text-align: center;">[Package <em>SparkR</em> version 2.4.0 <a href="00Index.html">Index</a>]</div> +</body></html> http://git-wip-us.apache.org/repos/asf/spark-website/blob/52917ac4/site/docs/2.4.0/api/R/count.html 
---------------------------------------------------------------------- diff --git a/site/docs/2.4.0/api/R/count.html b/site/docs/2.4.0/api/R/count.html new file mode 100644 index 0000000..c35965b --- /dev/null +++ b/site/docs/2.4.0/api/R/count.html @@ -0,0 +1,89 @@ +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"><html xmlns="http://www.w3.org/1999/xhtml"><head><title>R: Count</title> +<meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> +<link rel="stylesheet" type="text/css" href="R.css" /> + +<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/styles/github.min.css"> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/highlight.min.js"></script> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/languages/r.min.js"></script> +<script>hljs.initHighlightingOnLoad();</script> +</head><body> + +<table width="100%" summary="page for count {SparkR}"><tr><td>count {SparkR}</td><td style="text-align: right;">R Documentation</td></tr></table> + +<h2>Count</h2> + +<h3>Description</h3> + +<p>Count the number of rows for each group when we have <code>GroupedData</code> input. +The resulting SparkDataFrame will also contain the grouping columns. +</p> +<p>This can be used as a column aggregate function with <code>Column</code> as input, +and returns the number of items in a group. +</p> + + +<h3>Usage</h3> + +<pre> +count(x) + +n(x) + +## S4 method for signature 'GroupedData' +count(x) + +## S4 method for signature 'Column' +count(x) + +## S4 method for signature 'Column' +n(x) +</pre> + + +<h3>Arguments</h3> + +<table summary="R argblock"> +<tr valign="top"><td><code>x</code></td> +<td> +<p>a GroupedData or Column.</p> +</td></tr> +</table> + + +<h3>Value</h3> + +<p>A SparkDataFrame. 
+</p> + + +<h3>Note</h3> + +<p>count since 1.4.0 +</p> +<p>count since 1.4.0 +</p> +<p>n since 1.4.0 +</p> + + +<h3>See Also</h3> + +<p>Other aggregate functions: <code><a href="avg.html">avg</a></code>, +<code><a href="column_aggregate_functions.html">column_aggregate_functions</a></code>, +<code><a href="corr.html">corr</a></code>, <code><a href="cov.html">cov</a></code>, +<code><a href="first.html">first</a></code>, <code><a href="last.html">last</a></code> +</p> + + +<h3>Examples</h3> + +<pre><code class="r">## Not run: +##D count(groupBy(df, "name")) +## End(Not run) +## Not run: count(df$c) +## Not run: n(df$c) +</code></pre> + + +<hr /><div style="text-align: center;">[Package <em>SparkR</em> version 2.4.0 <a href="00Index.html">Index</a>]</div> +</body></html> http://git-wip-us.apache.org/repos/asf/spark-website/blob/52917ac4/site/docs/2.4.0/api/R/cov.html ---------------------------------------------------------------------- diff --git a/site/docs/2.4.0/api/R/cov.html b/site/docs/2.4.0/api/R/cov.html new file mode 100644 index 0000000..1207736 --- /dev/null +++ b/site/docs/2.4.0/api/R/cov.html @@ -0,0 +1,137 @@ +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"><html xmlns="http://www.w3.org/1999/xhtml"><head><title>R: cov</title> +<meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> +<link rel="stylesheet" type="text/css" href="R.css" /> + +<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/styles/github.min.css"> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/highlight.min.js"></script> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/languages/r.min.js"></script> +<script>hljs.initHighlightingOnLoad();</script> +</head><body> + +<table width="100%" summary="page for cov {SparkR}"><tr><td>cov {SparkR}</td><td style="text-align: right;">R Documentation</td></tr></table> + +<h2>cov</h2> + 
+<h3>Description</h3> + +<p>Compute the covariance between two expressions. +</p> + + +<h3>Usage</h3> + +<pre> +cov(x, ...) + +covar_samp(col1, col2) + +covar_pop(col1, col2) + +## S4 method for signature 'characterOrColumn' +cov(x, col2) + +## S4 method for signature 'characterOrColumn,characterOrColumn' +covar_samp(col1, col2) + +## S4 method for signature 'characterOrColumn,characterOrColumn' +covar_pop(col1, col2) + +## S4 method for signature 'SparkDataFrame' +cov(x, colName1, colName2) +</pre> + + +<h3>Arguments</h3> + +<table summary="R argblock"> +<tr valign="top"><td><code>x</code></td> +<td> +<p>a Column or a SparkDataFrame.</p> +</td></tr> +<tr valign="top"><td><code>...</code></td> +<td> +<p>additional argument(s). If <code>x</code> is a Column, a Column +should be provided. If <code>x</code> is a SparkDataFrame, two column names should +be provided.</p> +</td></tr> +<tr valign="top"><td><code>col1</code></td> +<td> +<p>the first Column.</p> +</td></tr> +<tr valign="top"><td><code>col2</code></td> +<td> +<p>the second Column.</p> +</td></tr> +<tr valign="top"><td><code>colName1</code></td> +<td> +<p>the name of the first column</p> +</td></tr> +<tr valign="top"><td><code>colName2</code></td> +<td> +<p>the name of the second column</p> +</td></tr> +</table> + + +<h3>Details</h3> + +<p><code>cov</code>: Compute the sample covariance between two expressions. +</p> +<p><code>covar_samp</code>: Alias for <code>cov</code>. +</p> +<p><code>covar_pop</code>: Computes the population covariance between two expressions. +</p> +<p><code>cov</code>: When applied to SparkDataFrame, this calculates the sample covariance of two +numerical columns of <em>one</em> SparkDataFrame. +</p> + + +<h3>Value</h3> + +<p>The covariance of the two columns. 
+</p> + + +<h3>Note</h3> + +<p>cov since 1.6.0 +</p> +<p>covar_samp since 2.0.0 +</p> +<p>covar_pop since 2.0.0 +</p> +<p>cov since 1.6.0 +</p> + + +<h3>See Also</h3> + +<p>Other aggregate functions: <code><a href="avg.html">avg</a></code>, +<code><a href="column_aggregate_functions.html">column_aggregate_functions</a></code>, +<code><a href="corr.html">corr</a></code>, <code><a href="count.html">count</a></code>, +<code><a href="first.html">first</a></code>, <code><a href="last.html">last</a></code> +</p> +<p>Other stat functions: <code><a href="approxQuantile.html">approxQuantile</a></code>, +<code><a href="corr.html">corr</a></code>, <code><a href="crosstab.html">crosstab</a></code>, +<code><a href="freqItems.html">freqItems</a></code>, <code><a href="sampleBy.html">sampleBy</a></code> +</p> + + +<h3>Examples</h3> + +<pre><code class="r">## Not run: +##D df <- createDataFrame(cbind(model = rownames(mtcars), mtcars)) +##D head(select(df, cov(df$mpg, df$hp), cov("mpg", "hp"), +##D covar_samp(df$mpg, df$hp), covar_samp("mpg", "hp"), +##D covar_pop(df$mpg, df$hp), covar_pop("mpg", "hp"))) +## End(Not run) + +## Not run: +##D cov(df, "mpg", "hp") +##D cov(df, df$mpg, df$hp) +## End(Not run) +</code></pre> + + +<hr /><div style="text-align: center;">[Package <em>SparkR</em> version 2.4.0 <a href="00Index.html">Index</a>]</div> +</body></html> http://git-wip-us.apache.org/repos/asf/spark-website/blob/52917ac4/site/docs/2.4.0/api/R/createDataFrame.html ---------------------------------------------------------------------- diff --git a/site/docs/2.4.0/api/R/createDataFrame.html b/site/docs/2.4.0/api/R/createDataFrame.html new file mode 100644 index 0000000..74aa58d --- /dev/null +++ b/site/docs/2.4.0/api/R/createDataFrame.html @@ -0,0 +1,90 @@ +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"><html xmlns="http://www.w3.org/1999/xhtml"><head><title>R: Create a SparkDataFrame</title> +<meta 
http-equiv="Content-Type" content="text/html; charset=utf-8" /> +<link rel="stylesheet" type="text/css" href="R.css" /> + +<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/styles/github.min.css"> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/highlight.min.js"></script> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/languages/r.min.js"></script> +<script>hljs.initHighlightingOnLoad();</script> +</head><body> + +<table width="100%" summary="page for createDataFrame {SparkR}"><tr><td>createDataFrame {SparkR}</td><td style="text-align: right;">R Documentation</td></tr></table> + +<h2>Create a SparkDataFrame</h2> + +<h3>Description</h3> + +<p>Converts R data.frame or list into SparkDataFrame. +</p> + + +<h3>Usage</h3> + +<pre> +## Default S3 method: +createDataFrame(data, schema = NULL, + samplingRatio = 1, numPartitions = NULL) + +## Default S3 method: +as.DataFrame(data, schema = NULL, samplingRatio = 1, + numPartitions = NULL) + +as.DataFrame(data, ...) +</pre> + + +<h3>Arguments</h3> + +<table summary="R argblock"> +<tr valign="top"><td><code>data</code></td> +<td> +<p>a list or data.frame.</p> +</td></tr> +<tr valign="top"><td><code>schema</code></td> +<td> +<p>a list of column names or named list (StructType), optional.</p> +</td></tr> +<tr valign="top"><td><code>samplingRatio</code></td> +<td> +<p>Currently not used.</p> +</td></tr> +<tr valign="top"><td><code>numPartitions</code></td> +<td> +<p>the number of partitions of the SparkDataFrame. Defaults to 1; this is +limited by the length of the list or the number of rows of the data.frame.</p> +</td></tr> +<tr valign="top"><td><code>...</code></td> +<td> +<p>additional argument(s).</p> +</td></tr> +</table> + + +<h3>Value</h3> + +<p>A SparkDataFrame. 
+</p> + + +<h3>Note</h3> + +<p>createDataFrame since 1.4.0 +</p> +<p>as.DataFrame since 1.6.0 +</p> + + +<h3>Examples</h3> + +<pre><code class="r">## Not run: +##D sparkR.session() +##D df1 <- as.DataFrame(iris) +##D df2 <- as.DataFrame(list(3,4,5,6)) +##D df3 <- createDataFrame(iris) +##D df4 <- createDataFrame(cars, numPartitions = 2) +## End(Not run) +</code></pre> + + +<hr /><div style="text-align: center;">[Package <em>SparkR</em> version 2.4.0 <a href="00Index.html">Index</a>]</div> +</body></html> http://git-wip-us.apache.org/repos/asf/spark-website/blob/52917ac4/site/docs/2.4.0/api/R/createExternalTable-deprecated.html ---------------------------------------------------------------------- diff --git a/site/docs/2.4.0/api/R/createExternalTable-deprecated.html b/site/docs/2.4.0/api/R/createExternalTable-deprecated.html new file mode 100644 index 0000000..06ea5ea --- /dev/null +++ b/site/docs/2.4.0/api/R/createExternalTable-deprecated.html @@ -0,0 +1,93 @@ +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"><html xmlns="http://www.w3.org/1999/xhtml"><head><title>R: (Deprecated) Create an external table</title> +<meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> +<link rel="stylesheet" type="text/css" href="R.css" /> + +<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/styles/github.min.css"> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/highlight.min.js"></script> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/languages/r.min.js"></script> +<script>hljs.initHighlightingOnLoad();</script> +</head><body> + +<table width="100%" summary="page for createExternalTable {SparkR}"><tr><td>createExternalTable {SparkR}</td><td style="text-align: right;">R Documentation</td></tr></table> + +<h2>(Deprecated) Create an external table</h2> + +<h3>Description</h3> + +<p>Creates an external table based on the dataset in 
a data source. +Returns a SparkDataFrame associated with the external table. +</p> + + +<h3>Usage</h3> + +<pre> +## Default S3 method: +createExternalTable(tableName, path = NULL, + source = NULL, schema = NULL, ...) +</pre> + + +<h3>Arguments</h3> + +<table summary="R argblock"> +<tr valign="top"><td><code>tableName</code></td> +<td> +<p>the name of the table.</p> +</td></tr> +<tr valign="top"><td><code>path</code></td> +<td> +<p>the path of files to load.</p> +</td></tr> +<tr valign="top"><td><code>source</code></td> +<td> +<p>the name of the external data source.</p> +</td></tr> +<tr valign="top"><td><code>schema</code></td> +<td> +<p>the schema of the data required for some data sources.</p> +</td></tr> +<tr valign="top"><td><code>...</code></td> +<td> +<p>additional argument(s) passed to the method.</p> +</td></tr> +</table> + + +<h3>Details</h3> + +<p>The data source is specified by the <code>source</code> and a set of options(...). +If <code>source</code> is not specified, the default data source configured by +"spark.sql.sources.default" will be used. +</p> + + +<h3>Value</h3> + +<p>A SparkDataFrame. 
+</p> + + +<h3>Note</h3> + +<p>createExternalTable since 1.4.0 +</p> + + +<h3>See Also</h3> + +<p><a href="createTable.html">createTable</a> +</p> + + +<h3>Examples</h3> + +<pre><code class="r">## Not run: +##D sparkR.session() +##D df <- createExternalTable("myjson", path="path/to/json", source="json", schema) +## End(Not run) +</code></pre> + + +<hr /><div style="text-align: center;">[Package <em>SparkR</em> version 2.4.0 <a href="00Index.html">Index</a>]</div> +</body></html> http://git-wip-us.apache.org/repos/asf/spark-website/blob/52917ac4/site/docs/2.4.0/api/R/createOrReplaceTempView.html ---------------------------------------------------------------------- diff --git a/site/docs/2.4.0/api/R/createOrReplaceTempView.html b/site/docs/2.4.0/api/R/createOrReplaceTempView.html new file mode 100644 index 0000000..b7ce73d --- /dev/null +++ b/site/docs/2.4.0/api/R/createOrReplaceTempView.html @@ -0,0 +1,112 @@ +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"><html xmlns="http://www.w3.org/1999/xhtml"><head><title>R: Creates a temporary view using the given name.</title> +<meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> +<link rel="stylesheet" type="text/css" href="R.css" /> + +<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/styles/github.min.css"> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/highlight.min.js"></script> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/languages/r.min.js"></script> +<script>hljs.initHighlightingOnLoad();</script> +</head><body> + +<table width="100%" summary="page for createOrReplaceTempView {SparkR}"><tr><td>createOrReplaceTempView {SparkR}</td><td style="text-align: right;">R Documentation</td></tr></table> + +<h2>Creates a temporary view using the given name.</h2> + +<h3>Description</h3> + +<p>Creates a new temporary view using a SparkDataFrame in the Spark Session. 
If a +temporary view with the same name already exists, replaces it. +</p> + + +<h3>Usage</h3> + +<pre> +createOrReplaceTempView(x, viewName) + +## S4 method for signature 'SparkDataFrame,character' +createOrReplaceTempView(x, viewName) +</pre> + + +<h3>Arguments</h3> + +<table summary="R argblock"> +<tr valign="top"><td><code>x</code></td> +<td> +<p>A SparkDataFrame</p> +</td></tr> +<tr valign="top"><td><code>viewName</code></td> +<td> +<p>A character vector containing the name of the table</p> +</td></tr> +</table> + + +<h3>Note</h3> + +<p>createOrReplaceTempView since 2.0.0 +</p> + + +<h3>See Also</h3> + +<p>Other SparkDataFrame functions: <code><a href="SparkDataFrame.html">SparkDataFrame-class</a></code>, +<code><a href="summarize.html">agg</a></code>, <code><a href="alias.html">alias</a></code>, +<code><a href="arrange.html">arrange</a></code>, <code><a href="as.data.frame.html">as.data.frame</a></code>, +<code><a href="attach.html">attach,SparkDataFrame-method</a></code>, +<code><a href="broadcast.html">broadcast</a></code>, <code><a href="cache.html">cache</a></code>, +<code><a href="checkpoint.html">checkpoint</a></code>, <code><a href="coalesce.html">coalesce</a></code>, +<code><a href="collect.html">collect</a></code>, <code><a href="columns.html">colnames</a></code>, +<code><a href="coltypes.html">coltypes</a></code>, <code><a href="crossJoin.html">crossJoin</a></code>, +<code><a href="cube.html">cube</a></code>, <code><a href="dapplyCollect.html">dapplyCollect</a></code>, +<code><a href="dapply.html">dapply</a></code>, <code><a href="describe.html">describe</a></code>, +<code><a href="dim.html">dim</a></code>, <code><a href="distinct.html">distinct</a></code>, +<code><a href="dropDuplicates.html">dropDuplicates</a></code>, <code><a href="nafunctions.html">dropna</a></code>, +<code><a href="drop.html">drop</a></code>, <code><a href="dtypes.html">dtypes</a></code>, +<code><a href="exceptAll.html">exceptAll</a></code>, <code><a 
href="except.html">except</a></code>, +<code><a href="explain.html">explain</a></code>, <code><a href="filter.html">filter</a></code>, +<code><a href="first.html">first</a></code>, <code><a href="gapplyCollect.html">gapplyCollect</a></code>, +<code><a href="gapply.html">gapply</a></code>, <code><a href="getNumPartitions.html">getNumPartitions</a></code>, +<code><a href="groupBy.html">group_by</a></code>, <code><a href="head.html">head</a></code>, +<code><a href="hint.html">hint</a></code>, <code><a href="histogram.html">histogram</a></code>, +<code><a href="insertInto.html">insertInto</a></code>, <code><a href="intersectAll.html">intersectAll</a></code>, +<code><a href="intersect.html">intersect</a></code>, <code><a href="isLocal.html">isLocal</a></code>, +<code><a href="isStreaming.html">isStreaming</a></code>, <code><a href="join.html">join</a></code>, +<code><a href="limit.html">limit</a></code>, <code><a href="localCheckpoint.html">localCheckpoint</a></code>, +<code><a href="merge.html">merge</a></code>, <code><a href="mutate.html">mutate</a></code>, +<code><a href="ncol.html">ncol</a></code>, <code><a href="nrow.html">nrow</a></code>, +<code><a href="persist.html">persist</a></code>, <code><a href="printSchema.html">printSchema</a></code>, +<code><a href="randomSplit.html">randomSplit</a></code>, <code><a href="rbind.html">rbind</a></code>, +<code><a href="rename.html">rename</a></code>, <code><a href="repartitionByRange.html">repartitionByRange</a></code>, +<code><a href="repartition.html">repartition</a></code>, <code><a href="rollup.html">rollup</a></code>, +<code><a href="sample.html">sample</a></code>, <code><a href="saveAsTable.html">saveAsTable</a></code>, +<code><a href="schema.html">schema</a></code>, <code><a href="selectExpr.html">selectExpr</a></code>, +<code><a href="select.html">select</a></code>, <code><a href="showDF.html">showDF</a></code>, +<code><a href="show.html">show</a></code>, <code><a href="storageLevel.html">storageLevel</a></code>, 
+<code><a href="str.html">str</a></code>, <code><a href="subset.html">subset</a></code>, +<code><a href="summary.html">summary</a></code>, <code><a href="take.html">take</a></code>, +<code><a href="toJSON.html">toJSON</a></code>, <code><a href="unionByName.html">unionByName</a></code>, +<code><a href="union.html">union</a></code>, <code><a href="unpersist.html">unpersist</a></code>, +<code><a href="withColumn.html">withColumn</a></code>, <code><a href="withWatermark.html">withWatermark</a></code>, +<code><a href="with.html">with</a></code>, <code><a href="write.df.html">write.df</a></code>, +<code><a href="write.jdbc.html">write.jdbc</a></code>, <code><a href="write.json.html">write.json</a></code>, +<code><a href="write.orc.html">write.orc</a></code>, <code><a href="write.parquet.html">write.parquet</a></code>, +<code><a href="write.stream.html">write.stream</a></code>, <code><a href="write.text.html">write.text</a></code> +</p> + + +<h3>Examples</h3> + +<pre><code class="r">## Not run: +##D sparkR.session() +##D path <- "path/to/file.json" +##D df <- read.json(path) +##D createOrReplaceTempView(df, "json_df") +##D new_df <- sql("SELECT * FROM json_df") +## End(Not run) +</code></pre> + + +<hr /><div style="text-align: center;">[Package <em>SparkR</em> version 2.4.0 <a href="00Index.html">Index</a>]</div> +</body></html> http://git-wip-us.apache.org/repos/asf/spark-website/blob/52917ac4/site/docs/2.4.0/api/R/createTable.html ---------------------------------------------------------------------- diff --git a/site/docs/2.4.0/api/R/createTable.html b/site/docs/2.4.0/api/R/createTable.html new file mode 100644 index 0000000..3490fa9 --- /dev/null +++ b/site/docs/2.4.0/api/R/createTable.html @@ -0,0 +1,91 @@ +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"><html xmlns="http://www.w3.org/1999/xhtml"><head><title>R: Creates a table based on the dataset in a data source</title> +<meta http-equiv="Content-Type" 
content="text/html; charset=utf-8" /> +<link rel="stylesheet" type="text/css" href="R.css" /> + +<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/styles/github.min.css"> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/highlight.min.js"></script> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/languages/r.min.js"></script> +<script>hljs.initHighlightingOnLoad();</script> +</head><body> + +<table width="100%" summary="page for createTable {SparkR}"><tr><td>createTable {SparkR}</td><td style="text-align: right;">R Documentation</td></tr></table> + +<h2>Creates a table based on the dataset in a data source</h2> + +<h3>Description</h3> + +<p>Creates a table based on the dataset in a data source. Returns a SparkDataFrame associated with +the table. +</p> + + +<h3>Usage</h3> + +<pre> +createTable(tableName, path = NULL, source = NULL, schema = NULL, + ...) +</pre> + + +<h3>Arguments</h3> + +<table summary="R argblock"> +<tr valign="top"><td><code>tableName</code></td> +<td> +<p>the qualified or unqualified name that designates a table. If no database +identifier is provided, it refers to a table in the current database.</p> +</td></tr> +<tr valign="top"><td><code>path</code></td> +<td> +<p>(optional) the path of files to load.</p> +</td></tr> +<tr valign="top"><td><code>source</code></td> +<td> +<p>(optional) the name of the data source.</p> +</td></tr> +<tr valign="top"><td><code>schema</code></td> +<td> +<p>(optional) the schema of the data required for some data sources.</p> +</td></tr> +<tr valign="top"><td><code>...</code></td> +<td> +<p>additional named parameters as options for the data source.</p> +</td></tr> +</table> + + +<h3>Details</h3> + +<p>The data source is specified by the <code>source</code> and a set of options(...). +If <code>source</code> is not specified, the default data source configured by +"spark.sql.sources.default" will be used. 
When a <code>path</code> is specified, an external table is +created from the data at the given path. Otherwise a managed table is created. +</p> + + +<h3>Value</h3> + +<p>A SparkDataFrame. +</p> + + +<h3>Note</h3> + +<p>createTable since 2.2.0 +</p> + + +<h3>Examples</h3> + +<pre><code class="r">## Not run: +##D sparkR.session() +##D df <- createTable("myjson", path="path/to/json", source="json", schema) +##D +##D createTable("people", source = "json", schema = schema) +##D insertInto(df, "people") +## End(Not run) +</code></pre> + + +<hr /><div style="text-align: center;">[Package <em>SparkR</em> version 2.4.0 <a href="00Index.html">Index</a>]</div> +</body></html> http://git-wip-us.apache.org/repos/asf/spark-website/blob/52917ac4/site/docs/2.4.0/api/R/crossJoin.html ---------------------------------------------------------------------- diff --git a/site/docs/2.4.0/api/R/crossJoin.html b/site/docs/2.4.0/api/R/crossJoin.html new file mode 100644 index 0000000..379bf88 --- /dev/null +++ b/site/docs/2.4.0/api/R/crossJoin.html @@ -0,0 +1,117 @@ +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"><html xmlns="http://www.w3.org/1999/xhtml"><head><title>R: CrossJoin</title> +<meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> +<link rel="stylesheet" type="text/css" href="R.css" /> + +<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/styles/github.min.css"> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/highlight.min.js"></script> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/languages/r.min.js"></script> +<script>hljs.initHighlightingOnLoad();</script> +</head><body> + +<table width="100%" summary="page for crossJoin {SparkR}"><tr><td>crossJoin {SparkR}</td><td style="text-align: right;">R Documentation</td></tr></table> + +<h2>CrossJoin</h2> + +<h3>Description</h3> + +<p>Returns Cartesian Product on two 
SparkDataFrames. +</p> + + +<h3>Usage</h3> + +<pre> +## S4 method for signature 'SparkDataFrame,SparkDataFrame' +crossJoin(x, y) +</pre> + + +<h3>Arguments</h3> + +<table summary="R argblock"> +<tr valign="top"><td><code>x</code></td> +<td> +<p>A SparkDataFrame</p> +</td></tr> +<tr valign="top"><td><code>y</code></td> +<td> +<p>A SparkDataFrame</p> +</td></tr> +</table> + + +<h3>Value</h3> + +<p>A SparkDataFrame containing the result of the join operation. +</p> + + +<h3>Note</h3> + +<p>crossJoin since 2.1.0 +</p> + + +<h3>See Also</h3> + +<p><a href="merge.html">merge</a> <a href="join.html">join</a> +</p> +<p>Other SparkDataFrame functions: <code><a href="SparkDataFrame.html">SparkDataFrame-class</a></code>, +<code><a href="summarize.html">agg</a></code>, <code><a href="alias.html">alias</a></code>, +<code><a href="arrange.html">arrange</a></code>, <code><a href="as.data.frame.html">as.data.frame</a></code>, +<code><a href="attach.html">attach,SparkDataFrame-method</a></code>, +<code><a href="broadcast.html">broadcast</a></code>, <code><a href="cache.html">cache</a></code>, +<code><a href="checkpoint.html">checkpoint</a></code>, <code><a href="coalesce.html">coalesce</a></code>, +<code><a href="collect.html">collect</a></code>, <code><a href="columns.html">colnames</a></code>, +<code><a href="coltypes.html">coltypes</a></code>, +<code><a href="createOrReplaceTempView.html">createOrReplaceTempView</a></code>, +<code><a href="cube.html">cube</a></code>, <code><a href="dapplyCollect.html">dapplyCollect</a></code>, +<code><a href="dapply.html">dapply</a></code>, <code><a href="describe.html">describe</a></code>, +<code><a href="dim.html">dim</a></code>, <code><a href="distinct.html">distinct</a></code>, +<code><a href="dropDuplicates.html">dropDuplicates</a></code>, <code><a href="nafunctions.html">dropna</a></code>, +<code><a href="drop.html">drop</a></code>, <code><a href="dtypes.html">dtypes</a></code>, +<code><a href="exceptAll.html">exceptAll</a></code>, 
<code><a href="except.html">except</a></code>, +<code><a href="explain.html">explain</a></code>, <code><a href="filter.html">filter</a></code>, +<code><a href="first.html">first</a></code>, <code><a href="gapplyCollect.html">gapplyCollect</a></code>, +<code><a href="gapply.html">gapply</a></code>, <code><a href="getNumPartitions.html">getNumPartitions</a></code>, +<code><a href="groupBy.html">group_by</a></code>, <code><a href="head.html">head</a></code>, +<code><a href="hint.html">hint</a></code>, <code><a href="histogram.html">histogram</a></code>, +<code><a href="insertInto.html">insertInto</a></code>, <code><a href="intersectAll.html">intersectAll</a></code>, +<code><a href="intersect.html">intersect</a></code>, <code><a href="isLocal.html">isLocal</a></code>, +<code><a href="isStreaming.html">isStreaming</a></code>, <code><a href="join.html">join</a></code>, +<code><a href="limit.html">limit</a></code>, <code><a href="localCheckpoint.html">localCheckpoint</a></code>, +<code><a href="merge.html">merge</a></code>, <code><a href="mutate.html">mutate</a></code>, +<code><a href="ncol.html">ncol</a></code>, <code><a href="nrow.html">nrow</a></code>, +<code><a href="persist.html">persist</a></code>, <code><a href="printSchema.html">printSchema</a></code>, +<code><a href="randomSplit.html">randomSplit</a></code>, <code><a href="rbind.html">rbind</a></code>, +<code><a href="rename.html">rename</a></code>, <code><a href="repartitionByRange.html">repartitionByRange</a></code>, +<code><a href="repartition.html">repartition</a></code>, <code><a href="rollup.html">rollup</a></code>, +<code><a href="sample.html">sample</a></code>, <code><a href="saveAsTable.html">saveAsTable</a></code>, +<code><a href="schema.html">schema</a></code>, <code><a href="selectExpr.html">selectExpr</a></code>, +<code><a href="select.html">select</a></code>, <code><a href="showDF.html">showDF</a></code>, +<code><a href="show.html">show</a></code>, <code><a 
href="storageLevel.html">storageLevel</a></code>, +<code><a href="str.html">str</a></code>, <code><a href="subset.html">subset</a></code>, +<code><a href="summary.html">summary</a></code>, <code><a href="take.html">take</a></code>, +<code><a href="toJSON.html">toJSON</a></code>, <code><a href="unionByName.html">unionByName</a></code>, +<code><a href="union.html">union</a></code>, <code><a href="unpersist.html">unpersist</a></code>, +<code><a href="withColumn.html">withColumn</a></code>, <code><a href="withWatermark.html">withWatermark</a></code>, +<code><a href="with.html">with</a></code>, <code><a href="write.df.html">write.df</a></code>, +<code><a href="write.jdbc.html">write.jdbc</a></code>, <code><a href="write.json.html">write.json</a></code>, +<code><a href="write.orc.html">write.orc</a></code>, <code><a href="write.parquet.html">write.parquet</a></code>, +<code><a href="write.stream.html">write.stream</a></code>, <code><a href="write.text.html">write.text</a></code> +</p> + + +<h3>Examples</h3> + +<pre><code class="r">## Not run: +##D sparkR.session() +##D df1 <- read.json(path) +##D df2 <- read.json(path2) +##D crossJoin(df1, df2) # Performs a Cartesian product +## End(Not run) +</code></pre> + + +<hr /><div style="text-align: center;">[Package <em>SparkR</em> version 2.4.0 <a href="00Index.html">Index</a>]</div> +</body></html> http://git-wip-us.apache.org/repos/asf/spark-website/blob/52917ac4/site/docs/2.4.0/api/R/crosstab.html ---------------------------------------------------------------------- diff --git a/site/docs/2.4.0/api/R/crosstab.html b/site/docs/2.4.0/api/R/crosstab.html new file mode 100644 index 0000000..5e80529 --- /dev/null +++ b/site/docs/2.4.0/api/R/crosstab.html @@ -0,0 +1,82 @@ +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"><html xmlns="http://www.w3.org/1999/xhtml"><head><title>R: Computes a pair-wise frequency table of the given columns</title> +<meta http-equiv="Content-Type" 
content="text/html; charset=utf-8" /> +<link rel="stylesheet" type="text/css" href="R.css" /> + +<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/styles/github.min.css"> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/highlight.min.js"></script> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/languages/r.min.js"></script> +<script>hljs.initHighlightingOnLoad();</script> +</head><body> + +<table width="100%" summary="page for crosstab {SparkR}"><tr><td>crosstab {SparkR}</td><td style="text-align: right;">R Documentation</td></tr></table> + +<h2>Computes a pair-wise frequency table of the given columns</h2> + +<h3>Description</h3> + +<p>Computes a pair-wise frequency table of the given columns. Also known as a contingency +table. The number of distinct values for each column should be less than 1e4. At most 1e6 +non-zero pair frequencies will be returned. +</p> + + +<h3>Usage</h3> + +<pre> +## S4 method for signature 'SparkDataFrame,character,character' +crosstab(x, col1, col2) +</pre> + + +<h3>Arguments</h3> + +<table summary="R argblock"> +<tr valign="top"><td><code>x</code></td> +<td> +<p>a SparkDataFrame</p> +</td></tr> +<tr valign="top"><td><code>col1</code></td> +<td> +<p>name of the first column. Distinct items will make the first item of each row.</p> +</td></tr> +<tr valign="top"><td><code>col2</code></td> +<td> +<p>name of the second column. Distinct items will make the column names of the output.</p> +</td></tr> +</table> + + +<h3>Value</h3> + +<p>a local R data.frame representing the contingency table. The first column of each row +will be the distinct values of <code>col1</code> and the column names will be the distinct +values of <code>col2</code>. The name of the first column will be "<code>col1</code>_<code>col2</code>". +Pairs that have no occurrences will have zero as their counts. 
+</p> + + +<h3>Note</h3> + +<p>crosstab since 1.5.0 +</p> + + +<h3>See Also</h3> + +<p>Other stat functions: <code><a href="approxQuantile.html">approxQuantile</a></code>, +<code><a href="corr.html">corr</a></code>, <code><a href="cov.html">cov</a></code>, +<code><a href="freqItems.html">freqItems</a></code>, <code><a href="sampleBy.html">sampleBy</a></code> +</p> + + +<h3>Examples</h3> + +<pre><code class="r">## Not run: +##D df <- read.json("/path/to/file.json") +##D ct <- crosstab(df, "title", "gender") +## End(Not run) +</code></pre> + + +<hr /><div style="text-align: center;">[Package <em>SparkR</em> version 2.4.0 <a href="00Index.html">Index</a>]</div> +</body></html> http://git-wip-us.apache.org/repos/asf/spark-website/blob/52917ac4/site/docs/2.4.0/api/R/cube.html ---------------------------------------------------------------------- diff --git a/site/docs/2.4.0/api/R/cube.html b/site/docs/2.4.0/api/R/cube.html new file mode 100644 index 0000000..136cf6b --- /dev/null +++ b/site/docs/2.4.0/api/R/cube.html @@ -0,0 +1,128 @@ +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"><html xmlns="http://www.w3.org/1999/xhtml"><head><title>R: cube</title> +<meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> +<link rel="stylesheet" type="text/css" href="R.css" /> + +<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/styles/github.min.css"> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/highlight.min.js"></script> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/languages/r.min.js"></script> +<script>hljs.initHighlightingOnLoad();</script> +</head><body> + +<table width="100%" summary="page for cube {SparkR}"><tr><td>cube {SparkR}</td><td style="text-align: right;">R Documentation</td></tr></table> + +<h2>cube</h2> + +<h3>Description</h3> + +<p>Create a multi-dimensional cube for the SparkDataFrame using the specified 
columns. +</p> + + +<h3>Usage</h3> + +<pre> +cube(x, ...) + +## S4 method for signature 'SparkDataFrame' +cube(x, ...) +</pre> + + +<h3>Arguments</h3> + +<table summary="R argblock"> +<tr valign="top"><td><code>x</code></td> +<td> +<p>a SparkDataFrame.</p> +</td></tr> +<tr valign="top"><td><code>...</code></td> +<td> +<p>character name(s) or Column(s) to group on.</p> +</td></tr> +</table> + + +<h3>Details</h3> + +<p>If grouping expression is missing <code>cube</code> creates a single global aggregate and is +equivalent to direct application of <a href="summarize.html">agg</a>. +</p> + + +<h3>Value</h3> + +<p>A GroupedData. +</p> + + +<h3>Note</h3> + +<p>cube since 2.3.0 +</p> + + +<h3>See Also</h3> + +<p><a href="summarize.html">agg</a>, <a href="groupBy.html">groupBy</a>, <a href="rollup.html">rollup</a> +</p> +<p>Other SparkDataFrame functions: <code><a href="SparkDataFrame.html">SparkDataFrame-class</a></code>, +<code><a href="summarize.html">agg</a></code>, <code><a href="alias.html">alias</a></code>, +<code><a href="arrange.html">arrange</a></code>, <code><a href="as.data.frame.html">as.data.frame</a></code>, +<code><a href="attach.html">attach,SparkDataFrame-method</a></code>, +<code><a href="broadcast.html">broadcast</a></code>, <code><a href="cache.html">cache</a></code>, +<code><a href="checkpoint.html">checkpoint</a></code>, <code><a href="coalesce.html">coalesce</a></code>, +<code><a href="collect.html">collect</a></code>, <code><a href="columns.html">colnames</a></code>, +<code><a href="coltypes.html">coltypes</a></code>, +<code><a href="createOrReplaceTempView.html">createOrReplaceTempView</a></code>, +<code><a href="crossJoin.html">crossJoin</a></code>, <code><a href="dapplyCollect.html">dapplyCollect</a></code>, +<code><a href="dapply.html">dapply</a></code>, <code><a href="describe.html">describe</a></code>, +<code><a href="dim.html">dim</a></code>, <code><a href="distinct.html">distinct</a></code>, +<code><a 
href="dropDuplicates.html">dropDuplicates</a></code>, <code><a href="nafunctions.html">dropna</a></code>, +<code><a href="drop.html">drop</a></code>, <code><a href="dtypes.html">dtypes</a></code>, +<code><a href="exceptAll.html">exceptAll</a></code>, <code><a href="except.html">except</a></code>, +<code><a href="explain.html">explain</a></code>, <code><a href="filter.html">filter</a></code>, +<code><a href="first.html">first</a></code>, <code><a href="gapplyCollect.html">gapplyCollect</a></code>, +<code><a href="gapply.html">gapply</a></code>, <code><a href="getNumPartitions.html">getNumPartitions</a></code>, +<code><a href="groupBy.html">group_by</a></code>, <code><a href="head.html">head</a></code>, +<code><a href="hint.html">hint</a></code>, <code><a href="histogram.html">histogram</a></code>, +<code><a href="insertInto.html">insertInto</a></code>, <code><a href="intersectAll.html">intersectAll</a></code>, +<code><a href="intersect.html">intersect</a></code>, <code><a href="isLocal.html">isLocal</a></code>, +<code><a href="isStreaming.html">isStreaming</a></code>, <code><a href="join.html">join</a></code>, +<code><a href="limit.html">limit</a></code>, <code><a href="localCheckpoint.html">localCheckpoint</a></code>, +<code><a href="merge.html">merge</a></code>, <code><a href="mutate.html">mutate</a></code>, +<code><a href="ncol.html">ncol</a></code>, <code><a href="nrow.html">nrow</a></code>, +<code><a href="persist.html">persist</a></code>, <code><a href="printSchema.html">printSchema</a></code>, +<code><a href="randomSplit.html">randomSplit</a></code>, <code><a href="rbind.html">rbind</a></code>, +<code><a href="rename.html">rename</a></code>, <code><a href="repartitionByRange.html">repartitionByRange</a></code>, +<code><a href="repartition.html">repartition</a></code>, <code><a href="rollup.html">rollup</a></code>, +<code><a href="sample.html">sample</a></code>, <code><a href="saveAsTable.html">saveAsTable</a></code>, +<code><a 
href="schema.html">schema</a></code>, <code><a href="selectExpr.html">selectExpr</a></code>, +<code><a href="select.html">select</a></code>, <code><a href="showDF.html">showDF</a></code>, +<code><a href="show.html">show</a></code>, <code><a href="storageLevel.html">storageLevel</a></code>, +<code><a href="str.html">str</a></code>, <code><a href="subset.html">subset</a></code>, +<code><a href="summary.html">summary</a></code>, <code><a href="take.html">take</a></code>, +<code><a href="toJSON.html">toJSON</a></code>, <code><a href="unionByName.html">unionByName</a></code>, +<code><a href="union.html">union</a></code>, <code><a href="unpersist.html">unpersist</a></code>, +<code><a href="withColumn.html">withColumn</a></code>, <code><a href="withWatermark.html">withWatermark</a></code>, +<code><a href="with.html">with</a></code>, <code><a href="write.df.html">write.df</a></code>, +<code><a href="write.jdbc.html">write.jdbc</a></code>, <code><a href="write.json.html">write.json</a></code>, +<code><a href="write.orc.html">write.orc</a></code>, <code><a href="write.parquet.html">write.parquet</a></code>, +<code><a href="write.stream.html">write.stream</a></code>, <code><a href="write.text.html">write.text</a></code> +</p> + + +<h3>Examples</h3> + +<pre><code class="r">## Not run: +##D df <- createDataFrame(mtcars) +##D mean(cube(df, "cyl", "gear", "am"), "mpg") +##D +##D # Following calls are equivalent +##D agg(cube(df), mean(df$mpg)) +##D agg(df, mean(df$mpg)) +## End(Not run) +</code></pre> + + +<hr /><div style="text-align: center;">[Package <em>SparkR</em> version 2.4.0 <a href="00Index.html">Index</a>]</div> +</body></html> http://git-wip-us.apache.org/repos/asf/spark-website/blob/52917ac4/site/docs/2.4.0/api/R/currentDatabase.html ---------------------------------------------------------------------- diff --git a/site/docs/2.4.0/api/R/currentDatabase.html b/site/docs/2.4.0/api/R/currentDatabase.html new file mode 100644 index 0000000..2979c89 --- /dev/null +++ 
b/site/docs/2.4.0/api/R/currentDatabase.html @@ -0,0 +1,50 @@ +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"><html xmlns="http://www.w3.org/1999/xhtml"><head><title>R: Returns the current default database</title> +<meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> +<link rel="stylesheet" type="text/css" href="R.css" /> + +<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/styles/github.min.css"> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/highlight.min.js"></script> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/languages/r.min.js"></script> +<script>hljs.initHighlightingOnLoad();</script> +</head><body> + +<table width="100%" summary="page for currentDatabase {SparkR}"><tr><td>currentDatabase {SparkR}</td><td style="text-align: right;">R Documentation</td></tr></table> + +<h2>Returns the current default database</h2> + +<h3>Description</h3> + +<p>Returns the current default database. +</p> + + +<h3>Usage</h3> + +<pre> +currentDatabase() +</pre> + + +<h3>Value</h3> + +<p>name of the current default database. 
+</p> + + +<h3>Note</h3> + +<p>currentDatabase since 2.2.0 +</p> + + +<h3>Examples</h3> + +<pre><code class="r">## Not run: +##D sparkR.session() +##D currentDatabase() +## End(Not run) +</code></pre> + + +<hr /><div style="text-align: center;">[Package <em>SparkR</em> version 2.4.0 <a href="00Index.html">Index</a>]</div> +</body></html> http://git-wip-us.apache.org/repos/asf/spark-website/blob/52917ac4/site/docs/2.4.0/api/R/dapply.html ---------------------------------------------------------------------- diff --git a/site/docs/2.4.0/api/R/dapply.html b/site/docs/2.4.0/api/R/dapply.html new file mode 100644 index 0000000..631db32 --- /dev/null +++ b/site/docs/2.4.0/api/R/dapply.html @@ -0,0 +1,152 @@ +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"><html xmlns="http://www.w3.org/1999/xhtml"><head><title>R: dapply</title> +<meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> +<link rel="stylesheet" type="text/css" href="R.css" /> + +<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/styles/github.min.css"> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/highlight.min.js"></script> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/languages/r.min.js"></script> +<script>hljs.initHighlightingOnLoad();</script> +</head><body> + +<table width="100%" summary="page for dapply {SparkR}"><tr><td>dapply {SparkR}</td><td style="text-align: right;">R Documentation</td></tr></table> + +<h2>dapply</h2> + +<h3>Description</h3> + +<p>Apply a function to each partition of a SparkDataFrame. 
+</p> + + +<h3>Usage</h3> + +<pre> +dapply(x, func, schema) + +## S4 method for signature 'SparkDataFrame,'function',characterOrstructType' +dapply(x, func, + schema) +</pre> + + +<h3>Arguments</h3> + +<table summary="R argblock"> +<tr valign="top"><td><code>x</code></td> +<td> +<p>A SparkDataFrame</p> +</td></tr> +<tr valign="top"><td><code>func</code></td> +<td> +<p>A function to be applied to each partition of the SparkDataFrame. +func should have only one parameter, to which an R data.frame corresponding +to each partition will be passed. +The output of func should be an R data.frame.</p> +</td></tr> +<tr valign="top"><td><code>schema</code></td> +<td> +<p>The schema of the resulting SparkDataFrame after the function is applied. +It must match the output of func. Since Spark 2.3, the DDL-formatted string +is also supported for the schema.</p> +</td></tr> +</table> + + +<h3>Note</h3> + +<p>dapply since 2.0.0 +</p> + + +<h3>See Also</h3> + +<p><a href="dapplyCollect.html">dapplyCollect</a> +</p> +<p>Other SparkDataFrame functions: <code><a href="SparkDataFrame.html">SparkDataFrame-class</a></code>, +<code><a href="summarize.html">agg</a></code>, <code><a href="alias.html">alias</a></code>, +<code><a href="arrange.html">arrange</a></code>, <code><a href="as.data.frame.html">as.data.frame</a></code>, +<code><a href="attach.html">attach,SparkDataFrame-method</a></code>, +<code><a href="broadcast.html">broadcast</a></code>, <code><a href="cache.html">cache</a></code>, +<code><a href="checkpoint.html">checkpoint</a></code>, <code><a href="coalesce.html">coalesce</a></code>, +<code><a href="collect.html">collect</a></code>, <code><a href="columns.html">colnames</a></code>, +<code><a href="coltypes.html">coltypes</a></code>, +<code><a href="createOrReplaceTempView.html">createOrReplaceTempView</a></code>, +<code><a href="crossJoin.html">crossJoin</a></code>, <code><a href="cube.html">cube</a></code>, +<code><a href="dapplyCollect.html">dapplyCollect</a></code>, <code><a 
href="describe.html">describe</a></code>, +<code><a href="dim.html">dim</a></code>, <code><a href="distinct.html">distinct</a></code>, +<code><a href="dropDuplicates.html">dropDuplicates</a></code>, <code><a href="nafunctions.html">dropna</a></code>, +<code><a href="drop.html">drop</a></code>, <code><a href="dtypes.html">dtypes</a></code>, +<code><a href="exceptAll.html">exceptAll</a></code>, <code><a href="except.html">except</a></code>, +<code><a href="explain.html">explain</a></code>, <code><a href="filter.html">filter</a></code>, +<code><a href="first.html">first</a></code>, <code><a href="gapplyCollect.html">gapplyCollect</a></code>, +<code><a href="gapply.html">gapply</a></code>, <code><a href="getNumPartitions.html">getNumPartitions</a></code>, +<code><a href="groupBy.html">group_by</a></code>, <code><a href="head.html">head</a></code>, +<code><a href="hint.html">hint</a></code>, <code><a href="histogram.html">histogram</a></code>, +<code><a href="insertInto.html">insertInto</a></code>, <code><a href="intersectAll.html">intersectAll</a></code>, +<code><a href="intersect.html">intersect</a></code>, <code><a href="isLocal.html">isLocal</a></code>, +<code><a href="isStreaming.html">isStreaming</a></code>, <code><a href="join.html">join</a></code>, +<code><a href="limit.html">limit</a></code>, <code><a href="localCheckpoint.html">localCheckpoint</a></code>, +<code><a href="merge.html">merge</a></code>, <code><a href="mutate.html">mutate</a></code>, +<code><a href="ncol.html">ncol</a></code>, <code><a href="nrow.html">nrow</a></code>, +<code><a href="persist.html">persist</a></code>, <code><a href="printSchema.html">printSchema</a></code>, +<code><a href="randomSplit.html">randomSplit</a></code>, <code><a href="rbind.html">rbind</a></code>, +<code><a href="rename.html">rename</a></code>, <code><a href="repartitionByRange.html">repartitionByRange</a></code>, +<code><a href="repartition.html">repartition</a></code>, <code><a href="rollup.html">rollup</a></code>, 
+<code><a href="sample.html">sample</a></code>, <code><a href="saveAsTable.html">saveAsTable</a></code>, +<code><a href="schema.html">schema</a></code>, <code><a href="selectExpr.html">selectExpr</a></code>, +<code><a href="select.html">select</a></code>, <code><a href="showDF.html">showDF</a></code>, +<code><a href="show.html">show</a></code>, <code><a href="storageLevel.html">storageLevel</a></code>, +<code><a href="str.html">str</a></code>, <code><a href="subset.html">subset</a></code>, +<code><a href="summary.html">summary</a></code>, <code><a href="take.html">take</a></code>, +<code><a href="toJSON.html">toJSON</a></code>, <code><a href="unionByName.html">unionByName</a></code>, +<code><a href="union.html">union</a></code>, <code><a href="unpersist.html">unpersist</a></code>, +<code><a href="withColumn.html">withColumn</a></code>, <code><a href="withWatermark.html">withWatermark</a></code>, +<code><a href="with.html">with</a></code>, <code><a href="write.df.html">write.df</a></code>, +<code><a href="write.jdbc.html">write.jdbc</a></code>, <code><a href="write.json.html">write.json</a></code>, +<code><a href="write.orc.html">write.orc</a></code>, <code><a href="write.parquet.html">write.parquet</a></code>, +<code><a href="write.stream.html">write.stream</a></code>, <code><a href="write.text.html">write.text</a></code> +</p> + + +<h3>Examples</h3> + +<pre><code class="r">## Not run: +##D df <- createDataFrame(iris) +##D df1 <- dapply(df, function(x) { x }, schema(df)) +##D collect(df1) +##D +##D # filter and add a column +##D df <- createDataFrame( +##D list(list(1L, 1, "1"), list(2L, 2, "2"), list(3L, 3, "3")), +##D c("a", "b", "c")) +##D schema <- structType(structField("a", "integer"), structField("b", "double"), +##D structField("c", "string"), structField("d", "integer")) +##D df1 <- dapply( +##D df, +##D function(x) { +##D y <- x[x[1] > 1, ] +##D y <- cbind(y, y[1] + 1L) +##D }, +##D schema) +##D +##D # The schema also can be specified in a DDL-formatted 
string. +##D schema <- "a INT, b DOUBLE, c STRING, d INT" +##D df1 <- dapply( +##D df, +##D function(x) { +##D y <- x[x[1] > 1, ] +##D y <- cbind(y, y[1] + 1L) +##D }, +##D schema) +##D +##D collect(df1) +##D # the result +##D # a b c d +##D # 1 2 2 2 3 +##D # 2 3 3 3 4 +## End(Not run) +</code></pre> + + +<hr /><div style="text-align: center;">[Package <em>SparkR</em> version 2.4.0 <a href="00Index.html">Index</a>]</div> +</body></html> http://git-wip-us.apache.org/repos/asf/spark-website/blob/52917ac4/site/docs/2.4.0/api/R/dapplyCollect.html ---------------------------------------------------------------------- diff --git a/site/docs/2.4.0/api/R/dapplyCollect.html b/site/docs/2.4.0/api/R/dapplyCollect.html new file mode 100644 index 0000000..8a795a1 --- /dev/null +++ b/site/docs/2.4.0/api/R/dapplyCollect.html @@ -0,0 +1,130 @@ +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"><html xmlns="http://www.w3.org/1999/xhtml"><head><title>R: dapplyCollect</title> +<meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> +<link rel="stylesheet" type="text/css" href="R.css" /> + +<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/styles/github.min.css"> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/highlight.min.js"></script> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/languages/r.min.js"></script> +<script>hljs.initHighlightingOnLoad();</script> +</head><body> + +<table width="100%" summary="page for dapplyCollect {SparkR}"><tr><td>dapplyCollect {SparkR}</td><td style="text-align: right;">R Documentation</td></tr></table> + +<h2>dapplyCollect</h2> + +<h3>Description</h3> + +<p>Apply a function to each partition of a SparkDataFrame and collect the result back +to R as a data.frame. 
+</p> + + +<h3>Usage</h3> + +<pre> +dapplyCollect(x, func) + +## S4 method for signature 'SparkDataFrame,'function'' +dapplyCollect(x, func) +</pre> + + +<h3>Arguments</h3> + +<table summary="R argblock"> +<tr valign="top"><td><code>x</code></td> +<td> +<p>A SparkDataFrame</p> +</td></tr> +<tr valign="top"><td><code>func</code></td> +<td> +<p>A function to be applied to each partition of the SparkDataFrame. +func should have only one parameter, to which an R data.frame corresponding +to each partition will be passed. +The output of func should be an R data.frame.</p> +</td></tr> +</table> + + +<h3>Note</h3> + +<p>dapplyCollect since 2.0.0 +</p> + + +<h3>See Also</h3> + +<p><a href="dapply.html">dapply</a> +</p> +<p>Other SparkDataFrame functions: <code><a href="SparkDataFrame.html">SparkDataFrame-class</a></code>, +<code><a href="summarize.html">agg</a></code>, <code><a href="alias.html">alias</a></code>, +<code><a href="arrange.html">arrange</a></code>, <code><a href="as.data.frame.html">as.data.frame</a></code>, +<code><a href="attach.html">attach,SparkDataFrame-method</a></code>, +<code><a href="broadcast.html">broadcast</a></code>, <code><a href="cache.html">cache</a></code>, +<code><a href="checkpoint.html">checkpoint</a></code>, <code><a href="coalesce.html">coalesce</a></code>, +<code><a href="collect.html">collect</a></code>, <code><a href="columns.html">colnames</a></code>, +<code><a href="coltypes.html">coltypes</a></code>, +<code><a href="createOrReplaceTempView.html">createOrReplaceTempView</a></code>, +<code><a href="crossJoin.html">crossJoin</a></code>, <code><a href="cube.html">cube</a></code>, +<code><a href="dapply.html">dapply</a></code>, <code><a href="describe.html">describe</a></code>, +<code><a href="dim.html">dim</a></code>, <code><a href="distinct.html">distinct</a></code>, +<code><a href="dropDuplicates.html">dropDuplicates</a></code>, <code><a href="nafunctions.html">dropna</a></code>, +<code><a href="drop.html">drop</a></code>, <code><a 
href="dtypes.html">dtypes</a></code>, +<code><a href="exceptAll.html">exceptAll</a></code>, <code><a href="except.html">except</a></code>, +<code><a href="explain.html">explain</a></code>, <code><a href="filter.html">filter</a></code>, +<code><a href="first.html">first</a></code>, <code><a href="gapplyCollect.html">gapplyCollect</a></code>, +<code><a href="gapply.html">gapply</a></code>, <code><a href="getNumPartitions.html">getNumPartitions</a></code>, +<code><a href="groupBy.html">group_by</a></code>, <code><a href="head.html">head</a></code>, +<code><a href="hint.html">hint</a></code>, <code><a href="histogram.html">histogram</a></code>, +<code><a href="insertInto.html">insertInto</a></code>, <code><a href="intersectAll.html">intersectAll</a></code>, +<code><a href="intersect.html">intersect</a></code>, <code><a href="isLocal.html">isLocal</a></code>, +<code><a href="isStreaming.html">isStreaming</a></code>, <code><a href="join.html">join</a></code>, +<code><a href="limit.html">limit</a></code>, <code><a href="localCheckpoint.html">localCheckpoint</a></code>, +<code><a href="merge.html">merge</a></code>, <code><a href="mutate.html">mutate</a></code>, +<code><a href="ncol.html">ncol</a></code>, <code><a href="nrow.html">nrow</a></code>, +<code><a href="persist.html">persist</a></code>, <code><a href="printSchema.html">printSchema</a></code>, +<code><a href="randomSplit.html">randomSplit</a></code>, <code><a href="rbind.html">rbind</a></code>, +<code><a href="rename.html">rename</a></code>, <code><a href="repartitionByRange.html">repartitionByRange</a></code>, +<code><a href="repartition.html">repartition</a></code>, <code><a href="rollup.html">rollup</a></code>, +<code><a href="sample.html">sample</a></code>, <code><a href="saveAsTable.html">saveAsTable</a></code>, +<code><a href="schema.html">schema</a></code>, <code><a href="selectExpr.html">selectExpr</a></code>, +<code><a href="select.html">select</a></code>, <code><a href="showDF.html">showDF</a></code>, 
+<code><a href="show.html">show</a></code>, <code><a href="storageLevel.html">storageLevel</a></code>, +<code><a href="str.html">str</a></code>, <code><a href="subset.html">subset</a></code>, +<code><a href="summary.html">summary</a></code>, <code><a href="take.html">take</a></code>, +<code><a href="toJSON.html">toJSON</a></code>, <code><a href="unionByName.html">unionByName</a></code>, +<code><a href="union.html">union</a></code>, <code><a href="unpersist.html">unpersist</a></code>, +<code><a href="withColumn.html">withColumn</a></code>, <code><a href="withWatermark.html">withWatermark</a></code>, +<code><a href="with.html">with</a></code>, <code><a href="write.df.html">write.df</a></code>, +<code><a href="write.jdbc.html">write.jdbc</a></code>, <code><a href="write.json.html">write.json</a></code>, +<code><a href="write.orc.html">write.orc</a></code>, <code><a href="write.parquet.html">write.parquet</a></code>, +<code><a href="write.stream.html">write.stream</a></code>, <code><a href="write.text.html">write.text</a></code> +</p> + + +<h3>Examples</h3> + +<pre><code class="r">## Not run: +##D df <- createDataFrame(iris) +##D ldf <- dapplyCollect(df, function(x) { x }) +##D +##D # filter and add a column +##D df <- createDataFrame( +##D list(list(1L, 1, "1"), list(2L, 2, "2"), list(3L, 3, "3")), +##D c("a", "b", "c")) +##D ldf <- dapplyCollect( +##D df, +##D function(x) { +##D y <- x[x[1] > 1, ] +##D y <- cbind(y, y[1] + 1L) +##D }) +##D # the result +##D # a b c d +##D # 2 2 2 3 +##D # 3 3 3 4 +## End(Not run) +</code></pre> + + +<hr /><div style="text-align: center;">[Package <em>SparkR</em> version 2.4.0 <a href="00Index.html">Index</a>]</div> +</body></html> http://git-wip-us.apache.org/repos/asf/spark-website/blob/52917ac4/site/docs/2.4.0/api/R/describe.html ---------------------------------------------------------------------- diff --git a/site/docs/2.4.0/api/R/describe.html b/site/docs/2.4.0/api/R/describe.html new file mode 100644 index 0000000..7c947fb --- 
/dev/null +++ b/site/docs/2.4.0/api/R/describe.html @@ -0,0 +1,131 @@ +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"><html xmlns="http://www.w3.org/1999/xhtml"><head><title>R: describe</title> +<meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> +<link rel="stylesheet" type="text/css" href="R.css" /> + +<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/styles/github.min.css"> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/highlight.min.js"></script> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/languages/r.min.js"></script> +<script>hljs.initHighlightingOnLoad();</script> +</head><body> + +<table width="100%" summary="page for describe {SparkR}"><tr><td>describe {SparkR}</td><td style="text-align: right;">R Documentation</td></tr></table> + +<h2>describe</h2> + +<h3>Description</h3> + +<p>Computes statistics for numeric and string columns. +If no columns are given, this function computes statistics for all numeric or string columns. +</p> + + +<h3>Usage</h3> + +<pre> +describe(x, col, ...) + +## S4 method for signature 'SparkDataFrame,character' +describe(x, col, ...) + +## S4 method for signature 'SparkDataFrame,ANY' +describe(x) +</pre> + + +<h3>Arguments</h3> + +<table summary="R argblock"> +<tr valign="top"><td><code>x</code></td> +<td> +<p>a SparkDataFrame to compute statistics for.</p> +</td></tr> +<tr valign="top"><td><code>col</code></td> +<td> +<p>a string giving a column name.</p> +</td></tr> +<tr valign="top"><td><code>...</code></td> +<td> +<p>additional expressions.</p> +</td></tr> +</table> + + +<h3>Value</h3> + +<p>A SparkDataFrame. +</p> + + +<h3>Note</h3> + +<p>describe(SparkDataFrame, character) since 1.4.0 +</p> +<p>describe(SparkDataFrame) since 1.4.0 +</p> + + +<h3>See Also</h3> + +<p>See <a href="summary.html">summary</a> for expanded statistics and control over which statistics to compute. 
+</p> +<p>Other SparkDataFrame functions: <code><a href="SparkDataFrame.html">SparkDataFrame-class</a></code>, +<code><a href="summarize.html">agg</a></code>, <code><a href="alias.html">alias</a></code>, +<code><a href="arrange.html">arrange</a></code>, <code><a href="as.data.frame.html">as.data.frame</a></code>, +<code><a href="attach.html">attach,SparkDataFrame-method</a></code>, +<code><a href="broadcast.html">broadcast</a></code>, <code><a href="cache.html">cache</a></code>, +<code><a href="checkpoint.html">checkpoint</a></code>, <code><a href="coalesce.html">coalesce</a></code>, +<code><a href="collect.html">collect</a></code>, <code><a href="columns.html">colnames</a></code>, +<code><a href="coltypes.html">coltypes</a></code>, +<code><a href="createOrReplaceTempView.html">createOrReplaceTempView</a></code>, +<code><a href="crossJoin.html">crossJoin</a></code>, <code><a href="cube.html">cube</a></code>, +<code><a href="dapplyCollect.html">dapplyCollect</a></code>, <code><a href="dapply.html">dapply</a></code>, +<code><a href="dim.html">dim</a></code>, <code><a href="distinct.html">distinct</a></code>, +<code><a href="dropDuplicates.html">dropDuplicates</a></code>, <code><a href="nafunctions.html">dropna</a></code>, +<code><a href="drop.html">drop</a></code>, <code><a href="dtypes.html">dtypes</a></code>, +<code><a href="exceptAll.html">exceptAll</a></code>, <code><a href="except.html">except</a></code>, +<code><a href="explain.html">explain</a></code>, <code><a href="filter.html">filter</a></code>, +<code><a href="first.html">first</a></code>, <code><a href="gapplyCollect.html">gapplyCollect</a></code>, +<code><a href="gapply.html">gapply</a></code>, <code><a href="getNumPartitions.html">getNumPartitions</a></code>, +<code><a href="groupBy.html">group_by</a></code>, <code><a href="head.html">head</a></code>, +<code><a href="hint.html">hint</a></code>, <code><a href="histogram.html">histogram</a></code>, +<code><a href="insertInto.html">insertInto</a></code>, 
<code><a href="intersectAll.html">intersectAll</a></code>, +<code><a href="intersect.html">intersect</a></code>, <code><a href="isLocal.html">isLocal</a></code>, +<code><a href="isStreaming.html">isStreaming</a></code>, <code><a href="join.html">join</a></code>, +<code><a href="limit.html">limit</a></code>, <code><a href="localCheckpoint.html">localCheckpoint</a></code>, +<code><a href="merge.html">merge</a></code>, <code><a href="mutate.html">mutate</a></code>, +<code><a href="ncol.html">ncol</a></code>, <code><a href="nrow.html">nrow</a></code>, +<code><a href="persist.html">persist</a></code>, <code><a href="printSchema.html">printSchema</a></code>, +<code><a href="randomSplit.html">randomSplit</a></code>, <code><a href="rbind.html">rbind</a></code>, +<code><a href="rename.html">rename</a></code>, <code><a href="repartitionByRange.html">repartitionByRange</a></code>, +<code><a href="repartition.html">repartition</a></code>, <code><a href="rollup.html">rollup</a></code>, +<code><a href="sample.html">sample</a></code>, <code><a href="saveAsTable.html">saveAsTable</a></code>, +<code><a href="schema.html">schema</a></code>, <code><a href="selectExpr.html">selectExpr</a></code>, +<code><a href="select.html">select</a></code>, <code><a href="showDF.html">showDF</a></code>, +<code><a href="show.html">show</a></code>, <code><a href="storageLevel.html">storageLevel</a></code>, +<code><a href="str.html">str</a></code>, <code><a href="subset.html">subset</a></code>, +<code><a href="summary.html">summary</a></code>, <code><a href="take.html">take</a></code>, +<code><a href="toJSON.html">toJSON</a></code>, <code><a href="unionByName.html">unionByName</a></code>, +<code><a href="union.html">union</a></code>, <code><a href="unpersist.html">unpersist</a></code>, +<code><a href="withColumn.html">withColumn</a></code>, <code><a href="withWatermark.html">withWatermark</a></code>, +<code><a href="with.html">with</a></code>, <code><a href="write.df.html">write.df</a></code>, 
+<code><a href="write.jdbc.html">write.jdbc</a></code>, <code><a href="write.json.html">write.json</a></code>, +<code><a href="write.orc.html">write.orc</a></code>, <code><a href="write.parquet.html">write.parquet</a></code>, +<code><a href="write.stream.html">write.stream</a></code>, <code><a href="write.text.html">write.text</a></code> +</p> + + +<h3>Examples</h3> + +<pre><code class="r">## Not run: +##D sparkR.session() +##D path <- "path/to/file.json" +##D df <- read.json(path) +##D describe(df) +##D describe(df, "col1") +##D describe(df, "col1", "col2") +## End(Not run) +</code></pre> + + +<hr /><div style="text-align: center;">[Package <em>SparkR</em> version 2.4.0 <a href="00Index.html">Index</a>]</div> +</body></html> http://git-wip-us.apache.org/repos/asf/spark-website/blob/52917ac4/site/docs/2.4.0/api/R/dim.html ---------------------------------------------------------------------- diff --git a/site/docs/2.4.0/api/R/dim.html b/site/docs/2.4.0/api/R/dim.html new file mode 100644 index 0000000..9e49945 --- /dev/null +++ b/site/docs/2.4.0/api/R/dim.html @@ -0,0 +1,105 @@ +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"><html xmlns="http://www.w3.org/1999/xhtml"><head><title>R: Returns the dimensions of SparkDataFrame</title> +<meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> +<link rel="stylesheet" type="text/css" href="R.css" /> + +<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/styles/github.min.css"> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/highlight.min.js"></script> +<script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.3/languages/r.min.js"></script> +<script>hljs.initHighlightingOnLoad();</script> +</head><body> + +<table width="100%" summary="page for dim {SparkR}"><tr><td>dim {SparkR}</td><td style="text-align: right;">R Documentation</td></tr></table> + +<h2>Returns the dimensions of 
SparkDataFrame</h2> + +<h3>Description</h3> + +<p>Returns the dimensions (number of rows and columns) of a SparkDataFrame +</p> + + +<h3>Usage</h3> + +<pre> +## S4 method for signature 'SparkDataFrame' +dim(x) +</pre> + + +<h3>Arguments</h3> + +<table summary="R argblock"> +<tr valign="top"><td><code>x</code></td> +<td> +<p>a SparkDataFrame</p> +</td></tr> +</table> + + +<h3>Note</h3> + +<p>dim since 1.5.0 +</p> + + +<h3>See Also</h3> + +<p>Other SparkDataFrame functions: <code><a href="SparkDataFrame.html">SparkDataFrame-class</a></code>, +<code><a href="summarize.html">agg</a></code>, <code><a href="alias.html">alias</a></code>, +<code><a href="arrange.html">arrange</a></code>, <code><a href="as.data.frame.html">as.data.frame</a></code>, +<code><a href="attach.html">attach,SparkDataFrame-method</a></code>, +<code><a href="broadcast.html">broadcast</a></code>, <code><a href="cache.html">cache</a></code>, +<code><a href="checkpoint.html">checkpoint</a></code>, <code><a href="coalesce.html">coalesce</a></code>, +<code><a href="collect.html">collect</a></code>, <code><a href="columns.html">colnames</a></code>, +<code><a href="coltypes.html">coltypes</a></code>, +<code><a href="createOrReplaceTempView.html">createOrReplaceTempView</a></code>, +<code><a href="crossJoin.html">crossJoin</a></code>, <code><a href="cube.html">cube</a></code>, +<code><a href="dapplyCollect.html">dapplyCollect</a></code>, <code><a href="dapply.html">dapply</a></code>, +<code><a href="describe.html">describe</a></code>, <code><a href="distinct.html">distinct</a></code>, +<code><a href="dropDuplicates.html">dropDuplicates</a></code>, <code><a href="nafunctions.html">dropna</a></code>, +<code><a href="drop.html">drop</a></code>, <code><a href="dtypes.html">dtypes</a></code>, +<code><a href="exceptAll.html">exceptAll</a></code>, <code><a href="except.html">except</a></code>, +<code><a href="explain.html">explain</a></code>, <code><a href="filter.html">filter</a></code>, +<code><a 
href="first.html">first</a></code>, <code><a href="gapplyCollect.html">gapplyCollect</a></code>, +<code><a href="gapply.html">gapply</a></code>, <code><a href="getNumPartitions.html">getNumPartitions</a></code>, +<code><a href="groupBy.html">group_by</a></code>, <code><a href="head.html">head</a></code>, +<code><a href="hint.html">hint</a></code>, <code><a href="histogram.html">histogram</a></code>, +<code><a href="insertInto.html">insertInto</a></code>, <code><a href="intersectAll.html">intersectAll</a></code>, +<code><a href="intersect.html">intersect</a></code>, <code><a href="isLocal.html">isLocal</a></code>, +<code><a href="isStreaming.html">isStreaming</a></code>, <code><a href="join.html">join</a></code>, +<code><a href="limit.html">limit</a></code>, <code><a href="localCheckpoint.html">localCheckpoint</a></code>, +<code><a href="merge.html">merge</a></code>, <code><a href="mutate.html">mutate</a></code>, +<code><a href="ncol.html">ncol</a></code>, <code><a href="nrow.html">nrow</a></code>, +<code><a href="persist.html">persist</a></code>, <code><a href="printSchema.html">printSchema</a></code>, +<code><a href="randomSplit.html">randomSplit</a></code>, <code><a href="rbind.html">rbind</a></code>, +<code><a href="rename.html">rename</a></code>, <code><a href="repartitionByRange.html">repartitionByRange</a></code>, +<code><a href="repartition.html">repartition</a></code>, <code><a href="rollup.html">rollup</a></code>, +<code><a href="sample.html">sample</a></code>, <code><a href="saveAsTable.html">saveAsTable</a></code>, +<code><a href="schema.html">schema</a></code>, <code><a href="selectExpr.html">selectExpr</a></code>, +<code><a href="select.html">select</a></code>, <code><a href="showDF.html">showDF</a></code>, +<code><a href="show.html">show</a></code>, <code><a href="storageLevel.html">storageLevel</a></code>, +<code><a href="str.html">str</a></code>, <code><a href="subset.html">subset</a></code>, +<code><a href="summary.html">summary</a></code>, 
<code><a href="take.html">take</a></code>, +<code><a href="toJSON.html">toJSON</a></code>, <code><a href="unionByName.html">unionByName</a></code>, +<code><a href="union.html">union</a></code>, <code><a href="unpersist.html">unpersist</a></code>, +<code><a href="withColumn.html">withColumn</a></code>, <code><a href="withWatermark.html">withWatermark</a></code>, +<code><a href="with.html">with</a></code>, <code><a href="write.df.html">write.df</a></code>, +<code><a href="write.jdbc.html">write.jdbc</a></code>, <code><a href="write.json.html">write.json</a></code>, +<code><a href="write.orc.html">write.orc</a></code>, <code><a href="write.parquet.html">write.parquet</a></code>, +<code><a href="write.stream.html">write.stream</a></code>, <code><a href="write.text.html">write.text</a></code> +</p> + + +<h3>Examples</h3> + +<pre><code class="r">## Not run: +##D sparkR.session() +##D path <- "path/to/file.json" +##D df <- read.json(path) +##D dim(df) +## End(Not run) +</code></pre> + + +<hr /><div style="text-align: center;">[Package <em>SparkR</em> version 2.4.0 <a href="00Index.html">Index</a>]</div> +</body></html> --------------------------------------------------------------------- To unsubscribe, e-mail: commits-unsubscr...@spark.apache.org For additional commands, e-mail: commits-h...@spark.apache.org