Skip to content

Commit e0d6daa

Browse files
author
Peng
committed
merge master
2 parents ffe79b8 + 25b4f41 commit e0d6daa

File tree

166 files changed

+2295
-942
lines changed

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

166 files changed

+2295
-942
lines changed

R/pkg/NAMESPACE

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -84,6 +84,7 @@ exportClasses("SparkDataFrame")
8484
exportMethods("arrange",
8585
"as.data.frame",
8686
"attach",
87+
"broadcast",
8788
"cache",
8889
"checkpoint",
8990
"coalesce",

R/pkg/R/DataFrame.R

Lines changed: 29 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -3769,3 +3769,32 @@ setMethod("alias",
37693769
sdf <- callJMethod(object@sdf, "alias", data)
37703770
dataFrame(sdf)
37713771
})
3772+
3773+
#' broadcast
3774+
#'
3775+
#' Return a new SparkDataFrame marked as small enough for use in broadcast joins.
3776+
#'
3777+
#' Equivalent to \code{hint(x, "broadcast")}.
3778+
#'
3779+
#' @param x a SparkDataFrame.
3780+
#' @return a SparkDataFrame.
3781+
#'
3782+
#' @aliases broadcast,SparkDataFrame-method
3783+
#' @family SparkDataFrame functions
3784+
#' @rdname broadcast
3785+
#' @name broadcast
3786+
#' @export
3787+
#' @examples
3788+
#' \dontrun{
3789+
#' df <- createDataFrame(mtcars)
3790+
#' avg_mpg <- mean(groupBy(createDataFrame(mtcars), "cyl"), "mpg")
3791+
#'
3792+
#' head(join(df, broadcast(avg_mpg), df$cyl == avg_mpg$cyl))
3793+
#' }
3794+
#' @note broadcast since 2.3.0
3795+
setMethod("broadcast",
3796+
signature(x = "SparkDataFrame"),
3797+
function(x) {
3798+
# Hand the `sdf` slot of `x` to callJStatic, naming the class
# "org.apache.spark.sql.functions" and its "broadcast" method.
# NOTE(review): callJStatic is defined outside this view; presumably it
# invokes that static JVM method and returns a reference to the result.
sdf <- callJStatic("org.apache.spark.sql.functions", "broadcast", x@sdf)
3799+
# Wrap the result with dataFrame(); as the last expression, this is the
# value the method returns.
dataFrame(sdf)
3800+
})

R/pkg/R/context.R

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -258,15 +258,15 @@ includePackage <- function(sc, pkg) {
258258
#'
259259
#' # Large Matrix object that we want to broadcast
260260
#' randomMat <- matrix(nrow=100, ncol=10, data=rnorm(1000))
261-
#' randomMatBr <- broadcast(sc, randomMat)
261+
#' randomMatBr <- broadcastRDD(sc, randomMat)
262262
#'
263263
#' # Use the broadcast variable inside the function
264264
#' useBroadcast <- function(x) {
265265
#' sum(value(randomMatBr) * x)
266266
#' }
267267
#' sumRDD <- lapply(rdd, useBroadcast)
268268
#'}
269-
broadcast <- function(sc, object) {
269+
broadcastRDD <- function(sc, object) {
270270
objName <- as.character(substitute(object))
271271
serializedObj <- serialize(object, connection = NULL)
272272

0 commit comments

Comments
 (0)