Skip to content
Closed
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
1144 commits
Select commit Hold shift + click to select a range
be9dd15
[SPARK-11818][REPL] Fix ExecutorClassLoader to lookup resources from …
HeartSaVioR Nov 24, 2015
e5aaae6
[SPARK-11942][SQL] fix encoder life cycle for CoGroup
cloud-fan Nov 24, 2015
56a0aba
[SPARK-11952][ML] Remove duplicate ml examples
yanboliang Nov 24, 2015
9e24ba6
[SPARK-11521][ML][DOC] Document that Logistic, Linear Regression summ…
jkbradley Nov 24, 2015
52bc25c
[SPARK-11847][ML] Model export/import for spark.ml: LDA
hhbyyh Nov 24, 2015
19530da
[SPARK-11926][SQL] unify GetStructField and GetInternalRowField
cloud-fan Nov 24, 2015
8101254
[SPARK-11872] Prevent the call to SparkContext#stop() in the listener…
tedyu Nov 24, 2015
f315272
[SPARK-11946][SQL] Audit pivot API for 1.6.
rxin Nov 24, 2015
e6dd237
[SPARK-11929][CORE] Make the repl log4j configuration override the ro…
Nov 24, 2015
58d9b26
[SPARK-11805] free the array in UnsafeExternalSorter during spilling
Nov 24, 2015
34ca392
Added a line of comment to explain why the extra sort exists in pivot.
rxin Nov 24, 2015
c7f95df
[SPARK-11783][SQL] Fixes execution Hive client when using remote Hive…
liancheng Nov 24, 2015
238ae51
[SPARK-11914][SQL] Support coalesce and repartition in Dataset APIs
gatorsmile Nov 24, 2015
25bbd3c
[SPARK-11967][SQL] Consistent use of varargs for multiple paths in Da…
rxin Nov 25, 2015
4d6bbbc
[SPARK-11947][SQL] Mark deprecated methods with "This will be removed…
rxin Nov 25, 2015
a5d9887
[STREAMING][FLAKY-TEST] Catch execution context race condition in `Fi…
brkyvz Nov 25, 2015
151d7c2
[SPARK-10621][SQL] Consistent naming for functions in SQL, Python, Scala
rxin Nov 25, 2015
2169886
[SPARK-11979][STREAMING] Empty TrackStateRDD cannot be checkpointed a…
tdas Nov 25, 2015
2610e06
[SPARK-11970][SQL] Adding JoinType into JoinWith and support Sample i…
gatorsmile Nov 25, 2015
a0f1a11
[SPARK-11981][SQL] Move implementations of methods back to DataFrame …
rxin Nov 25, 2015
6385002
[SPARK-11686][CORE] Issue WARN when dynamic allocation is disabled du…
Nov 25, 2015
b9b6fbe
[SPARK-11860][PYSAPRK][DOCUMENTATION] Invalid argument specification …
zjffdu Nov 25, 2015
0a5aef7
[SPARK-10666][SPARK-6880][CORE] Use properties from ActiveJob associa…
markhamstra Nov 25, 2015
c1f85fc
[SPARK-11956][CORE] Fix a few bugs in network lib-based file transfer.
Nov 25, 2015
faabdfa
[SPARK-11984][SQL][PYTHON] Fix typos in doc for pivot for scala and p…
felixcheung Nov 25, 2015
6b78157
[SPARK-11974][CORE] Not all the temp dirs had been deleted when the J…
pzzs Nov 25, 2015
dc1d324
[SPARK-11969] [SQL] [PYSPARK] visualization of SQL query for pyspark
Nov 25, 2015
0dee44a
[MINOR] Remove unnecessary spaces in `include_example.rb`
yu-iskw Nov 25, 2015
67b6732
[DOCUMENTATION] Fix minor doc error
zjffdu Nov 25, 2015
83653ac
[SPARK-10864][WEB UI] app name is hidden if window is resized
ajbozarth Nov 25, 2015
9f3e59a
[SPARK-11880][WINDOWS][SPARK SUBMIT] bin/load-spark-env.cmd loads spa…
wangt Nov 25, 2015
88875d9
[SPARK-10558][CORE] Fix wrong executor state in Master
jerryshao Nov 25, 2015
d29e2ef
[SPARK-11935][PYSPARK] Send the Python exceptions in TransformFunctio…
zsxwing Nov 25, 2015
4e81783
[SPARK-11866][NETWORK][CORE] Make sure timed out RPCs are cleaned up.
Nov 25, 2015
ecac283
Fix Aggregator documentation (rename present to finish).
rxin Nov 25, 2015
21e5606
[SPARK-11983][SQL] remove all unused codegen fallback trait
adrian-wang Nov 25, 2015
cc243a0
[SPARK-11206] Support SQL UI on the history server
carsonwang Nov 25, 2015
d1930ec
[SPARK-12003] [SQL] remove the prefix for name after expanded star
Nov 26, 2015
068b643
[SPARK-11980][SPARK-10621][SQL] Fix json_tuple and add test cases for
gatorsmile Nov 26, 2015
d3ef693
[SPARK-11999][CORE] Fix the issue that ThreadUtils.newDaemonCachedThr…
zsxwing Nov 26, 2015
27d69a0
[SPARK-11973] [SQL] push filter through aggregation with alias and li…
Nov 26, 2015
001f052
[SPARK-12005][SQL] Work around VerifyError in HyperLogLogPlusPlus.
Nov 26, 2015
bc16a67
[SPARK-11863][SQL] Unable to resolve order by if it contains mixture …
dilipbiswal Nov 26, 2015
ad76562
[SPARK-11998][SQL][TEST-HADOOP2.0] When downloading Hadoop artifacts …
yhuai Nov 27, 2015
de28e4d
[SPARK-11973][SQL] Improve optimizer code readability.
rxin Nov 27, 2015
4376b5b
doc typo: "classificaion" -> "classification"
muxator Nov 27, 2015
0c1e72e
[SPARK-11996][CORE] Make the executor thread dump work again
zsxwing Nov 27, 2015
6f6bb0e
[SPARK-12011][SQL] Stddev/Variance etc should support columnName as a…
yanboliang Nov 27, 2015
b63938a
[SPARK-11881][SQL] Fix for postgresql fetchsize > 0
mariusvniekerk Nov 27, 2015
d822088
[SPARK-11917][PYSPARK] Add SQLContext#dropTempTable to PySpark
zjffdu Nov 27, 2015
4d4cbc0
[SPARK-11778][SQL] add regression test
Nov 27, 2015
5eaed4e
[SPARK-11991] fixes
Nov 27, 2015
10e315c
Fix style violation for b63938a8b04
rxin Nov 27, 2015
a374e20
[SPARK-11997] [SQL] NPE when save a DataFrame as parquet and partitio…
dilipbiswal Nov 27, 2015
ba02f6c
[SPARK-12025][SPARKR] Rename some window rank function names for SparkR
yanboliang Nov 27, 2015
f57e6c9
[SPARK-12021][STREAMING][TESTS] Fix the potential dead-lock in Stream…
zsxwing Nov 27, 2015
b992152
[SPARK-12020][TESTS][TEST-HADOOP2.0] PR builder cannot trigger hadoop…
yhuai Nov 27, 2015
149cd69
[SPARK-12028] [SQL] get_json_object returns an incorrect result when …
gatorsmile Nov 28, 2015
28e46ab
[SPARK-12029][SPARKR] Improve column functions signature, param check…
felixcheung Nov 29, 2015
c793d2d
[SPARK-9319][SPARKR] Add support for setting column names, types
felixcheung Nov 29, 2015
cc7a1bc
[SPARK-11781][SPARKR] SparkR has problem in inferring type of raw type.
Nov 29, 2015
3d28081
[SPARK-12024][SQL] More efficient multi-column counting.
hvanhovell Nov 29, 2015
0ddfe78
[SPARK-12039] [SQL] Ignore HiveSparkSubmitSuite's "SPARK-9757 Persist…
yhuai Nov 30, 2015
e074944
[SPARK-11859][MESOS] SparkContext accepts invalid Master URLs in the …
toddwan Nov 30, 2015
953e8e6
[MINOR][BUILD] Changed the comment to reflect the plugin project is t…
ScrapCodes Nov 30, 2015
26c3581
[DOC] Explicitly state that top maintains the order of elements
mineo Nov 30, 2015
bf0e85a
[SPARK-12023][BUILD] Fix warnings while packaging spark with maven.
ScrapCodes Nov 30, 2015
2db4662
[SPARK-11989][SQL] Only use commit in JDBC data source if the underly…
CK50 Nov 30, 2015
17275fa
[SPARK-11700] [SQL] Remove thread local SQLContext in SparkPlan
Nov 30, 2015
8df584b
[SPARK-11982] [SQL] improve performance of cartesian product
Nov 30, 2015
f2fbfa4
[MINOR][DOCS] fixed list display in ml-ensembles
BenFradet Nov 30, 2015
2c5dee0
Revert "[SPARK-11206] Support SQL UI on the history server"
JoshRosen Nov 30, 2015
a8ceec5
[SPARK-12053][CORE] EventLoggingListener.getLogPath needs 4 parameters
chutium Nov 30, 2015
e232720
[SPARK-11689][ML] Add user guide and example code for LDA under spark.ml
hhbyyh Nov 30, 2015
de64b65
[SPARK-11975][ML] Remove duplicate mllib example (DT/RF/GBT in Java/P…
yanboliang Nov 30, 2015
5535888
[SPARK-11960][MLLIB][DOC] User guide for streaming tests
feynmanliang Nov 30, 2015
ecc00ec
fix Maven build
davies Nov 30, 2015
edb26e7
[SPARK-12058][HOTFIX] Disable KinesisStreamTests
zsxwing Dec 1, 2015
d3ca8cf
[SPARK-12000] Fix API doc generation issues
JoshRosen Dec 1, 2015
e6dc89a
[SPARK-12035] Add more debug information in include_example tag of Je…
yinxusen Dec 1, 2015
0a46e43
[SPARK-12037][CORE] initialize heartbeatReceiverRef before calling st…
CodingCat Dec 1, 2015
9bf2120
[SPARK-12007][NETWORK] Avoid copies in the network lib's RPC layer.
Dec 1, 2015
96bf468
[SPARK-12049][CORE] User JVM shutdown hook can cause deadlock at shut…
srowen Dec 1, 2015
f73379b
[HOTFIX][SPARK-12000] Add missing quotes in Jekyll API docs plugin.
JoshRosen Dec 1, 2015
9693b0d
[SPARK-12018][SQL] Refactor common subexpression elimination code
viirya Dec 1, 2015
a0af0e3
[SPARK-11898][MLLIB] Use broadcast for the global tables in Word2Vec
hhbyyh Dec 1, 2015
c87531b
[SPARK-11949][SQL] Set field nullable property for GroupingSets to ge…
viirya Dec 1, 2015
1401166
[SPARK-12060][CORE] Avoid memory copy in JavaSerializerInstance.seria…
zsxwing Dec 1, 2015
69dbe6b
[SPARK-12046][DOC] Fixes various ScalaDoc/JavaDoc issues
liancheng Dec 1, 2015
8ddc55f
[SPARK-12068][SQL] use a single column in Dataset.groupBy and count w…
cloud-fan Dec 1, 2015
9df2462
[SPARK-11856][SQL] add type cast if the real type is different but co…
cloud-fan Dec 1, 2015
fd95eea
[SPARK-11954][SQL] Encoder for JavaBeans
cloud-fan Dec 1, 2015
0a7bca2
[SPARK-11905][SQL] Support Persist/Cache and Unpersist in Dataset APIs
gatorsmile Dec 1, 2015
6a8cf80
[SPARK-11821] Propagate Kerberos keytab for all environments
woj-i Dec 1, 2015
34e7093
[SPARK-12065] Upgrade Tachyon from 0.8.1 to 0.8.2
JoshRosen Dec 1, 2015
2cef1cd
[SPARK-12030] Fix Platform.copyMemory to handle overlapping regions.
nongli Dec 1, 2015
60b541e
[SPARK-12004] Preserve the RDD partitioner through RDD checkpointing
tdas Dec 1, 2015
328b757
Revert "[SPARK-12060][CORE] Avoid memory copy in JavaSerializerInstan…
zsxwing Dec 1, 2015
e76431f
[SPARK-11961][DOC] Add docs of ChiSqSelector
yinxusen Dec 1, 2015
f292018
[SPARK-12002][STREAMING][PYSPARK] Fix python direct stream checkpoint…
jerryshao Dec 1, 2015
ef6790f
[SPARK-12075][SQL] Speed up HiveComparisionTest by avoiding / speedin…
JoshRosen Dec 1, 2015
47a0abc
[SPARK-11328][SQL] Improve error message when hitting this issue
nongli Dec 1, 2015
5a8b5fd
[SPARK-11788][SQL] surround timestamp/date value with quotes in JDBC …
Dec 1, 2015
5872a9d
[SPARK-11352][SQL] Escape */ in the generated comments.
yhuai Dec 2, 2015
e96a70d
[SPARK-11596][SQL] In TreeNode's argString, if a TreeNode is not a ch…
yhuai Dec 2, 2015
1ce4adf
[SPARK-8414] Ensure context cleaner periodic cleanups
Dec 2, 2015
d96f8c9
[SPARK-12081] Make unified memory manager work with small heaps
Dec 2, 2015
96691fe
[SPARK-12077][SQL] change the default plan for single distinct
Dec 2, 2015
8a75a30
[SPARK-12087][STREAMING] Create new JobConf for every batch in saveAs…
tdas Dec 2, 2015
0f37d1d
[SPARK-11949][SQL] Check bitmasks to set nullable property
viirya Dec 2, 2015
4375eb3
[SPARK-12090] [PYSPARK] consider shuffle in coalesce()
Dec 2, 2015
128c290
[SPARK-3580][CORE] Add Consistent Method To Get Number of RDD Partiti…
Dec 2, 2015
a1542ce
[SPARK-12094][SQL] Prettier tree string for TreeNode
liancheng Dec 2, 2015
452690b
[SPARK-12001] Allow partially-stopped StreamingContext to be complete…
JoshRosen Dec 2, 2015
de07d06
[SPARK-10266][DOCUMENTATION, ML] Fixed @Since annotation for ml.tunning
yu-iskw Dec 2, 2015
d0d7ec5
[SPARK-12093][SQL] Fix the error of comment in DDLParser
watermen Dec 3, 2015
9bb695b
[SPARK-12000] do not specify arg types when reference a method in Sca…
mengxr Dec 3, 2015
ae40253
[SPARK-12082][FLAKY-TEST] Increase timeouts in NettyBlockTransferSecu…
JoshRosen Dec 3, 2015
ec2b6c2
[SPARK-12109][SQL] Expressions's simpleString should delegate to its …
yhuai Dec 3, 2015
5349851
[SPARK-12088][SQL] check connection.isClosed before calling connection…
Dec 3, 2015
7470d9e
[DOCUMENTATION][MLLIB] typo in mllib doc
zjffdu Dec 3, 2015
95b3cf1
[DOCUMENTATION][KAFKA] fix typo in kafka/OffsetRange.scala
microwishing Dec 3, 2015
43c575c
[SPARK-12116][SPARKR][DOCS] document how to workaround function name …
felixcheung Dec 3, 2015
8fa3e47
[SPARK-11314][YARN] add service API and test service for Yarn Cluster…
steveloughran Dec 3, 2015
7bc9e1d
[SPARK-12059][CORE] Avoid assertion error when unexpected state trans…
jerryshao Dec 3, 2015
649be4f
[SPARK-12101][CORE] Fix thread pools that cannot cache tasks in Worke…
zsxwing Dec 3, 2015
688e521
[SPARK-12108] Make event logs smaller
Dec 3, 2015
d576e76
[MINOR][ML] Use coefficients replace weights
yanboliang Dec 3, 2015
ad7cea6
[SPARK-12107][EC2] Update spark-ec2 versions
nchammas Dec 3, 2015
a02d472
[FLAKY-TEST-FIX][STREAMING][TEST] Make sure StreamingContexts are shu…
tdas Dec 3, 2015
2213441
[SPARK-12019][SPARKR] Support character vector for sparkR.init(), che…
felixcheung Dec 3, 2015
f434f36
[SPARK-12056][CORE] Create a TaskAttemptContext only after calling se…
Dec 4, 2015
b6e9963
[SPARK-11206] Support SQL UI on the history server (resubmit)
carsonwang Dec 4, 2015
5011f26
[SPARK-12104][SPARKR] collect() does not handle multiple columns with…
Dec 4, 2015
4106d80
[SPARK-12122][STREAMING] Prevent batches from being submitted twice a…
tdas Dec 4, 2015
17e4e02
Add links howto to setup IDEs for developing spark
kaklakariada Dec 4, 2015
95296d9
[SPARK-12089] [SQL] Fix memory corrupt due to freeing a page being re…
Dec 4, 2015
d0d8222
[SPARK-6990][BUILD] Add Java linting script; fix minor warnings
dskrvk Dec 4, 2015
302d68d
[SPARK-12058][STREAMING][KINESIS][TESTS] fix Kinesis python tests
brkyvz Dec 4, 2015
d64806b
[SPARK-11314][BUILD][HOTFIX] Add exclusion for moved YARN classes.
Dec 4, 2015
b7204e1
[SPARK-12112][BUILD] Upgrade to SBT 0.13.9
JoshRosen Dec 5, 2015
bbfc16e
[SPARK-12142][CORE]Reply false when container allocator is not ready …
XuTingjun Dec 5, 2015
f30373f
[SPARK-12080][CORE] Kryo - Support multiple user registrators
Dec 5, 2015
3af53e6
[SPARK-12084][CORE] Fix codes that uses ByteBuffer.array incorrectly
zsxwing Dec 5, 2015
ee94b70
[SPARK-12096][MLLIB] remove the old constraint in word2vec
hhbyyh Dec 5, 2015
e9c9ae2
[SPARK-11994][MLLIB] Word2VecModel load and save cause SparkException…
tmnd1991 Dec 5, 2015
7da6748
[SPARK-11988][ML][MLLIB] Update JPMML to 1.2.7
srowen Dec 5, 2015
c8d0e16
[SPARK-11774][SPARKR] Implement struct(), encode(), decode() function…
Dec 5, 2015
895b6c4
[SPARK-11715][SPARKR] Add R support corr for Column Aggregration
felixcheung Dec 6, 2015
6979edf
[SPARK-12115][SPARKR] Change numPartitions() to getNumPartitions() to…
yanboliang Dec 6, 2015
b6e8e63
[SPARK-12044][SPARKR] Fix usage of isnan, isNaN
yanboliang Dec 6, 2015
04b6799
[SPARK-12048][SQL] Prevent to close JDBC resources twice
Dec 6, 2015
49efd03
[SPARK-12138][SQL] Escape \u in the generated comments of codegen
gatorsmile Dec 6, 2015
80a824d
[SPARK-12152][PROJECT-INFRA] Speed up Scalastyle checks by only invok…
JoshRosen Dec 7, 2015
6fd9e70
[SPARK-12106][STREAMING][FLAKY-TEST] BatchedWAL test transiently flak…
brkyvz Dec 7, 2015
9cde7d5
[SPARK-12032] [SQL] Re-order inner joins to do join with conditions f…
Dec 7, 2015
39d677c
[SPARK-12034][SPARKR] Eliminate warnings in SparkR test cases.
Dec 7, 2015
ef3f047
[SPARK-12132] [PYSPARK] raise KeyboardInterrupt inside SIGINT handler
Dec 7, 2015
5d80d8c
[SPARK-11932][STREAMING] Partition previous TrackStateRDD if partitio…
tdas Dec 7, 2015
3f4efb5
[SPARK-12060][CORE] Avoid memory copy in JavaSerializerInstance.seria…
zsxwing Dec 7, 2015
871e85d
[SPARK-11963][DOC] Add docs for QuantileDiscretizer
yinxusen Dec 7, 2015
84b8094
[SPARK-11884] Drop multiple columns in the DataFrame API
tedyu Dec 7, 2015
36282f7
[SPARK-12184][PYTHON] Make python api doc for pivot consistant with s…
aray Dec 7, 2015
3e7e05f
[SPARK-12160][MLLIB] Use SQLContext.getOrCreate in MLlib
jkbradley Dec 8, 2015
78209b0
[SPARK-11551][DOC][EXAMPLE] Replace example code in ml-features.md us…
somideshmukh Dec 8, 2015
7389658
Closes #10098
mengxr Dec 8, 2015
7d05a62
[SPARK-10259][ML] Add @since annotation to ml.classification
Dec 8, 2015
4a39b5a
[SPARK-11958][SPARK-11957][ML][DOC] SQLTransformer user guide and exa…
yanboliang Dec 8, 2015
48a9804
[SPARK-12103][STREAMING][KAFKA][DOC] document that K means Key and V …
koeninger Dec 8, 2015
7081291
[SPARK-12166][TEST] Unset hadoop related environment in testing
zjffdu Dec 8, 2015
037b7e7
[SPARK-11439][ML] Optimization of creating sparse feature without den…
Dec 8, 2015
da2012a
[SPARK-11551][DOC][EXAMPLE] Revert PR #10002
liancheng Dec 8, 2015
e3735ce
[SPARK-11652][CORE] Remote code execution with InvokerTransformer
srowen Dec 8, 2015
6cb06e8
[SPARK-11155][WEB UI] Stage summary json should include stage duration
keypointt Dec 8, 2015
75c60bf
[SPARK-12074] Avoid memory copy involving ByteBuffer.wrap(ByteArrayOu…
tedyu Dec 8, 2015
381f17b
[SPARK-12201][SQL] add type coercion rule for greatest/least
cloud-fan Dec 8, 2015
c0b13d5
[SPARK-12195][SQL] Adding BigDecimal, Date and Timestamp into Encoder
gatorsmile Dec 8, 2015
5d96a71
[SPARK-12188][SQL] Code refactoring and comment correction in Dataset…
gatorsmile Dec 8, 2015
872a2ee
[SPARK-10393] use ML pipeline in LDA example
hhbyyh Dec 8, 2015
4bcb894
[SPARK-12205][SQL] Pivot fails Analysis when aggregate is UnresolvedF…
aray Dec 8, 2015
5cb4695
[SPARK-11605][MLLIB] ML 1.6 QA: API: Java compatibility, docs
hhbyyh Dec 8, 2015
06746b3
[SPARK-12159][ML] Add user guide section for IndexToString transformer
BenFradet Dec 8, 2015
2ff17bc
[SPARK-3873][BUILD] Add style checker to enforce import ordering.
Dec 8, 2015
9494521
[SPARK-12187] *MemoryPool classes should not be fully public
Dec 8, 2015
3959489
[SPARK-12069][SQL] Update documentation with Datasets
marmbrus Dec 8, 2015
765c67f
[SPARK-8517][ML][DOC] Reorganizes the spark.ml user guide
thunterdb Dec 9, 2015
a0046e3
[SPARK-11343][ML] Documentation of float and double prediction/label …
dahlem Dec 9, 2015
3934562
[SPARK-12222] [CORE] Deserialize RoaringBitmap using Kryo serializer …
scwf Dec 9, 2015
f6883bb
[SPARK-11676][SQL] Parquet filter tests all pass if filters are not r…
HyukjinKwon Dec 9, 2015
a113216
[SPARK-12031][CORE][BUG] Integer overflow when do sampling
uncleGen Dec 9, 2015
6e1c55e
[SPARK-12012][SQL] Show more comprehensive PhysicalRDD metadata when …
liancheng Dec 9, 2015
22b9a87
[SPARK-10299][ML] word2vec should allow users to specify the window size
holdenk Dec 9, 2015
6900f01
[SPARK-10582][YARN][CORE] Fix AM failure situation for dynamic alloca…
jerryshao Dec 9, 2015
442a771
[SPARK-12241][YARN] Improve failure reporting in Yarn client obtainTo…
steveloughran Dec 9, 2015
aec5ea0
[SPARK-12165][SPARK-12189] Fix bugs in eviction of storage memory by …
JoshRosen Dec 9, 2015
1eb7c22
[SPARK-11824][WEBUI] WebUI does not render descriptions with 'bad' HT…
srowen Dec 9, 2015
051c6a0
[SPARK-11551][DOC] Replace example code in ml-features.md using inclu…
yinxusen Dec 9, 2015
7a8e587
[SPARK-12211][DOC][GRAPHX] Fix version number in graphx doc for migra…
aray Dec 10, 2015
8770bd1
[SPARK-12165][ADDENDUM] Fix outdated comments on unroll test
Dec 10, 2015
ac8cdf1
[SPARK-11678][SQL][DOCS] Document basePath in the programming guide.
yhuai Dec 10, 2015
2166c2a
[SPARK-11796] Fix httpclient and httpcore depedency issues related to…
Dec 10, 2015
bd2cd4f
[SPARK-12244][SPARK-12245][STREAMING] Rename trackStateByKey to mapWi…
tdas Dec 10, 2015
d8ec081
[SPARK-12252][SPARK-12131][SQL] refactor MapObjects to make it less h…
cloud-fan Dec 10, 2015
e29704f
[SPARK-12136][STREAMING] rddToFileName does not properly handle prefi…
Dec 10, 2015
21b3d2a
[SPARK-11530][MLLIB] Return eigenvalues with PCA model
srowen Dec 10, 2015
76540b6
[SPARK-12242][SQL] Add DataFrame.transform method
rxin Dec 10, 2015
db51652
[SPARK-11832][CORE] Process arguments in spark-shell for Scala 2.11
jodersky Dec 10, 2015
eeb5872
[SPARK-12198][SPARKR] SparkR support read.parquet and deprecate parqu…
yanboliang Dec 10, 2015
9fba9c8
[SPARK-11602][MLLIB] Refine visibility for 1.6 scala API audit
hhbyyh Dec 10, 2015
d9d354e
[SPARK-12234][SPARKR] Fix ```subset``` function error when only set `…
yanboliang Dec 10, 2015
bc5f56a
[SPARK-12250][SQL] Allow users to define a UDAF without providing det…
yhuai Dec 10, 2015
ec5f9ed
[SPARK-12228][SQL] Try to run execution hive's derby in memory.
yhuai Dec 10, 2015
2ecbe02
[SPARK-12212][ML][DOC] Clarifies the difference between spark.ml, spa…
thunterdb Dec 10, 2015
4a46b88
[SPARK-11563][CORE][REPL] Use RpcEnv to transfer REPL-generated classes.
Dec 10, 2015
6a6c1fc
[SPARK-11713] [PYSPARK] [STREAMING] Initial RDD updateStateByKey for …
BryanCutler Dec 10, 2015
23a9e62
[SPARK-12251] Document and improve off-heap memory configurations
JoshRosen Dec 10, 2015
5030923
[SPARK-12155][SPARK-12253] Fix executor OOM in unified memory management
Dec 10, 2015
24d3357
[STREAMING][DOC][MINOR] Update the description of direct Kafka stream…
jerryshao Dec 10, 2015
b1b4ee7
[SPARK-12258][SQL] passing null into ScalaUDF
Dec 11, 2015
518ab51
[SPARK-10991][ML] logistic regression training summary handle empty p…
holdenk Dec 11, 2015
c119a34
[SPARK-12258] [SQL] passing null into ScalaUDF (follow-up)
Dec 11, 2015
0fb9825
[SPARK-12146][SPARKR] SparkR jsonFile should support multiple input f…
yanboliang Dec 11, 2015
aa305dc
[SPARK-11964][DOCS][ML] Add in Pipeline Import/Export Documentation
bllchmbrs Dec 11, 2015
713e695
[SPARK-12273][STREAMING] Make Spark Streaming web UI list Receivers i…
lw-lin Dec 11, 2015
1b82203
[SPARK-11497][MLLIB][PYTHON] PySpark RowMatrix Constructor Has Type E…
dusenberrymw Dec 11, 2015
aea676c
[SPARK-12217][ML] Document invalid handling for StringIndexer
BenFradet Dec 11, 2015
a0ff6d1
[SPARK-11978][ML] Move dataset_example.py to examples/ml and rename t…
yanboliang Dec 12, 2015
1e799d6
[SPARK-12298][SQL] Fix infinite loop in DataFrame.sortWithinPartitions
ankurdave Dec 12, 2015
1e3526c
[SPARK-12158][SPARKR][SQL] Fix 'sample' functions that break R unit t…
gatorsmile Dec 12, 2015
03138b6
[SPARK-11193] Use Java ConcurrentHashMap instead of SynchronizedMap t…
jbonofre Dec 12, 2015
98b212d
[SPARK-12199][DOC] Follow-up: Refine example code in ml-features.md
yinxusen Dec 13, 2015
8af2f8c
[SPARK-12267][CORE] Store the remote RpcEnv address to send the corre…
zsxwing Dec 13, 2015
2aecda2
[SPARK-12281][CORE] Fix a race condition when reporting ExecutorState…
zsxwing Dec 14, 2015
834e714
[SPARK-12213][SQL] use multiple partitions for single distinct query
Dec 14, 2015
ed87f6d
[SPARK-12275][SQL] No plan for BroadcastHint in some condition
Dec 14, 2015
e25f1fe
[MINOR][DOC] Fix broken word2vec link
BenFradet Dec 14, 2015
b51a4cd
[SPARK-12016] [MLLIB] [PYSPARK] Wrap Word2VecModel when loading it in…
viirya Dec 14, 2015
fb3778d
[SPARK-12327] Disable commented code lintr temporarily
shivaram Dec 15, 2015
9ea1a8e
[SPARK-12274][SQL] WrapOption should not have type constraint for child
cloud-fan Dec 15, 2015
d13ff82
[SPARK-12188][SQL][FOLLOW-UP] Code refactoring and comment correction…
gatorsmile Dec 15, 2015
606f99b
[SPARK-12288] [SQL] Support UnsafeRow in Coalesce/Except/Intersect.
gatorsmile Dec 15, 2015
c59df8c
[SPARK-12332][TRIVIAL][TEST] Fix minor typo in ResetSystemProperties
holdenk Dec 15, 2015
bc1ff9f
[STREAMING][MINOR] Fix typo in function name of StateImpl
jerryshao Dec 15, 2015
6edd12b
[SPARK-10618] [Mesos] Adressing comments on PR.
SleepyThread Dec 15, 2015
14af20d
[SPARK-10618] [Mesos] Refactoring coarsed-grained scheduling conditio…
SleepyThread Sep 15, 2015
ecddfe6
[SPARK-10618] [Mesos] Killing space and removing duplication, also ha…
SleepyThread Sep 16, 2015
6a9d86a
[SPARK-10514] [CORE] [Mesos] Refactoring fine-grained scheduling cond…
SleepyThread Sep 17, 2015
538e089
[SPARK-10618] [Mesos] Adressing comments on PR.
SleepyThread Dec 15, 2015
6463452
Rebasing current master to local PR branch.
SleepyThread Dec 16, 2015
645cbdd
[SPARK-10618] [Mesos] removing meetconstraints check as it is already…
SleepyThread Dec 16, 2015
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
The table of contents is too big for display.
Diff view
Diff view
  •  
  •  
  •  
5 changes: 5 additions & 0 deletions .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -50,6 +50,7 @@ spark-tests.log
streaming-tests.log
dependency-reduced-pom.xml
.ensime
.ensime_cache/
.ensime_lucene
checkpoint
derby.log
Expand All @@ -74,3 +75,7 @@ metastore/
warehouse/
TempStatsStore/
sql/hive-thriftserver/test_warehouses

# For R session data
.RHistory
.RData
13 changes: 1 addition & 12 deletions .rat-excludes
Original file line number Diff line number Diff line change
Expand Up @@ -15,20 +15,8 @@ TAGS
RELEASE
control
docs
docker.properties.template
fairscheduler.xml.template
spark-defaults.conf.template
log4j.properties
log4j.properties.template
metrics.properties
metrics.properties.template
slaves
slaves.template
spark-env.sh
spark-env.cmd
spark-env.sh.template
log4j-defaults.properties
log4j-defaults-repl.properties
bootstrap-tooltip.js
jquery-1.11.1.min.js
d3.min.js
Expand Down Expand Up @@ -94,4 +82,5 @@ INDEX
gen-java.*
.*avpr
org.apache.spark.sql.sources.DataSourceRegister
org.apache.spark.scheduler.SparkHistoryListenerFactory
.*parquet
714 changes: 27 additions & 687 deletions LICENSE

Large diffs are not rendered by default.

35 changes: 35 additions & 0 deletions NOTICE
Original file line number Diff line number Diff line change
Expand Up @@ -572,3 +572,38 @@ Copyright 2009-2013 The Apache Software Foundation

Apache Avro IPC
Copyright 2009-2013 The Apache Software Foundation


Vis.js
Copyright 2010-2015 Almende B.V.

Vis.js is dual licensed under both

* The Apache 2.0 License
http://www.apache.org/licenses/LICENSE-2.0

and

* The MIT License
http://opensource.org/licenses/MIT

Vis.js may be distributed under either license.


Vis.js uses and redistributes the following third-party libraries:

- component-emitter
https://github.com/component/emitter
The MIT License

- hammer.js
http://hammerjs.github.io/
The MIT License

- moment.js
http://momentjs.com/
The MIT License

- keycharm
https://github.com/AlexDM0/keycharm
The MIT License
6 changes: 6 additions & 0 deletions R/install-dev.bat
Original file line number Diff line number Diff line change
Expand Up @@ -25,3 +25,9 @@ set SPARK_HOME=%~dp0..
MKDIR %SPARK_HOME%\R\lib

R.exe CMD INSTALL --library="%SPARK_HOME%\R\lib" %SPARK_HOME%\R\pkg\

rem Zip the SparkR package so that it can be distributed to worker nodes on YARN
pushd %SPARK_HOME%\R\lib
%JAVA_HOME%\bin\jar.exe cfM "%SPARK_HOME%\R\lib\sparkr.zip" SparkR
popd

4 changes: 4 additions & 0 deletions R/install-dev.sh
Original file line number Diff line number Diff line change
Expand Up @@ -42,4 +42,8 @@ Rscript -e ' if("devtools" %in% rownames(installed.packages())) { library(devtoo
# Install SparkR to $LIB_DIR
R CMD INSTALL --library=$LIB_DIR $FWDIR/pkg/

# Zip the SparkR package so that it can be distributed to worker nodes on YARN
cd $LIB_DIR
jar cfM "$LIB_DIR/sparkr.zip" SparkR

popd > /dev/null
2 changes: 1 addition & 1 deletion R/pkg/.lintr
Original file line number Diff line number Diff line change
@@ -1,2 +1,2 @@
linters: with_defaults(line_length_linter(100), camel_case_linter = NULL, open_curly_linter(allow_single_line = TRUE), closed_curly_linter(allow_single_line = TRUE))
linters: with_defaults(line_length_linter(100), camel_case_linter = NULL, open_curly_linter(allow_single_line = TRUE), closed_curly_linter(allow_single_line = TRUE), commented_code_linter = NULL)
exclusions: list("inst/profile/general.R" = 1, "inst/profile/shell.R")
2 changes: 2 additions & 0 deletions R/pkg/DESCRIPTION
Original file line number Diff line number Diff line change
Expand Up @@ -33,4 +33,6 @@ Collate:
'mllib.R'
'serialize.R'
'sparkR.R'
'stats.R'
'types.R'
'utils.R'
41 changes: 40 additions & 1 deletion R/pkg/NAMESPACE
Original file line number Diff line number Diff line change
Expand Up @@ -23,10 +23,18 @@ export("setJobGroup",
exportClasses("DataFrame")

exportMethods("arrange",
"as.data.frame",
"attach",
"cache",
"collect",
"colnames",
"colnames<-",
"coltypes",
"coltypes<-",
"columns",
"count",
"cov",
"corr",
"crosstab",
"describe",
"dim",
Expand All @@ -38,6 +46,7 @@ exportMethods("arrange",
"fillna",
"filter",
"first",
"freqItems",
"group_by",
"groupBy",
"head",
Expand All @@ -50,6 +59,7 @@ exportMethods("arrange",
"mutate",
"na.omit",
"names",
"names<-",
"ncol",
"nrow",
"orderBy",
Expand All @@ -61,6 +71,7 @@ exportMethods("arrange",
"repartition",
"sample",
"sample_frac",
"sampleBy",
"saveAsParquetFile",
"saveAsTable",
"saveDF",
Expand All @@ -78,6 +89,7 @@ exportMethods("arrange",
"unique",
"unpersist",
"where",
"with",
"withColumn",
"withColumnRenamed",
"write.df")
Expand All @@ -90,6 +102,7 @@ exportMethods("%in%",
"add_months",
"alias",
"approxCountDistinct",
"array_contains",
"asc",
"ascii",
"asin",
Expand All @@ -104,6 +117,7 @@ exportMethods("%in%",
"cbrt",
"ceil",
"ceiling",
"column",
"concat",
"concat_ws",
"contains",
Expand All @@ -113,13 +127,17 @@ exportMethods("%in%",
"count",
"countDistinct",
"crc32",
"cume_dist",
"date_add",
"date_format",
"date_sub",
"datediff",
"dayofmonth",
"dayofyear",
"decode",
"dense_rank",
"desc",
"encode",
"endsWith",
"exp",
"explode",
Expand All @@ -144,8 +162,11 @@ exportMethods("%in%",
"isNaN",
"isNotNull",
"isNull",
"kurtosis",
"lag",
"last",
"last_day",
"lead",
"least",
"length",
"levenshtein",
Expand All @@ -171,17 +192,21 @@ exportMethods("%in%",
"nanvl",
"negate",
"next_day",
"ntile",
"otherwise",
"percent_rank",
"pmod",
"quarter",
"rand",
"randn",
"rank",
"regexp_extract",
"regexp_replace",
"reverse",
"rint",
"rlike",
"round",
"row_number",
"rpad",
"rtrim",
"second",
Expand All @@ -190,12 +215,19 @@ exportMethods("%in%",
"shiftLeft",
"shiftRight",
"shiftRightUnsigned",
"sd",
"sign",
"signum",
"sin",
"sinh",
"size",
"skewness",
"sort_array",
"soundex",
"stddev",
"stddev_pop",
"stddev_samp",
"struct",
"sqrt",
"startsWith",
"substr",
Expand All @@ -214,6 +246,10 @@ exportMethods("%in%",
"unhex",
"unix_timestamp",
"upper",
"var",
"variance",
"var_pop",
"var_samp",
"weekofyear",
"when",
"year")
Expand All @@ -224,15 +260,18 @@ exportMethods("agg")
export("sparkRSQL.init",
"sparkRHive.init")

export("cacheTable",
export("as.DataFrame",
"cacheTable",
"clearCache",
"createDataFrame",
"createExternalTable",
"dropTempTable",
"jsonFile",
"read.json",
"loadDF",
"parquetFile",
"read.df",
"read.parquet",
"sql",
"table",
"tableNames",
Expand Down
Loading