Skip to content
Closed
Show file tree
Hide file tree
Changes from 1 commit
Commits
Show all changes
862 commits
Select commit Hold shift + click to select a range
5aca6ad
[SPARK-11767] [SQL] limit the size of caced batch
Nov 17, 2015
fa603e0
[SPARK-11732] Removes some MiMa false positives
thunterdb Nov 17, 2015
328eb49
[SPARK-11729] Replace example code in ml-linear-methods.md using incl…
yinxusen Nov 17, 2015
6eb7008
[SPARK-11763][ML] Add save,load to LogisticRegression Estimator
jkbradley Nov 17, 2015
3e9e638
[SPARK-11764][ML] make Param.jsonEncode/jsonDecode support Vector
mengxr Nov 17, 2015
936bc0b
[SPARK-11786][CORE] Tone down messages from akka error monitor.
Nov 17, 2015
928d631
[SPARK-11740][STREAMING] Fix the race condition of two checkpoints in…
zsxwing Nov 17, 2015
965245d
[SPARK-9552] Add force control for killExecutors to avoid false killi…
GraceH Nov 17, 2015
e29656f
[MINOR] Correct comments in JavaDirectKafkaWordCount
Nov 17, 2015
3720b14
[SPARK-11790][STREAMING][TESTS] Increase the connection timeout
zsxwing Nov 17, 2015
52c734b
[SPARK-11771][YARN][TRIVIAL] maximum memory in yarn is controlled by …
holdenk Nov 17, 2015
b362d50
[SPARK-11726] Throw exception on timeout when waiting for REST server…
jacek-lewandowski Nov 17, 2015
75a2922
[SPARK-9065][STREAMING][PYSPARK] Add MessageHandler for Kafka Python API
jerryshao Nov 18, 2015
ed8d153
[SPARK-11793][SQL] Dataset should set the resolved encoders internall…
rxin Nov 18, 2015
bf25f9b
[SPARK-11016] Move RoaringBitmap to explicit Kryo serializer
Nov 18, 2015
e33053e
[SPARK-11583] [CORE] MapStatus Using RoaringBitmap More Properly
yaooqinn Nov 18, 2015
98be816
[SPARK-11737] [SQL] Fix serialization of UTF8String with Kyro
Nov 18, 2015
91f4b6f
[SPARK-11797][SQL] collect, first, and take should use encoders for s…
rxin Nov 18, 2015
8fb775b
[SPARK-11755][R] SparkR should export "predict"
yanboliang Nov 18, 2015
446738e
[SPARK-11761] Prevent the call to StreamingContext#stop() in the list…
tedyu Nov 18, 2015
67a5132
[SPARK-7013][ML][TEST] Add unit test for spark.ml StandardScaler
RoyGao Nov 18, 2015
2f191c6
[SPARK-11643] [SQL] parse year with leading zero
Nov 18, 2015
9154f89
[SPARK-11728] Replace example code in ml-ensembles.md using include_e…
yinxusen Nov 18, 2015
8019f66
[SPARK-10186][SQL][FOLLOW-UP] simplify test
cloud-fan Nov 18, 2015
5e2b444
[SPARK-11802][SQL] Kryo-based encoder for opaque types in Datasets
rxin Nov 18, 2015
1714350
[SPARK-11792][SQL] SizeEstimator cannot provide a good size estimatio…
yhuai Nov 18, 2015
b8f4379
[SPARK-10946][SQL] JDBC - Use Statement.executeUpdate instead of Prep…
somideshmukh Nov 18, 2015
e62820c
[SPARK-6541] Sort executors by ID (numeric)
jbonofre Nov 18, 2015
9631ca3
[SPARK-11652][CORE] Remote code execution with InvokerTransformer
srowen Nov 18, 2015
1429e0a
rmse was wrongly calculated
Nov 18, 2015
3a6807f
[SPARK-11804] [PYSPARK] Exception raise when using Jdbc predicates opt…
zjffdu Nov 18, 2015
a97d6f3
[SPARK-11281][SPARKR] Add tests covering the issue.
zero323 Nov 18, 2015
224723e
[SPARK-11773][SPARKR] Implement collection functions in SparkR.
Nov 18, 2015
3cca5ff
[SPARK-11195][CORE] Use correct classloader for TaskResultGetter
Nov 18, 2015
cffb899
[SPARK-11803][SQL] fix Dataset self-join
cloud-fan Nov 18, 2015
33b8373
[SPARK-11725][SQL] correctly handle null inputs for UDF
cloud-fan Nov 18, 2015
dbf428c
[SPARK-11795][SQL] combine grouping attributes into a single NamedExp…
cloud-fan Nov 18, 2015
90a7519
[MINOR][BUILD] Ignore ensime cache
jodersky Nov 18, 2015
6f99522
[SPARK-11792] [SQL] [FOLLOW-UP] Change SizeEstimation to KnownSizeEst…
yhuai Nov 18, 2015
94624ea
[SPARK-11739][SQL] clear the instantiated SQLContext
Nov 18, 2015
31921e0
[SPARK-4557][STREAMING] Spark Streaming foreachRDD Java API method sh…
BryanCutler Nov 18, 2015
a416e41
[SPARK-11809] Switch the default Mesos mode to coarse-grained mode
rxin Nov 18, 2015
7c5b641
[SPARK-10745][CORE] Separate configs between shuffle and RPC
zsxwing Nov 18, 2015
09ad953
[SPARK-11720][SQL][ML] Handle edge cases when count = 0 or 1 for Stat…
JihongMA Nov 18, 2015
045a4f0
[SPARK-6790][ML] Add spark.ml LinearRegression import/export
fayeshine Nov 18, 2015
2acdf10
[SPARK-6789][ML] Add Readable, Writable support for spark.ml ALS, ALS…
jkbradley Nov 18, 2015
e391abd
[SPARK-11813][MLLIB] Avoid serialization of vocab in Word2Vec
hhbyyh Nov 18, 2015
e222d75
[SPARK-11684][R][ML][DOC] Update SparkR glm API doc, user guide and e…
yanboliang Nov 18, 2015
603a721
[SPARK-11820][ML][PYSPARK] PySpark LiR & LoR should support weightCol
yanboliang Nov 18, 2015
54db797
[SPARK-11544][SQL] sqlContext doesn't use PathFilter
dilipbiswal Nov 18, 2015
5df0894
[SPARK-11810][SQL] Java-based encoder for opaque types in Datasets.
rxin Nov 18, 2015
7e987de
[SPARK-6787][ML] add read/write to estimators under ml.feature (1)
mengxr Nov 18, 2015
3a98519
[SPARK-11649] Properly set Akka frame size in SparkListenerSuite test
JoshRosen Nov 18, 2015
c07a50b
[SPARK-10930] History "Stages" page "duration" can be confusing
Nov 18, 2015
4b11712
[SPARK-11495] Fix potential socket / file handle leaks that were foun…
JoshRosen Nov 19, 2015
a402c92
[SPARK-11814][STREAMING] Add better default checkpoint duration
tdas Nov 19, 2015
921900f
[SPARK-11791] Fix flaky test in BatchedWriteAheadLogSuite
brkyvz Nov 19, 2015
59a5013
[SPARK-11636][SQL] Support classes defined in the REPL with Encoders
marmbrus Nov 19, 2015
e99d339
[SPARK-11839][ML] refactor save/write traits
mengxr Nov 19, 2015
e61367b
[SPARK-11833][SQL] Add Java tests for Kryo/Java Dataset encoders
rxin Nov 19, 2015
6d0848b
[SPARK-11787][SQL] Improve Parquet scan performance when using flat s…
nongli Nov 19, 2015
9c0654d
Revert "[SPARK-11544][SQL] sqlContext doesn't use PathFilter"
yhuai Nov 19, 2015
67c7582
[SPARK-11816][ML] fix some style issue in ML/MLlib examples
hhbyyh Nov 19, 2015
fc3f77b
[SPARK-11614][SQL] serde parameters should be set only when all param…
navis Nov 19, 2015
d02d5b9
[SPARK-11842][ML] Small cleanups to existing Readers and Writers
jkbradley Nov 19, 2015
1a93323
[SPARK-11339][SPARKR] Document the list of functions in R base packag…
felixcheung Nov 19, 2015
f449992
[SPARK-11849][SQL] Analyzer should replace current_date and current_t…
rxin Nov 19, 2015
9628788
[SPARK-11840][SQL] Restore the 1.5's behavior of planning a single di…
yhuai Nov 19, 2015
72d150c
[SPARK-11830][CORE] Make NettyRpcEnv bind to the specified host
zsxwing Nov 19, 2015
276a7e1
[SPARK-11633][SQL] LogicalRDD throws TreeNode Exception : Failed to C…
gatorsmile Nov 19, 2015
7d4aba1
[SPARK-11848][SQL] Support EXPLAIN in DataSet APIs
gatorsmile Nov 19, 2015
47d1c23
[SPARK-11750][SQL] revert SPARK-11727 and code clean up
cloud-fan Nov 19, 2015
4700074
[SPARK-11778][SQL] parse table name before it is passed to lookupRela…
Nov 19, 2015
599a8c6
[SPARK-11812][PYSPARK] invFunc=None works properly with python's redu…
dtolpin Nov 19, 2015
014c0f7
[SPARK-11858][SQL] Move sql.columnar into sql.execution.
rxin Nov 19, 2015
90d384d
[SPARK-11831][CORE][TESTS] Use port 0 to avoid port conflicts in tests
zsxwing Nov 19, 2015
3bd77b2
[SPARK-11799][CORE] Make it explicit in executor logs that uncaught e…
Nov 19, 2015
f7135ed
[SPARK-11828][CORE] Register DAGScheduler metrics source after app id…
Nov 19, 2015
01403aa
[SPARK-11746][CORE] Use cache-aware method dependencies
suyanNone Nov 19, 2015
37cff1b
[SPARK-11275][SQL] Incorrect results when using rollup/cube
aray Nov 19, 2015
880128f
[SPARK-4134][CORE] Lower severity of some executor loss logs.
Nov 20, 2015
b2cecb8
[SPARK-11845][STREAMING][TEST] Added unit test to verify TrackStateRD…
tdas Nov 20, 2015
ee21407
[SPARK-11864][SQL] Improve performance of max/min
Nov 20, 2015
7ee7d5a
[SPARK-11544][SQL][TEST-HADOOP1.0] sqlContext doesn't use PathFilter
dilipbiswal Nov 20, 2015
4114ce2
[SPARK-11846] Add save/load for AFTSurvivalRegression and IsotonicReg…
yinxusen Nov 20, 2015
3b7f056
[SPARK-11829][ML] Add read/write to estimators under ml.feature (II)
yanboliang Nov 20, 2015
7216f40
[SPARK-11875][ML][PYSPARK] Update doc for PySpark HasCheckpointInterval
yanboliang Nov 20, 2015
0fff8eb
[SPARK-11869][ML] Clean up TempDirectory properly in ML tests
jkbradley Nov 20, 2015
3e1d120
[SPARK-11867] Add save/load for kmeans and naive bayes
yinxusen Nov 20, 2015
a66142d
[SPARK-11877] Prevent agg. fallback conf. from leaking across test su…
JoshRosen Nov 20, 2015
9ace2e5
[SPARK-11852][ML] StandardScaler minor refactor
yanboliang Nov 20, 2015
e359d5d
[SPARK-11689][ML] Add user guide and example code for LDA under spark.ml
hhbyyh Nov 20, 2015
bef361c
[SPARK-11876][SQL] Support printSchema in DataSet API
gatorsmile Nov 20, 2015
60bfb11
[SPARK-11817][SQL] Truncating the fractional seconds to prevent inser…
viirya Nov 20, 2015
3b9d2a3
[SPARK-11819][SQL] nice error message for missing encoder
cloud-fan Nov 20, 2015
652def3
[SPARK-11650] Reduce RPC timeouts to speed up slow AkkaUtilsSuite test
JoshRosen Nov 20, 2015
9ed4ad4
[SPARK-11724][SQL] Change casting between int and timestamp to consis…
nongli Nov 20, 2015
be7a2cf
[SPARK-11870][STREAMING][PYSPARK] Rethrow the exceptions in Transform…
zsxwing Nov 20, 2015
89fd9bd
[SPARK-11887] Close PersistenceEngine at the end of PersistenceEngine…
JoshRosen Nov 20, 2015
03ba56d
[SPARK-11716][SQL] UDFRegistration just drops the input type when re-…
jbonofre Nov 20, 2015
a6239d5
[SPARK-11756][SPARKR] Fix use of aliases - SparkR can not output help…
felixcheung Nov 20, 2015
4b84c72
[SPARK-11636][SQL] Support classes defined in the REPL with Encoders
marmbrus Nov 20, 2015
ed47b1e
[SPARK-11549][DOCS] Replace example code in mllib-evaluation-metrics.…
Nov 20, 2015
58b4e4f
[SPARK-11787][SPARK-11883][SQL][FOLLOW-UP] Cleanup for this patch.
nongli Nov 20, 2015
968acf3
[SPARK-11889][SQL] Fix type inference for GroupedDataset.agg in REPL
marmbrus Nov 20, 2015
68ed046
[SPARK-11890][SQL] Fix compilation for Scala 2.11
marmbrus Nov 20, 2015
4781587
[HOTFIX] Fix Java Dataset Tests
marmbrus Nov 21, 2015
a2dce22
Revert "[SPARK-11689][ML] Add user guide and example code for LDA und…
mengxr Nov 21, 2015
7d3f922
[SPARK-11819][SQL][FOLLOW-UP] fix scala 2.11 build
cloud-fan Nov 21, 2015
54328b6
[SPARK-11900][SQL] Add since version for all encoders
rxin Nov 21, 2015
5967102
[SPARK-11901][SQL] API audit for Aggregator.
rxin Nov 21, 2015
ff442bb
[SPARK-11899][SQL] API audit for GroupedDataset.
rxin Nov 21, 2015
426004a
[SPARK-11908][SQL] Add NullType support to RowEncoder
viirya Nov 22, 2015
fe89c18
[SPARK-11895][ML] rename and refactor DatasetExample under mllib/exam…
mengxr Nov 23, 2015
a6fda0b
[SPARK-6791][ML] Add read/write for CrossValidator and Evaluators
jkbradley Nov 23, 2015
fc4b792
[SPARK-11835] Adds a sidebar menu to MLlib's documentation
thunterdb Nov 23, 2015
d9cf9c2
[SPARK-11912][ML] ml.feature.PCA minor refactor
yanboliang Nov 23, 2015
4be360d
[SPARK-11902][ML] Unhandled case in VectorAssembler#transform
BenFradet Nov 23, 2015
94ce65d
[SPARK-11628][SQL] support column datatype of char(x) to recognize Hi…
xguo27 Nov 23, 2015
1a5baaa
[SPARK-11894][SQL] fix isNull for GetInternalRowField
cloud-fan Nov 23, 2015
f2996e0
[SPARK-11921][SQL] fix `nullable` of encoder schema
cloud-fan Nov 23, 2015
946b406
[SPARK-11913][SQL] support typed aggregate with complex buffer schema
cloud-fan Nov 23, 2015
5fd86e4
[SPARK-7173][YARN] Add label expression support for application master
jerryshao Nov 23, 2015
5231cd5
[SPARK-11762][NETWORK] Account for active streams when couting outsta…
Nov 23, 2015
98d7ec7
[SPARK-11920][ML][DOC] ML LinearRegression should use correct dataset…
yanboliang Nov 23, 2015
f6dcc6e
[SPARK-11837][EC2] python3 compatibility for launching ec2 m3 instances
mortada Nov 23, 2015
1b6e938
[SPARK-4424] Remove spark.driver.allowMultipleContexts override in tests
JoshRosen Nov 23, 2015
1d91202
[SPARK-11836][SQL] udf/cast should not create new SQLContext
Nov 23, 2015
242be7d
[SPARK-11910][STREAMING][DOCS] Update twitter4j dependency version
lresende Nov 23, 2015
7cfa4c6
[SPARK-11865][NETWORK] Avoid returning inactive client in TransportCl…
Nov 23, 2015
c2467da
[SPARK-11140][CORE] Transfer files using network lib when using Netty…
Nov 23, 2015
9db5f60
[SPARK-9866][SQL] Speed up VersionsSuite by using persistent Ivy cache
JoshRosen Nov 24, 2015
1057456
[SPARK-10560][PYSPARK][MLLIB][DOCS] Make StreamingLogisticRegressionW…
BryanCutler Nov 24, 2015
026ea2e
Updated sql programming guide to include jdbc fetch size
sksamuel Nov 24, 2015
8d57524
[SPARK-11933][SQL] Rename mapGroup -> mapGroups and flatMapGroup -> f…
rxin Nov 24, 2015
6cf51a7
[SPARK-11903] Remove --skip-java-test
nchammas Nov 24, 2015
4021a28
[SPARK-10707][SQL] Fix nullability computation in union output
mbautin Nov 24, 2015
12eea83
[SPARK-11897][SQL] Add @scala.annotations.varargs to sql functions
xguo27 Nov 24, 2015
800bd79
[SPARK-11906][WEB UI] Speculation Tasks Cause ProgressBar UI Overflow
saurfang Nov 24, 2015
d4a5e6f
[SPARK-11043][SQL] BugFix:Set the operator log in the thrift server.
SaintBacchus Nov 24, 2015
5889880
[SPARK-11592][SQL] flush spark-sql command line history to history file
adrian-wang Nov 24, 2015
be9dd15
[SPARK-11818][REPL] Fix ExecutorClassLoader to lookup resources from …
HeartSaVioR Nov 24, 2015
e5aaae6
[SPARK-11942][SQL] fix encoder life cycle for CoGroup
cloud-fan Nov 24, 2015
56a0aba
[SPARK-11952][ML] Remove duplicate ml examples
yanboliang Nov 24, 2015
9e24ba6
[SPARK-11521][ML][DOC] Document that Logistic, Linear Regression summ…
jkbradley Nov 24, 2015
52bc25c
[SPARK-11847][ML] Model export/import for spark.ml: LDA
hhbyyh Nov 24, 2015
19530da
[SPARK-11926][SQL] unify GetStructField and GetInternalRowField
cloud-fan Nov 24, 2015
8101254
[SPARK-11872] Prevent the call to SparkContext#stop() in the listener…
tedyu Nov 24, 2015
f315272
[SPARK-11946][SQL] Audit pivot API for 1.6.
rxin Nov 24, 2015
e6dd237
[SPARK-11929][CORE] Make the repl log4j configuration override the ro…
Nov 24, 2015
58d9b26
[SPARK-11805] free the array in UnsafeExternalSorter during spilling
Nov 24, 2015
34ca392
Added a line of comment to explain why the extra sort exists in pivot.
rxin Nov 24, 2015
c7f95df
[SPARK-11783][SQL] Fixes execution Hive client when using remote Hive…
liancheng Nov 24, 2015
238ae51
[SPARK-11914][SQL] Support coalesce and repartition in Dataset APIs
gatorsmile Nov 24, 2015
25bbd3c
[SPARK-11967][SQL] Consistent use of varargs for multiple paths in Da…
rxin Nov 25, 2015
4d6bbbc
[SPARK-11947][SQL] Mark deprecated methods with "This will be removed…
rxin Nov 25, 2015
a5d9887
[STREAMING][FLAKY-TEST] Catch execution context race condition in `Fi…
brkyvz Nov 25, 2015
151d7c2
[SPARK-10621][SQL] Consistent naming for functions in SQL, Python, Scala
rxin Nov 25, 2015
2169886
[SPARK-11979][STREAMING] Empty TrackStateRDD cannot be checkpointed a…
tdas Nov 25, 2015
2610e06
[SPARK-11970][SQL] Adding JoinType into JoinWith and support Sample i…
gatorsmile Nov 25, 2015
a0f1a11
[SPARK-11981][SQL] Move implementations of methods back to DataFrame …
rxin Nov 25, 2015
6385002
[SPARK-11686][CORE] Issue WARN when dynamic allocation is disabled du…
Nov 25, 2015
b9b6fbe
[SPARK-11860][PYSAPRK][DOCUMENTATION] Invalid argument specification …
zjffdu Nov 25, 2015
0a5aef7
[SPARK-10666][SPARK-6880][CORE] Use properties from ActiveJob associa…
markhamstra Nov 25, 2015
c1f85fc
[SPARK-11956][CORE] Fix a few bugs in network lib-based file transfer.
Nov 25, 2015
faabdfa
[SPARK-11984][SQL][PYTHON] Fix typos in doc for pivot for scala and p…
felixcheung Nov 25, 2015
6b78157
[SPARK-11974][CORE] Not all the temp dirs had been deleted when the J…
pzzs Nov 25, 2015
dc1d324
[SPARK-11969] [SQL] [PYSPARK] visualization of SQL query for pyspark
Nov 25, 2015
0dee44a
[MINOR] Remove unnecessary spaces in `include_example.rb`
yu-iskw Nov 25, 2015
67b6732
[DOCUMENTATION] Fix minor doc error
zjffdu Nov 25, 2015
83653ac
[SPARK-10864][WEB UI] app name is hidden if window is resized
ajbozarth Nov 25, 2015
9f3e59a
[SPARK-11880][WINDOWS][SPARK SUBMIT] bin/load-spark-env.cmd loads spa…
wangt Nov 25, 2015
88875d9
[SPARK-10558][CORE] Fix wrong executor state in Master
jerryshao Nov 25, 2015
d29e2ef
[SPARK-11935][PYSPARK] Send the Python exceptions in TransformFunctio…
zsxwing Nov 25, 2015
4e81783
[SPARK-11866][NETWORK][CORE] Make sure timed out RPCs are cleaned up.
Nov 25, 2015
ecac283
Fix Aggregator documentation (rename present to finish).
rxin Nov 25, 2015
21e5606
[SPARK-11983][SQL] remove all unused codegen fallback trait
adrian-wang Nov 25, 2015
cc243a0
[SPARK-11206] Support SQL UI on the history server
carsonwang Nov 25, 2015
d1930ec
[SPARK-12003] [SQL] remove the prefix for name after expanded star
Nov 26, 2015
068b643
[SPARK-11980][SPARK-10621][SQL] Fix json_tuple and add test cases for
gatorsmile Nov 26, 2015
d3ef693
[SPARK-11999][CORE] Fix the issue that ThreadUtils.newDaemonCachedThr…
zsxwing Nov 26, 2015
27d69a0
[SPARK-11973] [SQL] push filter through aggregation with alias and li…
Nov 26, 2015
001f052
[SPARK-12005][SQL] Work around VerifyError in HyperLogLogPlusPlus.
Nov 26, 2015
bc16a67
[SPARK-11863][SQL] Unable to resolve order by if it contains mixture …
dilipbiswal Nov 26, 2015
ad76562
[SPARK-11998][SQL][TEST-HADOOP2.0] When downloading Hadoop artifacts …
yhuai Nov 27, 2015
de28e4d
[SPARK-11973][SQL] Improve optimizer code readability.
rxin Nov 27, 2015
4376b5b
doc typo: "classificaion" -> "classification"
muxator Nov 27, 2015
0c1e72e
[SPARK-11996][CORE] Make the executor thread dump work again
zsxwing Nov 27, 2015
6f6bb0e
[SPARK-12011][SQL] Stddev/Variance etc should support columnName as a…
yanboliang Nov 27, 2015
b63938a
[SPARK-11881][SQL] Fix for postgresql fetchsize > 0
mariusvniekerk Nov 27, 2015
d822088
[SPARK-11917][PYSPARK] Add SQLContext#dropTempTable to PySpark
zjffdu Nov 27, 2015
4d4cbc0
[SPARK-11778][SQL] add regression test
Nov 27, 2015
5eaed4e
[SPARK-11991] fixes
Nov 27, 2015
10e315c
Fix style violation for b63938a8b04
rxin Nov 27, 2015
a374e20
[SPARK-11997] [SQL] NPE when save a DataFrame as parquet and partitio…
dilipbiswal Nov 27, 2015
ba02f6c
[SPARK-12025][SPARKR] Rename some window rank function names for SparkR
yanboliang Nov 27, 2015
f57e6c9
[SPARK-12021][STREAMING][TESTS] Fix the potential dead-lock in Stream…
zsxwing Nov 27, 2015
b992152
[SPARK-12020][TESTS][TEST-HADOOP2.0] PR builder cannot trigger hadoop…
yhuai Nov 27, 2015
149cd69
[SPARK-12028] [SQL] get_json_object returns an incorrect result when …
gatorsmile Nov 28, 2015
28e46ab
[SPARK-12029][SPARKR] Improve column functions signature, param check…
felixcheung Nov 29, 2015
c793d2d
[SPARK-9319][SPARKR] Add support for setting column names, types
felixcheung Nov 29, 2015
cc7a1bc
[SPARK-11781][SPARKR] SparkR has problem in inferring type of raw type.
Nov 29, 2015
3d28081
[SPARK-12024][SQL] More efficient multi-column counting.
hvanhovell Nov 29, 2015
0ddfe78
[SPARK-12039] [SQL] Ignore HiveSparkSubmitSuite's "SPARK-9757 Persist…
yhuai Nov 30, 2015
e074944
[SPARK-11859][MESOS] SparkContext accepts invalid Master URLs in the …
toddwan Nov 30, 2015
953e8e6
[MINOR][BUILD] Changed the comment to reflect the plugin project is t…
ScrapCodes Nov 30, 2015
26c3581
[DOC] Explicitly state that top maintains the order of elements
mineo Nov 30, 2015
bf0e85a
[SPARK-12023][BUILD] Fix warnings while packaging spark with maven.
ScrapCodes Nov 30, 2015
2db4662
[SPARK-11989][SQL] Only use commit in JDBC data source if the underly…
CK50 Nov 30, 2015
17275fa
[SPARK-11700] [SQL] Remove thread local SQLContext in SparkPlan
Nov 30, 2015
8df584b
[SPARK-11982] [SQL] improve performance of cartesian product
Nov 30, 2015
f2fbfa4
[MINOR][DOCS] fixed list display in ml-ensembles
BenFradet Nov 30, 2015
2c5dee0
Revert "[SPARK-11206] Support SQL UI on the history server"
JoshRosen Nov 30, 2015
a8ceec5
[SPARK-12053][CORE] EventLoggingListener.getLogPath needs 4 parameters
chutium Nov 30, 2015
e232720
[SPARK-11689][ML] Add user guide and example code for LDA under spark.ml
hhbyyh Nov 30, 2015
de64b65
[SPARK-11975][ML] Remove duplicate mllib example (DT/RF/GBT in Java/P…
yanboliang Nov 30, 2015
5535888
[SPARK-11960][MLLIB][DOC] User guide for streaming tests
feynmanliang Nov 30, 2015
ecc00ec
fix Maven build
davies Nov 30, 2015
edb26e7
[SPARK-12058][HOTFIX] Disable KinesisStreamTests
zsxwing Dec 1, 2015
d3ca8cf
[SPARK-12000] Fix API doc generation issues
JoshRosen Dec 1, 2015
e6dc89a
[SPARK-12035] Add more debug information in include_example tag of Je…
yinxusen Dec 1, 2015
0a46e43
[SPARK-12037][CORE] initialize heartbeatReceiverRef before calling st…
CodingCat Dec 1, 2015
9bf2120
[SPARK-12007][NETWORK] Avoid copies in the network lib's RPC layer.
Dec 1, 2015
96bf468
[SPARK-12049][CORE] User JVM shutdown hook can cause deadlock at shut…
srowen Dec 1, 2015
f73379b
[HOTFIX][SPARK-12000] Add missing quotes in Jekyll API docs plugin.
JoshRosen Dec 1, 2015
9693b0d
[SPARK-12018][SQL] Refactor common subexpression elimination code
viirya Dec 1, 2015
a0af0e3
[SPARK-11898][MLLIB] Use broadcast for the global tables in Word2Vec
hhbyyh Dec 1, 2015
c87531b
[SPARK-11949][SQL] Set field nullable property for GroupingSets to ge…
viirya Dec 1, 2015
1401166
[SPARK-12060][CORE] Avoid memory copy in JavaSerializerInstance.seria…
zsxwing Dec 1, 2015
69dbe6b
[SPARK-12046][DOC] Fixes various ScalaDoc/JavaDoc issues
liancheng Dec 1, 2015
8ddc55f
[SPARK-12068][SQL] use a single column in Dataset.groupBy and count w…
cloud-fan Dec 1, 2015
9df2462
[SPARK-11856][SQL] add type cast if the real type is different but co…
cloud-fan Dec 1, 2015
fd95eea
[SPARK-11954][SQL] Encoder for JavaBeans
cloud-fan Dec 1, 2015
0a7bca2
[SPARK-11905][SQL] Support Persist/Cache and Unpersist in Dataset APIs
gatorsmile Dec 1, 2015
6a8cf80
[SPARK-11821] Propagate Kerberos keytab for all environments
woj-i Dec 1, 2015
34e7093
[SPARK-12065] Upgrade Tachyon from 0.8.1 to 0.8.2
JoshRosen Dec 1, 2015
2cef1cd
[SPARK-12030] Fix Platform.copyMemory to handle overlapping regions.
nongli Dec 1, 2015
60b541e
[SPARK-12004] Preserve the RDD partitioner through RDD checkpointing
tdas Dec 1, 2015
328b757
Revert "[SPARK-12060][CORE] Avoid memory copy in JavaSerializerInstan…
zsxwing Dec 1, 2015
e76431f
[SPARK-11961][DOC] Add docs of ChiSqSelector
yinxusen Dec 1, 2015
f292018
[SPARK-12002][STREAMING][PYSPARK] Fix python direct stream checkpoint…
jerryshao Dec 1, 2015
ef6790f
[SPARK-12075][SQL] Speed up HiveComparisionTest by avoiding / speedin…
JoshRosen Dec 1, 2015
47a0abc
[SPARK-11328][SQL] Improve error message when hitting this issue
nongli Dec 1, 2015
5a8b5fd
[SPARK-11788][SQL] surround timestamp/date value with quotes in JDBC …
Dec 1, 2015
5872a9d
[SPARK-11352][SQL] Escape */ in the generated comments.
yhuai Dec 2, 2015
e96a70d
[SPARK-11596][SQL] In TreeNode's argString, if a TreeNode is not a ch…
yhuai Dec 2, 2015
1ce4adf
[SPARK-8414] Ensure context cleaner periodic cleanups
Dec 2, 2015
d96f8c9
[SPARK-12081] Make unified memory manager work with small heaps
Dec 2, 2015
772dc7f
remove unnecessary evaluation from SortOrder
cloud-fan Dec 2, 2015
a3e1313
fix comment
cloud-fan Dec 2, 2015
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Prev Previous commit
Next Next commit
[SPARK-11761] Prevent the call to StreamingContext#stop() in the list…
…ener bus's thread

See discussion toward the tail of apache#9723
From zsxwing :
```
The user should not call stop or other long-time work in a listener since it will block the listener thread, and prevent from stopping SparkContext/StreamingContext.

I cannot see an approach since we need to stop the listener bus's thread before stopping SparkContext/StreamingContext totally.
```
Proposed solution is to prevent the call to StreamingContext#stop() in the listener bus's thread.

Author: tedyu <[email protected]>

Closes apache#9741 from tedyu/master.
  • Loading branch information
tedyu authored and tdas committed Nov 18, 2015
commit 446738e51fcda50cf2dc44123ff6bf12a1611dc0
Original file line number Diff line number Diff line change
Expand Up @@ -19,6 +19,7 @@ package org.apache.spark.util

import java.util.concurrent._
import java.util.concurrent.atomic.AtomicBoolean
import scala.util.DynamicVariable

import org.apache.spark.SparkContext

Expand Down Expand Up @@ -60,25 +61,27 @@ private[spark] abstract class AsynchronousListenerBus[L <: AnyRef, E](name: Stri
private val listenerThread = new Thread(name) {
setDaemon(true)
override def run(): Unit = Utils.tryOrStopSparkContext(sparkContext) {
while (true) {
eventLock.acquire()
self.synchronized {
processingEvent = true
}
try {
val event = eventQueue.poll
if (event == null) {
// Get out of the while loop and shutdown the daemon thread
if (!stopped.get) {
throw new IllegalStateException("Polling `null` from eventQueue means" +
" the listener bus has been stopped. So `stopped` must be true")
}
return
}
postToAll(event)
} finally {
AsynchronousListenerBus.withinListenerThread.withValue(true) {
while (true) {
eventLock.acquire()
self.synchronized {
processingEvent = false
processingEvent = true
}
try {
val event = eventQueue.poll
if (event == null) {
// Get out of the while loop and shutdown the daemon thread
if (!stopped.get) {
throw new IllegalStateException("Polling `null` from eventQueue means" +
" the listener bus has been stopped. So `stopped` must be true")
}
return
}
postToAll(event)
} finally {
self.synchronized {
processingEvent = false
}
}
}
}
Expand Down Expand Up @@ -177,3 +180,10 @@ private[spark] abstract class AsynchronousListenerBus[L <: AnyRef, E](name: Stri
*/
def onDropEvent(event: E): Unit
}

private[spark] object AsynchronousListenerBus {
/* Allows for Context to check whether stop() call is made within listener thread
*/
val withinListenerThread: DynamicVariable[Boolean] = new DynamicVariable[Boolean](false)
}

Original file line number Diff line number Diff line change
Expand Up @@ -44,7 +44,7 @@ import org.apache.spark.streaming.dstream._
import org.apache.spark.streaming.receiver.{ActorReceiver, ActorSupervisorStrategy, Receiver}
import org.apache.spark.streaming.scheduler.{JobScheduler, StreamingListener}
import org.apache.spark.streaming.ui.{StreamingJobProgressListener, StreamingTab}
import org.apache.spark.util.{CallSite, ShutdownHookManager, ThreadUtils, Utils}
import org.apache.spark.util.{AsynchronousListenerBus, CallSite, ShutdownHookManager, ThreadUtils, Utils}

/**
* Main entry point for Spark Streaming functionality. It provides methods used to create
Expand Down Expand Up @@ -693,6 +693,10 @@ class StreamingContext private[streaming] (
*/
def stop(stopSparkContext: Boolean, stopGracefully: Boolean): Unit = {
var shutdownHookRefToRemove: AnyRef = null
if (AsynchronousListenerBus.withinListenerThread.value) {
throw new SparkException("Cannot stop StreamingContext within listener thread of" +
" AsynchronousListenerBus")
}
synchronized {
try {
state match {
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -21,6 +21,7 @@ import scala.collection.mutable.{ArrayBuffer, HashMap, SynchronizedBuffer, Synch
import scala.concurrent.Future
import scala.concurrent.ExecutionContext.Implicits.global

import org.apache.spark.SparkException
import org.apache.spark.storage.StorageLevel
import org.apache.spark.streaming.dstream.DStream
import org.apache.spark.streaming.receiver.Receiver
Expand Down Expand Up @@ -161,6 +162,14 @@ class StreamingListenerSuite extends TestSuiteBase with Matchers {
}
}

test("don't call ssc.stop in listener") {
ssc = new StreamingContext("local[2]", "ssc", Milliseconds(1000))
val inputStream = ssc.receiverStream(new StreamingListenerSuiteReceiver)
inputStream.foreachRDD(_.count)

startStreamingContextAndCallStop(ssc)
}

test("onBatchCompleted with successful batch") {
ssc = new StreamingContext("local[2]", "test", Milliseconds(1000))
val inputStream = ssc.receiverStream(new StreamingListenerSuiteReceiver)
Expand Down Expand Up @@ -207,6 +216,17 @@ class StreamingListenerSuite extends TestSuiteBase with Matchers {
assert(failureReasons(1).contains("This is another failed job"))
}

private def startStreamingContextAndCallStop(_ssc: StreamingContext): Unit = {
val contextStoppingCollector = new StreamingContextStoppingCollector(_ssc)
_ssc.addStreamingListener(contextStoppingCollector)
val batchCounter = new BatchCounter(_ssc)
_ssc.start()
// Make sure running at least one batch
batchCounter.waitUntilBatchesCompleted(expectedNumCompletedBatches = 1, timeout = 10000)
_ssc.stop()
assert(contextStoppingCollector.sparkExSeen)
}

private def startStreamingContextAndCollectFailureReasons(
_ssc: StreamingContext, isFailed: Boolean = false): Map[Int, String] = {
val failureReasonsCollector = new FailureReasonsCollector()
Expand Down Expand Up @@ -320,3 +340,17 @@ class FailureReasonsCollector extends StreamingListener {
}
}
}
/**
* A StreamingListener that calls StreamingContext.stop().
*/
class StreamingContextStoppingCollector(val ssc: StreamingContext) extends StreamingListener {
@volatile var sparkExSeen = false
override def onBatchCompleted(batchCompleted: StreamingListenerBatchCompleted) {
try {
ssc.stop()
} catch {
case se: SparkException =>
sparkExSeen = true
}
}
}