Skip to content

Commit 15cd980

Browse files
committed
Fix spark-shell in branch-1.0
1 parent edea1ef commit 15cd980

File tree

5 files changed

+90
-9
lines changed

5 files changed

+90
-9
lines changed

bin/pyspark

Lines changed: 14 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -23,12 +23,18 @@ FWDIR="$(cd `dirname $0`/..; pwd)"
2323
# Export this as SPARK_HOME
2424
export SPARK_HOME="$FWDIR"
2525

26+
source $FWDIR/bin/utils.sh
27+
2628
SCALA_VERSION=2.10
2729

28-
if [[ "$@" = *--help ]] || [[ "$@" = *-h ]]; then
30+
function usage() {
2931
echo "Usage: ./bin/pyspark [options]" 1>&2
3032
$FWDIR/bin/spark-submit --help 2>&1 | grep -v Usage 1>&2
3133
exit 0
34+
}
35+
36+
if [[ "$@" = *--help ]] || [[ "$@" = *-h ]]; then
37+
usage
3238
fi
3339

3440
# Exit if the user hasn't compiled Spark
@@ -66,10 +72,11 @@ fi
6672
# Build up arguments list manually to preserve quotes and backslashes.
6773
# We export Spark submit arguments as an environment variable because shell.py must run as a
6874
# PYTHONSTARTUP script, which does not take in arguments. This is required for IPython notebooks.
69-
75+
SUBMIT_USAGE_FUNCTION=usage
76+
gatherSparkSubmitOpts "$@"
7077
PYSPARK_SUBMIT_ARGS=""
7178
whitespace="[[:space:]]"
72-
for i in "$@"; do
79+
for i in "${SUBMISSION_OPTS[@]}"; do
7380
if [[ $i =~ \" ]]; then i=$(echo $i | sed 's/\"/\\\"/g'); fi
7481
if [[ $i =~ $whitespace ]]; then i=\"$i\"; fi
7582
PYSPARK_SUBMIT_ARGS="$PYSPARK_SUBMIT_ARGS $i"
@@ -80,7 +87,10 @@ export PYSPARK_SUBMIT_ARGS
8087
if [[ "$1" =~ \.py$ ]]; then
8188
echo -e "\nWARNING: Running python applications through ./bin/pyspark is deprecated as of Spark 1.0." 1>&2
8289
echo -e "Use ./bin/spark-submit <python file>\n" 1>&2
83-
exec $FWDIR/bin/spark-submit "$@"
90+
primary=$1
91+
shift
92+
gatherSparkSubmitOpts "$@"
93+
exec $FWDIR/bin/spark-submit "${SUBMISSION_OPTS[@]}" $primary "${APPLICATION_OPTS[@]}"
8494
else
8595
# Only use ipython if no command line arguments were provided [SPARK-1134]
8696
if [[ "$IPYTHON" = "1" ]]; then

bin/spark-shell

Lines changed: 12 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -31,13 +31,21 @@ set -o posix
3131
## Global script variables
3232
FWDIR="$(cd `dirname $0`/..; pwd)"
3333

34-
if [[ "$@" = *--help ]] || [[ "$@" = *-h ]]; then
34+
function usage() {
3535
echo "Usage: ./bin/spark-shell [options]"
3636
$FWDIR/bin/spark-submit --help 2>&1 | grep -v Usage 1>&2
3737
exit 0
38+
}
39+
40+
if [[ "$@" = *--help ]] || [[ "$@" = *-h ]]; then
41+
usage
3842
fi
3943

40-
function main(){
44+
source $FWDIR/bin/utils.sh
45+
SUBMIT_USAGE_FUNCTION=usage
46+
gatherSparkSubmitOpts "$@"
47+
48+
function main() {
4149
if $cygwin; then
4250
# Workaround for issue involving JLine and Cygwin
4351
# (see http://sourceforge.net/p/jline/bugs/40/).
@@ -46,11 +54,11 @@ function main(){
4654
# (see https://github.com/sbt/sbt/issues/562).
4755
stty -icanon min 1 -echo > /dev/null 2>&1
4856
export SPARK_SUBMIT_OPTS="$SPARK_SUBMIT_OPTS -Djline.terminal=unix"
49-
$FWDIR/bin/spark-submit spark-shell "$@" --class org.apache.spark.repl.Main
57+
$FWDIR/bin/spark-submit --class org.apache.spark.repl.Main "${SUBMISSION_OPTS[@]}" spark-shell "${APPLICATION_OPTS[@]}"
5058
stty icanon echo > /dev/null 2>&1
5159
else
5260
export SPARK_SUBMIT_OPTS
53-
$FWDIR/bin/spark-submit spark-shell "$@" --class org.apache.spark.repl.Main
61+
$FWDIR/bin/spark-submit --class org.apache.spark.repl.Main "${SUBMISSION_OPTS[@]}" spark-shell "${APPLICATION_OPTS[@]}"
5462
fi
5563
}
5664

bin/utils.sh

Lines changed: 59 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,59 @@
1+
#!/usr/bin/env bash
2+
3+
#
4+
# Licensed to the Apache Software Foundation (ASF) under one or more
5+
# contributor license agreements. See the NOTICE file distributed with
6+
# this work for additional information regarding copyright ownership.
7+
# The ASF licenses this file to You under the Apache License, Version 2.0
8+
# (the "License"); you may not use this file except in compliance with
9+
# the License. You may obtain a copy of the License at
10+
#
11+
# http://www.apache.org/licenses/LICENSE-2.0
12+
#
13+
# Unless required by applicable law or agreed to in writing, software
14+
# distributed under the License is distributed on an "AS IS" BASIS,
15+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
16+
# See the License for the specific language governing permissions and
17+
# limitations under the License.
18+
#
19+
20+
# Gather all spark-submit options into SUBMISSION_OPTS
21+
function gatherSparkSubmitOpts() {
22+
23+
if [ -z "$SUBMIT_USAGE_FUNCTION" ]; then
24+
echo "Function for printing usage of $0 is not set." 1>&2
25+
echo "Please set usage function to shell variable 'SUBMIT_USAGE_FUNCTION' in $0" 1>&2
26+
exit 1
27+
fi
28+
29+
# NOTE: If you add or remove spark-submit options,
30+
# modify NOT ONLY this script but also SparkSubmitArguments.scala
31+
SUBMISSION_OPTS=()
32+
APPLICATION_OPTS=()
33+
while (($#)); do
34+
case "$1" in
35+
--master | --deploy-mode | --class | --name | --jars | --py-files | --files | \
36+
--conf | --properties-file | --driver-memory | --driver-java-options | \
37+
--driver-library-path | --driver-class-path | --executor-memory | --driver-cores | \
38+
--total-executor-cores | --executor-cores | --queue | --num-executors | --archives)
39+
if [[ $# -lt 2 ]]; then
40+
"$SUBMIT_USAGE_FUNCTION"
41+
exit 1;
42+
fi
43+
SUBMISSION_OPTS+=("$1"); shift
44+
SUBMISSION_OPTS+=("$1"); shift
45+
;;
46+
47+
--verbose | -v | --supervise)
48+
SUBMISSION_OPTS+=("$1"); shift
49+
;;
50+
51+
*)
52+
APPLICATION_OPTS+=("$1"); shift
53+
;;
54+
esac
55+
done
56+
57+
export SUBMISSION_OPTS
58+
export APPLICATION_OPTS
59+
}

core/src/main/scala/org/apache/spark/deploy/SparkSubmitArguments.scala

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -206,6 +206,10 @@ private[spark] class SparkSubmitArguments(args: Seq[String]) {
206206

207207
parse(opts)
208208

209+
/**
210+
* NOTE: If you add or remove spark-submit options,
211+
* modify NOT ONLY this file but also utils.sh
212+
*/
209213
def parse(opts: Seq[String]): Unit = opts match {
210214
case ("--name") :: value :: tail =>
211215
name = value

python/pyspark/java_gateway.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -38,7 +38,7 @@ def launch_gateway():
3838
submit_args = os.environ.get("PYSPARK_SUBMIT_ARGS")
3939
submit_args = submit_args if submit_args is not None else ""
4040
submit_args = shlex.split(submit_args)
41-
command = [os.path.join(SPARK_HOME, script), "pyspark-shell"] + submit_args
41+
command = [os.path.join(SPARK_HOME, script)] + submit_args + ["pyspark-shell"]
4242
if not on_windows:
4343
# Don't send ctrl-c / SIGINT to the Java gateway:
4444
def preexec_func():

0 commit comments

Comments
 (0)