Skip to content

Commit baa8ad5

Browse files
committed
Code review feedback.
1 parent f081d47 commit baa8ad5

File tree

4 files changed

+31
-27
lines changed

4 files changed

+31
-27
lines changed

python/pyspark/sql/__init__.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -46,7 +46,7 @@
4646

4747
def since(version):
4848
"""
49-
Annotates a function to append the version of Spark the function was added.
49+
A decorator that annotates a function to append the version of Spark the function was added.
5050
"""
5151
import re
5252
indent_p = re.compile(r'\n( +)')

python/pyspark/sql/context.py

Lines changed: 17 additions & 9 deletions
Original file line number | Diff line number | Diff line change
@@ -198,8 +198,8 @@ def _inferSchema(self, rdd, samplingRatio=None):
198198
raise ValueError("The first row in RDD is empty, "
199199
"can not infer schema")
200200
if type(first) is dict:
201-
warnings.warn("Using RDD of dict to inferSchema is deprecated,"
202-
"please use pyspark.sql.Row instead", DeprecationWarning)
201+
warnings.warn("Using RDD of dict to inferSchema is deprecated. "
202+
"Use pyspark.sql.Row instead")
203203

204204
if samplingRatio is None:
205205
schema = _infer_schema(first)
@@ -222,8 +222,7 @@ def inferSchema(self, rdd, samplingRatio=None):
222222
"""
223223
.. note:: Deprecated in 1.3, use :func:`createDataFrame` instead.
224224
"""
225-
warnings.warn(
226-
"inferSchema is deprecated, please use createDataFrame instead.", DeprecationWarning)
225+
warnings.warn("inferSchema is deprecated, please use createDataFrame instead.")
227226

228227
if isinstance(rdd, DataFrame):
229228
raise TypeError("Cannot apply schema to DataFrame")
@@ -235,8 +234,7 @@ def applySchema(self, rdd, schema):
235234
"""
236235
.. note:: Deprecated in 1.3, use :func:`createDataFrame` instead.
237236
"""
238-
warnings.warn(
239-
"applySchema is deprecated, please use createDataFrame instead", DeprecationWarning)
237+
warnings.warn("applySchema is deprecated, please use createDataFrame instead")
240238

241239
if isinstance(rdd, DataFrame):
242240
raise TypeError("Cannot apply schema to DataFrame")
@@ -369,8 +367,11 @@ def parquetFile(self, *paths):
369367
"""Loads a Parquet file, returning the result as a :class:`DataFrame`.
370368
371369
.. note:: Deprecated in 1.4, use :func:`DataFrameReader.parquet` instead.
370+
371+
>>> sqlContext.parquetFile('python/test_support/sql/parquet_partitioned').dtypes
372+
[('name', 'string'), ('year', 'int'), ('month', 'int'), ('day', 'int')]
372373
"""
373-
warnings.warn("parquetFile is deprecated. Use read.parquet() instead.", DeprecationWarning)
374+
warnings.warn("parquetFile is deprecated. Use read.parquet() instead.")
374375
gateway = self._sc._gateway
375376
jpaths = gateway.new_array(gateway.jvm.java.lang.String, len(paths))
376377
for i in range(0, len(paths)):
@@ -382,8 +383,11 @@ def jsonFile(self, path, schema=None, samplingRatio=1.0):
382383
"""Loads a text file storing one JSON object per line as a :class:`DataFrame`.
383384
384385
.. note:: Deprecated in 1.4, use :func:`DataFrameReader.json` instead.
386+
387+
>>> sqlContext.jsonFile('python/test_support/sql/people.json').dtypes
388+
[('age', 'bigint'), ('name', 'string')]
385389
"""
386-
warnings.warn("jsonFile is deprecated. Use read.json() instead.", DeprecationWarning)
390+
warnings.warn("jsonFile is deprecated. Use read.json() instead.")
387391
if schema is None:
388392
df = self._ssql_ctx.jsonFile(path, samplingRatio)
389393
else:
@@ -440,7 +444,7 @@ def load(self, path=None, source=None, schema=None, **options):
440444
441445
.. note:: Deprecated in 1.4, use :func:`DataFrameReader.load` instead.
442446
"""
443-
warnings.warn("load is deprecated. Use read.load() instead.", DeprecationWarning)
447+
warnings.warn("load is deprecated. Use read.load() instead.")
444448
return self.read.load(path, source, schema, **options)
445449

446450
@since(1.3)
@@ -621,10 +625,14 @@ def register(self, name, f, returnType=StringType()):
621625

622626

623627
def _test():
628+
import os
624629
import doctest
625630
from pyspark.context import SparkContext
626631
from pyspark.sql import Row, SQLContext
627632
import pyspark.sql.context
633+
634+
os.chdir(os.environ["SPARK_HOME"])
635+
628636
globs = pyspark.sql.context.__dict__.copy()
629637
sc = SparkContext('local[4]', 'PythonTest')
630638
globs['sc'] = sc

python/pyspark/sql/dataframe.py

Lines changed: 8 additions & 12 deletions
Original file line number | Diff line number | Diff line change
@@ -125,8 +125,7 @@ def saveAsParquetFile(self, path):
125125
126126
.. note:: Deprecated in 1.4, use :func:`DataFrameWriter.parquet` instead.
127127
"""
128-
warnings.warn(
129-
"saveAsParquetFile is deprecated. Use write.parquet() instead.", DeprecationWarning)
128+
warnings.warn("saveAsParquetFile is deprecated. Use write.parquet() instead.")
130129
self._jdf.saveAsParquetFile(path)
131130

132131
@since(1.3)
@@ -147,25 +146,23 @@ def registerAsTable(self, name):
147146
"""
148147
.. note:: Deprecated in 1.4, use :func:`registerTempTable` instead.
149148
"""
150-
warnings.warn("Use registerTempTable instead of registerAsTable.", DeprecationWarning)
149+
warnings.warn("Use registerTempTable instead of registerAsTable.")
151150
self.registerTempTable(name)
152151

153152
def insertInto(self, tableName, overwrite=False):
154153
"""Inserts the contents of this :class:`DataFrame` into the specified table.
155154
156155
.. note:: Deprecated in 1.4, use :func:`DataFrameWriter.insertInto` instead.
157156
"""
158-
warnings.warn(
159-
"insertInto is deprecated. Use write.insertInto() instead.", DeprecationWarning)
157+
warnings.warn("insertInto is deprecated. Use write.insertInto() instead.")
160158
self.write.insertInto(tableName, overwrite)
161159

162160
def saveAsTable(self, tableName, source=None, mode="error", **options):
163161
"""Saves the contents of this :class:`DataFrame` to a data source as a table.
164162
165163
.. note:: Deprecated in 1.4, use :func:`DataFrameWriter.saveAsTable` instead.
166164
"""
167-
warnings.warn(
168-
"insertInto is deprecated. Use write.saveAsTable() instead.", DeprecationWarning)
165+
warnings.warn("insertInto is deprecated. Use write.saveAsTable() instead.")
169166
self.write.saveAsTable(tableName, source, mode, **options)
170167

171168
@since(1.3)
@@ -174,8 +171,7 @@ def save(self, path=None, source=None, mode="error", **options):
174171
175172
.. note:: Deprecated in 1.4, use :func:`DataFrameWriter.save` instead.
176173
"""
177-
warnings.warn(
178-
"insertInto is deprecated. Use write.save() instead.", DeprecationWarning)
174+
warnings.warn("insertInto is deprecated. Use write.save() instead.")
179175
return self.write.save(path, source, mode, **options)
180176

181177
@property
@@ -629,9 +625,9 @@ def describe(self, *cols):
629625
def head(self, n=None):
630626
"""Returns the first ``n`` rows.
631627
632-
If n is greater than 1, return a list of :class:`Row`. If n is 1, return a single Row.
633-
634-
:param n: int, default 1.
628+
:param n: int, default 1. Number of rows to return.
629+
:return: If n is greater than 1, return a list of :class:`Row`.
630+
If n is 1, return a single Row.
635631
636632
>>> df.head()
637633
Row(age=2, name=u'Alice')

python/run-tests

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -70,13 +70,13 @@ function run_core_tests() {
7070

7171
function run_sql_tests() {
7272
echo "Run sql tests ..."
73-
run_test "pyspark.sql.readwriter"
7473
run_test "pyspark.sql.types"
7574
run_test "pyspark.sql.context"
7675
run_test "pyspark.sql.column"
7776
run_test "pyspark.sql.dataframe"
7877
run_test "pyspark.sql.group"
7978
run_test "pyspark.sql.functions"
79+
run_test "pyspark.sql.readwriter"
8080
run_test "pyspark.sql.window"
8181
run_test "pyspark.sql.tests"
8282
}
@@ -142,11 +142,11 @@ fi
142142
echo "Testing with Python version:"
143143
$PYSPARK_PYTHON --version
144144

145-
#run_core_tests
145+
run_core_tests
146146
run_sql_tests
147-
#run_mllib_tests
148-
#run_ml_tests
149-
#run_streaming_tests
147+
run_mllib_tests
148+
run_ml_tests
149+
run_streaming_tests
150150

151151
# Try to test with Python 3
152152
if [ $(which python3.4) ]; then

0 commit comments

Comments
 (0)