3131 import unittest
3232
3333from pyspark .tests import ReusedPySparkTestCase as PySparkTestCase
34- from pyspark .sql import DataFrame , SQLContext
34+ from pyspark .sql import DataFrame , SQLContext , Row
3535from pyspark .sql .functions import rand
3636from pyspark .ml .evaluation import RegressionEvaluator
3737from pyspark .ml .param import Param , Params
@@ -258,7 +258,7 @@ def test_idf(self):
258258 def test_ngram (self ):
259259 sqlContext = SQLContext (self .sc )
260260 dataset = sqlContext .createDataFrame ([
261- ([[ "a" , "b" , "c" , "d" , "e" ]])], [ "input" ])
261+ Row ( input = [ "a" , "b" , "c" , "d" , "e" ]) ])
262262 ngram0 = NGram (n = 4 , inputCol = "input" , outputCol = "output" )
263263 self .assertEqual (ngram0 .getN (), 4 )
264264 self .assertEqual (ngram0 .getInputCol (), "input" )
@@ -268,9 +268,7 @@ def test_ngram(self):
268268
269269 def test_stopwordsremover (self ):
270270 sqlContext = SQLContext (self .sc )
271- data = ["a" , "panda" ]
272- dataset = sqlContext .createDataFrame ([
273- ([data ])], ["input" ])
271+ dataset = sqlContext .createDataFrame ([Row (input = ["a" , "panda" ])])
274272 stopWordRemover = StopWordsRemover (inputCol = "input" , outputCol = "output" )
275273 # Default
276274 self .assertEquals (stopWordRemover .getInputCol (), "input" )
0 commit comments