|
36 | 36 | python_right_outer_join, python_cogroup |
37 | 37 | from pyspark.statcounter import StatCounter |
38 | 38 | from pyspark.rddsampler import RDDSampler |
| 39 | +from pyspark.storagelevel import StorageLevel |
39 | 40 |
|
40 | 41 | from py4j.java_collections import ListConverter, MapConverter |
41 | 42 |
|
@@ -1119,6 +1120,47 @@ def zip(self, other): |
1119 | 1120 | other._jrdd_deserializer) |
1120 | 1121 | return RDD(pairRDD, self.ctx, deserializer) |
1121 | 1122 |
|
def name(self):
    """
    Return the name of this RDD.

    The value is read from the wrapped ``_jrdd`` object and encoded as
    UTF-8 before being returned. If the wrapped object reports no name
    (``None`` or an empty string), ``None`` is returned instead.
    """
    jvm_name = self._jrdd.name()
    return jvm_name.encode('utf-8') if jvm_name else None
| 1131 | + |
def setName(self, name):
    """
    Assign a name to this RDD.

    The name is forwarded unchanged to the wrapped ``_jrdd`` object;
    nothing is returned.

    >>> rdd1 = sc.parallelize([1,2])
    >>> rdd1.setName('RDD1')
    >>> rdd1.name()
    'RDD1'
    """
    java_rdd = self._jrdd
    java_rdd.setName(name)
| 1141 | + |
def toDebugString(self):
    """
    A description of this RDD and its recursive dependencies for debugging.

    The text is obtained from the wrapped ``_jrdd`` object and encoded as
    UTF-8. ``None`` is returned when the wrapped object yields ``None``
    or an empty string.
    """
    description = self._jrdd.toDebugString()
    if description:
        return description.encode('utf-8')
    return None
| 1150 | + |
def getStorageLevel(self):
    """
    Get the RDD's current storage level.

    Queries the wrapped ``_jrdd`` object for its storage level and copies
    the four properties it exposes (useDisk, useMemory, deserialized,
    replication) into a new Python ``StorageLevel``.

    >>> rdd1 = sc.parallelize([1,2])
    >>> rdd1.getStorageLevel()
    StorageLevel(False, False, False, 1)
    """
    jvm_level = self._jrdd.getStorageLevel()
    # Argument order mirrors the original call: disk, memory,
    # deserialized, replication.
    return StorageLevel(jvm_level.useDisk(),
                        jvm_level.useMemory(),
                        jvm_level.deserialized(),
                        jvm_level.replication())
1122 | 1164 |
|
1123 | 1165 | # TODO: `lookup` is disabled because we can't make direct comparisons based |
1124 | 1166 | # on the key; we need to compare the hash of the key to the hash of the |
|
0 commit comments