Skip to content

Commit c6a3a82

Browse files
author
Pedro Bernardo
committed
Added pairRdd/create/*.py
1 parent a2068e7 commit c6a3a82

File tree

2 files changed

+23
-0
lines changed

2 files changed

+23
-0
lines changed
Lines changed: 12 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,12 @@
"""Create a pair RDD from a regular RDD of space-separated strings and save it as text."""
from pyspark import SparkContext


def to_pair(record):
    """Return the first two space-separated fields of *record* as a tuple.

    Both fields are kept as strings. The record is split only once rather
    than once per field.
    """
    fields = record.split(" ")
    return (fields[0], fields[1])


def main():
    """Build the pair RDD from the sample strings and write it under ``out/``."""
    sc = SparkContext("local", "create")
    try:
        sc.setLogLevel("ERROR")

        input_strings = ["Lily 23", "Jack 29", "Mary 29", "James 8"]
        regular_rdd = sc.parallelize(input_strings)

        pair_rdd = regular_rdd.map(to_pair)
        # Collapse to a single partition before saving the output.
        pair_rdd.coalesce(1).saveAsTextFile("out/pair_rdd_from_regular_rdd")
    finally:
        # Always release the Spark context, even if the job above fails.
        sc.stop()


if __name__ == "__main__":
    main()
Lines changed: 11 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,11 @@
"""Create a pair RDD directly from a list of tuples and save it as text."""
from pyspark import SparkContext


def main():
    """Parallelize the sample ``(name, number)`` tuples and write them under ``out/``."""
    sc = SparkContext("local", "create")
    try:
        sc.setLogLevel("ERROR")

        tuples = [("Lily", 23), ("Jack", 29), ("Mary", 29), ("James", 8)]
        pair_rdd = sc.parallelize(tuples)

        # Collapse to a single partition before saving the output.
        pair_rdd.coalesce(1).saveAsTextFile("out/pair_rdd_from_tuple_list")
    finally:
        # Always release the Spark context, even if the job above fails.
        sc.stop()


if __name__ == "__main__":
    main()

0 commit comments

Comments
 (0)