Skip to content

Commit 7cc0943

Browse files
author
James Lee
committed
adapt UkMakerSpaces
1 parent 96f979a commit 7cc0943

File tree

2 files changed

+30
-36
lines changed

2 files changed

+30
-36
lines changed

src/main/scala/com/sparkTutorial/sparkSql/join/UkMakerSpaces.java

Lines changed: 0 additions & 36 deletions
This file was deleted.
Lines changed: 30 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,30 @@
1+
package com.sparkTutorial.sparkSql.join
2+
3+
import org.apache.log4j.{Level, Logger}
4+
import org.apache.spark.sql.{SparkSession, functions}
5+
6+
/** Spark SQL example that joins UK makerspace records to postcode rows.
  *
  * Reads two CSV files (both with a header row), prints a preview of each,
  * left-outer-joins makerspaces to postcode rows by postcode prefix, and
  * prints the number of joined rows per `Region`.
  */
object UkMakerSpaces {

  /** Runs the job against a local Spark master using all available cores.
    *
    * @param args command-line arguments; not read by this job
    */
  def main(args: Array[String]): Unit = {

    // Only log ERROR and above for loggers under the "org" namespace.
    Logger.getLogger("org").setLevel(Level.ERROR)

    val session = SparkSession.builder().appName("UkMakerSpaces").master("local[*]").getOrCreate()

    // Always release the session, even when a read, join or show fails.
    try {
      val makerSpace = session.read.option("header", "true").csv("in/uk-makerspaces-identifiable-data.csv")

      // A single space is appended to every value of the postcode column before
      // it is used as a prefix in the join below.
      // NOTE(review): presumably this prevents a short prefix (e.g. "W1") from
      // also matching longer districts (e.g. "W10 ...") -- confirm against data.
      val postCode = session.read.option("header", "true").csv("in/uk-postcode.csv")
        .withColumn("PostCode", functions.concat_ws("", functions.col("PostCode"), functions.lit(" ")))

      println("=== Print 20 records of makerspace table ===")
      makerSpace.show()

      println("=== Print 20 records of postcode table ===")
      postCode.show()

      // Left outer join: every makerspace row is kept; a postcode row is attached
      // when the makerspace postcode starts with the (space-suffixed) prefix.
      val joined = makerSpace.join(
        postCode,
        makerSpace.col("Postcode").startsWith(postCode.col("Postcode")),
        "left_outer"
      )

      println("=== Group by Region ===")
      joined.groupBy("Region").count().show(200)
    } finally {
      session.stop()
    }
  }
}

0 commit comments

Comments
 (0)