-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathprogram 5.scala
More file actions
23 lines (17 loc) · 861 Bytes
/
Copy pathprogram 5.scala
File metadata and controls
23 lines (17 loc) · 861 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
// Databricks notebook source
// Counts reviews per business and lists the businesses whose second field
// mentions "TX", ordered by review count (highest first).
// All inputs are '^'-delimited text files read as RDDs of lines.
// NOTE(review): field meanings are inferred from the column names used below
// (business field 0 = id, field 1 = address; review field 2 = business id) —
// confirm against the actual file layout.
val business = sc.textFile("/FileStore/tables/bhv9wv0j1489262645388/business.csv")
val review = sc.textFile("/FileStore/tables/4vo8z2wf1489262685677/review.csv")
// NOTE(review): `user` is not used anywhere in this cell; it is kept only in
// case another notebook cell references it.
val user = sc.textFile("/FileStore/tables/bexocdw61489262747888/user.csv")

// (id, address) pairs for businesses whose address contains "TX".
// The length check skips blank/short rows, which would otherwise throw
// ArrayIndexOutOfBoundsException inside the Spark task and fail the job.
val businessData = business.map(_.split("\\^"))
  .filter(fields => fields.length > 1 && fields(1).contains("TX"))
  .map(fields => (fields(0), fields(1)))

// (business id, number of reviews); rows with fewer than three fields are
// skipped for the same reason as above.
val reviewData = review.map(_.split("\\^"))
  .filter(_.length > 2)
  .map(fields => (fields(2), 1))
  .reduceByKey(_ + _)

val busDF = businessData.toDF("id", "address")
val reviewDF = reviewData.toDF("id", "count")

// Inner join on "id" keeps only businesses that have at least one review.
// distinct() collapses identical (id, count, address) rows that arise when the
// business file lists the same business more than once.
val output = reviewDF.join(busDF, "id")
  .distinct()
  .sort($"count".desc)
display(output)
// COMMAND ----------