Skip to content

Instantly share code, notes, and snippets.

@nbest937
nbest937 / sparkSessionOnEMR.scala
Last active October 3, 2018 22:11 — forked from dyno/sparkSessionOnEMR.scala
Working with SparkSession with Ammonite on AWS EMR
// =============================================================================
// emr.sc -- import it in predef.sc
import ammonite.ops._
// add emr jars and config dir to interp class path
//
def loadEmrJars() = {
// /etc/zeppelin/conf/zeppelin-env.sh
val libDirs = List( //
"/usr/lib/hadoop-lzo/lib",
"/usr/lib/spark/jars",
# Attach the packages used by this script, in this order (later attachments can
# mask same-named functions from earlier ones).
# NOTE(review): presumably maps/geosphere/sp serve the map drawing and
# great-circle geometry, plyr the aggregation and ggplot2 the plotting --
# confirm against the rest of the script, which is not visible here.
library(maps)
library(geosphere)
library(plyr)
library(ggplot2)
library(sp)
# Download the airports table from a remote CSV. header=TRUE takes column names
# from the first row; as.is=TRUE keeps character columns as plain strings
# instead of converting them to factors.
airports <- read.csv("http://www.stanford.edu/~cengel/cgi-bin/anthrospace/wp-content/uploads/2012/03/airports.csv", as.is=TRUE, header=TRUE)
# Download the flights table the same way.
# NOTE(review): the file name suggests an OpenFlights export for PEK dated
# 2012-03-19 -- confirm the schema before relying on specific column names.
flights <- read.csv("http://www.stanford.edu/~cengel/cgi-bin/anthrospace/wp-content/uploads/2012/03/PEK-openflights-export-2012-03-19.csv", as.is=TRUE, header=TRUE)
# aggregate number of flights