Skip to content

Instantly share code, notes, and snippets.

@csbond007
Last active October 24, 2016 23:49
Show Gist options
  • Save csbond007/6a29076d4a1416d97ed2778ab9ad822f to your computer and use it in GitHub Desktop.
Save csbond007/6a29076d4a1416d97ed2778ab9ad822f to your computer and use it in GitHub Desktop.
import org.apache.spark.SparkContext
import org.apache.spark.SparkContext._
import org.apache.spark.SparkConf
import com.datastax.spark.connector._
/** Smoke-test Spark job.
  *
  * Runs two independent checks against the cluster and prints the results to stdout:
  *  1. a Monte Carlo estimate of Pi, to confirm that plain Spark tasks execute;
  *  2. a read of the Cassandra table `emrbots_data.emr_patientcorepopulated`,
  *     printing its row count and some details of its first row.
  */
object SampleApp {

  /** Program entry point.
    *
    * Creates a SparkContext using the hard-coded Mesos master and Cassandra
    * contact point, runs both checks, and always stops the context afterwards,
    * even when one of the jobs fails.
    *
    * @param args command-line arguments (unused)
    */
  def main(args: Array[String]): Unit = {
    // NOTE: on a Scala `object`, getClass.getSimpleName carries a trailing `$`
    // (i.e. "SampleApp$"); kept as-is so the registered application name does not change.
    val conf = new SparkConf(loadDefaults = true)
      .set("spark.cassandra.connection.host", "10.10.40.138")
      .setAppName(this.getClass.getSimpleName)
      .setMaster("mesos://zk://10.10.40.138:2181/mesos")
    val sc = new SparkContext(conf)

    // Everything that can fail runs inside try/finally so the context (and the
    // cluster resources behind it) is released on every exit path.
    try {
      // --- Check 1: Monte Carlo estimate of Pi --------------------------------
      // Sample points in the unit square; the fraction that falls inside the
      // quarter circle of radius 1 approximates Pi / 4.
      val numSamples = 1000000
      val insideCount = sc.parallelize(1 to numSamples).map { _ =>
        val x = Math.random()
        val y = Math.random()
        if (x * x + y * y < 1) 1 else 0
      }.reduce(_ + _)
      println("///////////////////// Pi is roughly " + 4.0 * insideCount / numSamples)

      // Progress marker between the two checks.
      val i = 1
      println("//////////////////////////////////")
      println(i)

      // --- Check 2: read from Cassandra ---------------------------------------
      val emrData = sc.cassandraTable("emrbots_data", "emr_patientcorepopulated")
      println("//////////////////////////////// emr_data.count() ///////////////////////")
      println(emrData.count())

      // take(1).headOption instead of first: `first` throws on an empty table.
      emrData.take(1).headOption match {
        case Some(firstRow) =>
          println("/////////////////////////// firstRow.size /////////////////////////////// ")
          println(firstRow.size)
          println("///////////////////////////////////////////// firstRow.getString(patientdateofbirth)////////")
          println(firstRow.getString("patientdateofbirth"))
        case None =>
          println("emrbots_data.emr_patientcorepopulated is empty; no first row to display")
      }

      // To dump every row (this pulls the whole table onto the driver):
      // emrData.collect().foreach(println)
    } finally {
      sc.stop()
    }
  }
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment