Skip to content

Instantly share code, notes, and snippets.

import org.apache.spark.{SparkConf, SparkContext}
import org.apache.spark.streaming.kafka._
import org.apache.spark.streaming.{Seconds, StreamingContext}
import org.apache.log4j.Logger
import org.apache.log4j.Level
/** KafkaThree - Spark Streaming app that finds bigrams in log data arriving through a Kafka broker. */
object KafkaThree {
def main(args: Array[String]): Unit = {
@hardkap
hardkap / KafkaIndexed.scala
Created January 17, 2017 06:15
Spark Streaming with Kafka, Solr and Indexed RDD.
import org.apache.spark.{SparkConf, SparkContext}
import org.apache.spark.sql.SQLContext
import org.apache.spark.streaming.kafka._
import org.apache.spark.streaming.{Seconds, StreamingContext}
import edu.berkeley.cs.amplab.spark.indexedrdd.IndexedRDD
import edu.berkeley.cs.amplab.spark.indexedrdd.IndexedRDD._
import org.apache.log4j.Logger
import org.apache.log4j.Level
/** KafkaIndexed - Finds bigrams in log data arriving through a Kafka broker. */