Taneli Saastamoinen tsaastam

## spark_21109.scala
// illustration of https://issues.apache.org/jira/browse/SPARK-21109
// see also https://lobotomys.blogspot.co.uk/2017/07/spark-union-column-order-issue.html

import org.apache.spark.rdd.RDD
import org.apache.spark.sql.Dataset
import org.apache.spark.sql.SQLContext
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.functions._

// if using spark-shell, skip the next 4 lines

## spark_dataframe_ndcg.scala
// Normalised Discounted Cumulative Gain (NDCG) for Spark DataFrames
// See e.g. https://en.wikipedia.org/wiki/Discounted_cumulative_gain
//
// To run this code in the Spark Shell:
//
// 1) https://spark.apache.org/ -> download a binary Spark distribution
// 2) ./bin/spark-shell
// 3) copy-paste this code into the shell prompt

import org.apache.spark.sql.expressions.UserDefinedAggregateFunction
	// illustration of https://issues.apache.org/jira/browse/SPARK-21109
	// see also https://lobotomys.blogspot.co.uk/2017/07/spark-union-column-order-issue.html

	import org.apache.spark.rdd.RDD
	import org.apache.spark.sql.Dataset
	import org.apache.spark.sql.SQLContext
	import org.apache.spark.sql.SparkSession
	import org.apache.spark.sql.functions._

	// if using spark-shell, skip the next 4 lines
	// Normalised Discounted Cumulative Gain (NDCG) for Spark DataFrames
	// See e.g. https://en.wikipedia.org/wiki/Discounted_cumulative_gain
	//
	// To run this code in the Spark Shell:
	//
	// 1) https://spark.apache.org/ -> download a binary Spark distribution
	// 2) ./bin/spark-shell
	// 3) copy-paste this code into the shell prompt

	import org.apache.spark.sql.expressions.UserDefinedAggregateFunction