Skip to content

Instantly share code, notes, and snippets.

@rishav-rohit
rishav-rohit / ImcdpAvgDriver.java
Last active January 1, 2016 10:49
In-mapper combiner MapReduce program to calculate an average
package com.hadoop.imcdp;
import java.io.IOException;
import java.util.HashMap;
import java.util.Iterator;
import java.util.Map;
import java.util.Map.Entry;
import java.util.Set;
import org.apache.hadoop.conf.Configuration;
@rishav-rohit
rishav-rohit / AvgDriver.java
Last active December 3, 2022 01:21
MapReduce program to calculate an average (without a combiner)
package com.hadoop.imcdp;
import java.io.IOException;
import java.util.HashMap;
import java.util.Iterator;
import java.util.Map;
import java.util.Map.Entry;
import java.util.Set;
import org.apache.hadoop.conf.Configuration;
{"id":"A91D021BA58444B29D4D42CA5E39F7BF","student_id":100,"university_id":908,"course_details":{"course_id":100,"enroll_date":"2012-02-13 00:00:00.000000000","verb":"completed","result_score":0.9}}
{"id":"502A77CC99B241CB94CA356F5218F1A9","student_id":101,"university_id":112,"course_details":{"course_id":233,"enroll_date":"2011-06-08 00:00:00.000000000","verb":"started","result_score":0.65}}
{"id":"5D04CD5ABF014D6EBA237766F9B470DE","student_id":102,"university_id":340,"course_details":{"course_id":339,"enroll_date":"2012-03-06 00:00:00.000000000","verb":"started","result_score":0.57}}
{
"namespace": "com.rishav.avro",
"type": "record",
"name": "StudentActivity",
"fields": [
{
"name": "id",
"type": "string"
},
{
$ java -jar avro-tools-1.7.5.jar
Version 1.7.5 of Apache Avro
Copyright 2010 The Apache Software Foundation
This product includes software developed at
The Apache Software Foundation (http://www.apache.org/).
C JSON parsing provided by Jansson and
written by Petri Lehtinen. The original software is
available from http://www.digip.org/jansson/.
package com.rishav.avro;
import java.io.File;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.util.Iterator;
import java.util.LinkedHashMap;
import org.apache.avro.Schema;
package com.rishav.avro;
import java.io.File;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.util.Iterator;
import java.util.LinkedHashMap;
import org.apache.avro.Schema;
{
"namespace": "com.rishav.avro",
"type": "record",
"name": "StudentActivity",
"fields": [
{
"name": "id",
"type": "string"
},
{
package com.rishav.avro;
import java.io.File;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.util.Iterator;
import java.util.LinkedHashMap;
import org.apache.avro.Schema;
package com.hadoop.imcdp;
import java.io.*;
import java.util.Set;
import java.lang.Integer;
import org.apache.hadoop.io.*;
public class IntPair implements WritableComparable<IntPair>{
private IntWritable first;