@sreejithpillai
Created November 24, 2014 15:41
/*
* Copyright 2014 Sreejith Pillai
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.sreejith.loganalyzer.mapreduce;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
public class LogDriver {

    public static void main(String[] args) throws Exception {
        Job job = new Job();
        job.setJarByClass(LogDriver.class);
        job.setJobName("Log Analyzer");

        job.setMapperClass(LogMapper.class);
        job.setPartitionerClass(LogPartitioner.class);
        // The reducer doubles as a combiner to pre-aggregate hourly counts on the map side.
        job.setCombinerClass(LogReducer.class);
        job.setReducerClass(LogReducer.class);
        // LogPartitioner splits keys into two buckets, so two reduce tasks are needed.
        job.setNumReduceTasks(2);

        job.setOutputKeyClass(IntWritable.class);
        job.setOutputValueClass(IntWritable.class);

        FileInputFormat.addInputPath(job, new Path(args[0]));
        FileOutputFormat.setOutputPath(job, new Path(args[1]));

        job.waitForCompletion(true);
    }
}
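The driver discards the boolean returned by waitForCompletion. A common variant (a sketch, not part of the original gist) propagates it as the process exit code so calling scripts can detect a failed job:

    System.exit(job.waitForCompletion(true) ? 0 : 1);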
/*
* Copyright 2014 Sreejith Pillai
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.sreejith.loganalyzer.mapreduce;
import java.io.IOException;
import java.text.ParseException;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Mapper;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import com.sreejith.loganalyzer.parser.ParseLog;
public class LogMapper extends
        Mapper<LongWritable, Text, IntWritable, IntWritable> {

    private static Logger logger = LoggerFactory.getLogger(LogMapper.class);
    private IntWritable hour = new IntWritable();
    private final static IntWritable one = new IntWritable(1);
    private static Pattern logPattern = Pattern
            .compile("([^ ]*) ([^ ]*) ([^ ]*) \\[([^]]*)\\]"
                    + " \"([^\"]*)\""
                    + " ([^ ]*) ([^ ]*).*");

    @Override
    public void map(LongWritable key, Text value, Context context)
            throws InterruptedException, IOException {
        logger.info("Mapper started");
        String line = value.toString();
        Matcher matcher = logPattern.matcher(line);
        if (matcher.matches()) {
            String timestamp = matcher.group(4);
            try {
                hour.set(ParseLog.getHour(timestamp));
            } catch (ParseException e) {
                // Skip records whose timestamp cannot be parsed rather than
                // emitting a stale hour value.
                logger.warn("Exception", e);
                return;
            }
            context.write(hour, one);
        }
        logger.info("Mapper completed");
    }
}
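The regular expression above expects lines in the Apache access log format; capture group 4 is the bracketed timestamp that ParseLog.getHour (a helper from this project, not included in this gist) converts into an hour of the day. A minimal standalone sketch of what the pattern captures, using a made-up sample line:

import java.util.regex.Matcher;
import java.util.regex.Pattern;

public class LogPatternDemo {
    // Same pattern string as LogMapper; the log line below is illustrative only.
    private static final Pattern LOG_PATTERN = Pattern.compile(
            "([^ ]*) ([^ ]*) ([^ ]*) \\[([^]]*)\\]"
            + " \"([^\"]*)\""
            + " ([^ ]*) ([^ ]*).*");

    public static void main(String[] args) {
        String line = "127.0.0.1 - frank [10/Oct/2000:13:55:36 -0700] "
                + "\"GET /apache_pb.gif HTTP/1.0\" 200 2326";
        Matcher matcher = LOG_PATTERN.matcher(line);
        if (matcher.matches()) {
            System.out.println(matcher.group(4)); // 10/Oct/2000:13:55:36 -0700
            System.out.println(matcher.group(6)); // 200 (HTTP status)
        }
    }
}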
/*
* Copyright 2014 Sreejith Pillai
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.sreejith.loganalyzer.mapreduce;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.mapreduce.Partitioner;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
public class LogPartitioner extends Partitioner<IntWritable, IntWritable> {

    private static Logger logger = LoggerFactory.getLogger(LogPartitioner.class);

    @Override
    public int getPartition(IntWritable key, IntWritable value, int numReduceTasks) {
        logger.info("Partitioner started");
        int intKey = key.get();
        // Hours 08-18 go to partition 1, all other hours to partition 0,
        // which assumes the job runs with (at least) two reduce tasks.
        if (intKey >= 8 && intKey <= 18) {
            return 1;
        } else {
            return 0;
        }
    }
}
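A quick way to see the routing is to call getPartition directly (the demo class below is illustrative and assumes it sits in the same package as LogPartitioner): hours 8 through 18 land in partition 1 and every other hour in partition 0, matching the two reduce tasks configured in LogDriver.

import org.apache.hadoop.io.IntWritable;

public class LogPartitionerDemo {
    public static void main(String[] args) {
        LogPartitioner partitioner = new LogPartitioner();
        IntWritable one = new IntWritable(1);
        System.out.println(partitioner.getPartition(new IntWritable(9), one, 2));  // 1
        System.out.println(partitioner.getPartition(new IntWritable(18), one, 2)); // 1
        System.out.println(partitioner.getPartition(new IntWritable(3), one, 2));  // 0
    }
}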
/*
* Copyright 2014 Sreejith Pillai
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.sreejith.loganalyzer.mapreduce;
import java.io.IOException;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.mapreduce.Reducer;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
public class LogReducer extends
        Reducer<IntWritable, IntWritable, IntWritable, IntWritable> {

    private static Logger logger = LoggerFactory.getLogger(LogReducer.class);

    @Override
    public void reduce(IntWritable key, Iterable<IntWritable> values,
            Context context) throws IOException, InterruptedException {
        logger.info("Reducer started");
        int sum = 0;
        for (IntWritable value : values) {
            sum = sum + value.get();
        }
        context.write(key, new IntWritable(sum));
        logger.info("Reducer completed");
    }
}
@sudarshanGit

Hi, I am running an application that reads records from HBase and writes them into text files.

I use a combiner and a custom partitioner. I use 41 reducers because I need to create 40 reducer output files that satisfy the condition in my custom partitioner.

Everything works fine, but when I use the combiner the job creates one map output file per region, i.e. per mapper.

For example, I have 40 regions, so 40 mappers are started and 40 map-output files are created. The reducers do not combine all of the map outputs into the final reducer output, which should be 40 reducer output files.

The data in the files is correct, but the number of files has increased.

Any idea how I can get only the reducer output files?
