Skip to content

Instantly share code, notes, and snippets.

View sujee's full-sized avatar

Sujee Maniyam sujee

View GitHub Profile
// MembaseTest3
package tutorial;
import java.net.InetSocketAddress;
import java.util.concurrent.TimeUnit;
import net.spy.memcached.MemcachedClient;
/**
* simulates writing / reading from two different clients
// MembaseTest1
package tutorial;
import java.net.InetSocketAddress;
import net.spy.memcached.MemcachedClient;
/**
* Write / Read from Membase
*
* @author sujee
*
// MembaseTest2
package tutorial;
import java.net.InetSocketAddress;
import net.spy.memcached.MemcachedClient;
/**
* simulates writing / reading from two different clients
*/
public class MembaseTest2
...
...
long t2 = System.currentTimeMillis();
cache.shutdown(10, TimeUnit.SECONDS); // graceful shutdown
System.out.println("Time for " + MAX + " puts is " + (t2 - t1) + " ms");
// open another connection
cache = new MemcachedClient(new InetSocketAddress(server, port));
...
...
@sujee
sujee / amazon-emr-compile.sh
Created January 2, 2011 05:13
amazon-emr-compile.sh : compile script to create a single JAR for Amazon EMR
#!/bin/bash
## http://sujee.net/tech/articles/amazon-emr-beyond-basics/
CLASS_DIR=classes
mkdir -p $CLASS_DIR
rm -rf $CLASS_DIR/*
# compile
@sujee
sujee / amazon-emr-testMR.java
Created January 2, 2011 05:29
TestMR.java : basic map reduce program that takes input path as an argument
/**
* http://sujee.net/tech/articles/amazon-emr-beyond-basics/
* takes one argument for input path
*/
public class TestMR extends Configured implements Tool
{
public static void main(String[] args) throws Exception
{
int res = ToolRunner.run(new Configuration(), new TestMR(), args);
@sujee
sujee / run-emr-testMR.sh
Created January 2, 2011 05:40
run-emr-TestMR.sh : launches an MR job on EMR
#!/bin/bash
## http://sujee.net/tech/articles/amazon-emr-beyond-basics/
# config
# if changing machine type, also change mapred config file
MASTER_INSTANCE_TYPE="m1.large"
SLAVE_INSTANCE_TYPE="c1.xlarge"
INSTANCES=5
export JOBNAME="MyMR"
export TIMESTAMP=$(date +%Y%m%d-%H%M%S)
@sujee
sujee / emr-wait-for-completion.sh
Created January 2, 2011 07:14
emr-wait-for-completion.sh
#!/bin/bash
## http://sujee.net/tech/articles/amazon-emr-beyond-basics/
echo "=== $JOBID started...."
LOGDIR="/var/logs/hadoop-logs/${JOBNAME}__${JOBID}__${TIMESTAMP}"
mkdir -p "${LOGDIR}"
## the code below waits until the job is done
@sujee
sujee / job-status-parse.rb
Created January 3, 2011 07:07
job-status-parse.rb
require 'rubygems'
require 'json'
a = JSON::parse(ARGF.read)
#p a
p a["JobFlows"][0]["ExecutionStatusDetail"]["State"]
@sujee
sujee / ParseProperties.java
Created January 30, 2011 07:11
ParseProperties.java
package amazonemr;
import java.net.URI;
import java.util.Enumeration;
import java.util.Properties;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.conf.Configured;
import org.apache.hadoop.fs.FSDataInputStream;
import org.apache.hadoop.fs.FileSystem;