Skip to content

Instantly share code, notes, and snippets.

View krishnakalyan3's full-sized avatar

Krishna Kalyan krishnakalyan3

View GitHub Profile
package UDF;
import java.io.BufferedReader;
import java.io.FileReader;
import java.io.IOException;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import java.util.Map.Entry;
import java.util.regex.Matcher;
@krishnakalyan3
krishnakalyan3 / input
Created November 1, 2014 03:34
Input
1
2
3
4
1
1
1
@krishnakalyan3
krishnakalyan3 / Sum
Created November 1, 2014 03:43
Sum Operation
-- Load the input first: both sections below read relation A, so it must be
-- defined before the first GROUP (otherwise Pig reports an undefined alias).
A = load 'input' as (number:int);
-- Plain Sum: collect every row into a single group and total it.
B = group A All;
-- In B, $0 is the group key and $1 is the bag of grouped A tuples.
C = foreach B generate SUM($1);
dump C;
-- Group And Sum: one group per distinct number, then total each group.
B = group A by $0;
C = foreach B generate SUM($1);
dump C;
@krishnakalyan3
krishnakalyan3 / Cast
Created November 2, 2014 04:20
pig Cast
-- Load comma-delimited records from 'input'; no schema is declared, so
-- fields are referenced by position ($0, $1, ...).
A = load 'input' using PigStorage(',');
-- Range projection: keep every column from the second one ($1) onward,
-- i.e. drop only the first column.
B = foreach A generate $1..;
-- Suppose you need to cast the columns explicitly: $0, $3 and $4 become
-- chararray, $1 and $2 become int. Note that C is built from A, not from B.
C = FOREACH A generate (chararray)$0,(int)$1,(int)$2,(chararray)$3,(chararray)$4;
dump C;
@krishnakalyan3
krishnakalyan3 / HBase
Created November 2, 2014 04:34
Table with Sno|Name|Age
1|Krishna|23
2|Madhuri|37
3|Kalyan|54
4|Shobhana|50
@krishnakalyan3
krishnakalyan3 / Mapr
Created November 11, 2014 11:44
Ubuntu MapR Single Node
# Navigate to this Folder
cd /etc/apt
# Edit sources.list file and add the MapR repositories into it.
vi sources.list
# Add MapR repo entries below
deb http://package.mapr.com/releases/v2.1.2/ubuntu/ mapr optional
deb http://package.mapr.com/releases/ecosystem/ubuntu binary/
# Update repo
sudo apt-get update
# Install MapR Hadoop
@krishnakalyan3
krishnakalyan3 / ambari
Created December 10, 2014 23:44
Ambari
# FQDN
# Passwordless SSH, disable SELinux, iptables off
# NTP
# yum -y install ntp
# wget http://public-repo-1.hortonworks.com/ambari/centos6/1.x/updates/1.5.1/ambari.repo
# cp ambari.repo /etc/yum.repos.d
# yum install ambari-server
# ambari-server setup
# ambari-server start
# Open Ambari in a browser (username: admin, password: admin)
Vagrant::Config.run do |config|
config.vm.box = "centos65"
config.vm.customize [
"modifyvm", :id,
"--memory", "3427"
]
config.vm.define :hadoop1 do |hadoop1_config|
hadoop1_config.vm.network :hostonly, "10.10.0.53"
hadoop1_config.vm.host_name = "hdp.hadoop1.com"
@krishnakalyan3
krishnakalyan3 / host
Created December 11, 2014 00:12
host
hdp.hadoop1.com
hdp.hadoop2.com
hdp.hadoop3.com