Rajkumar Singh rajkrrsingh

## Create MapR-DB Table
private void createTable(String tableName, List<String> cfList)
			throws IOException {
		final String table = tableName;
		final List<String> cfs = cfList;

		try {
			ugi.doAs(new PrivilegedExceptionAction<Void>() {
				@Override
				public Void run() throws Exception {
					if (!admin.tableExists(table)) {

## gist:a86ff86f73e351bdf86c
#wget http://download.redis.io/releases/redis-3.0.2.tar.gz
# tar xzf redis-3.0.2.tar.gz
# cd redis-3.0.2
# make

Run Redis Server
src/redis-server

## HiveServer2 connection with MySQL DB as metastore over SSL.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                rajkrrsingh
                / HiveServer2 connection with MySQL DB as metastore over SSL.md
            
            
              Last active
              July 18, 2016 06:07
            
              
                quick guide to connect HS2 to MySQL DB metastore over SSL
              
          
    Setting up MySQL SSL

# Create clean environment
shell> rm -rf newcerts
shell> mkdir newcerts && cd newcerts

# Create CA certificate
shell> openssl genrsa 2048 > ca-key.pem
shell> openssl req -new -x509 -nodes -days 3600 \
         -key ca-key.pem -out ca.pem


## Reading parquet files using the parquet tools
// Build parquet-tools
git clone https://github.com/Parquet/parquet-mr.git
cd parquet-mr/parquet-tools/
mvn clean package -Plocal

// Print the schema of the parquet file
java -jar parquet-tools-1.6.0rc3-SNAPSHOT.jar schema sample.parquet

// Read parquet file
java -jar parquet-tools-1.6.0rc3-SNAPSHOT.jar cat sample.parquet

## RunSqoopCommand.java
import net.neoremind.sshxcute.core.SSHExec;
import net.neoremind.sshxcute.core.ConnBean;
import net.neoremind.sshxcute.task.CustomTask;
import net.neoremind.sshxcute.task.impl.ExecCommand;

public class RunSqoopCommand {

public static void main(String args[]) throws Exception{


## SparkStreamingSampleApp
mkdir spark-streaming-example
cd spark-streaming-example/
mkdir -p src/main/scala
cd src/main/scala
vim TestStreaming.scala

Add the following lines of code to TestStreaming.scala:

import org.apache.spark.streaming.StreamingContext
import org.apache.spark.streaming.StreamingContext._

## Atlas_Rest_API
[root@rksnode ~]# curl http://rksnode:21000/api/atlas/admin/version
{"Version":"0.5.0.2.4.2.0-258-r375e15d6e3442c484b3a095a80127e41abef40b5","Name":"apache-atlas","Description":"Metadata Management and Data Governance Platform over Hadoop"}[root@rksnode ~]#
[root@rksnode ~]#
[root@rksnode ~]#
[root@rksnode ~]# curl http://rksnode:21000/api/atlas/types
{"results":["DataSet","hive_order","Process","hive_table","hive_db","hive_process","hive_principal_type","hive_resource_type","hive_object_type","Infrastructure","hive_index","hive_column","hive_resourceuri","hive_storagedesc","hive_role","hive_partition","hive_serde","hive_type"],"count":18,"requestId":"qtp1286783232-60 - 0128be6a-076e-4ad3-972a-58783a1f7180"}[root@rksnode ~]#
[root@rksnode ~]#
[root@rksnode ~]# curl http://rksnode:21000/api/atlas/types/hive_process
{"typeName":"hive_process","definition":"{\n  \"enumTypes\":[\n    \n  ],\n  \"structTypes\":[\n    \n  ],\n  \"traitTypes\":[\n    \n  ],\n  \"classTypes\":[\n    {\n      \"superTypes\":[\n

## Spark2StarterApp
mkdir Spark2StarterApp
cd Spark2StarterApp/
mkdir -p src/main/scala
cd src/main/scala
vim Spark2Example.scala

import org.apache.spark.sql.SparkSession

object Spark2Example {

## Spark2DataSetDemo
[root@rkk1 Spark2StarterApp]# /usr/hdp/current/spark2-client/bin/spark-shell
Setting default log level to "WARN".
To adjust logging level use sc.setLogLevel(newLevel).
16/11/30 18:01:48 WARN SparkContext: Use an existing SparkContext, some configuration may not take effect.
Spark context Web UI available at http://172.26.81.127:4040
Spark context available as 'sc' (master = local[*], app id = local-1480528906336).
Spark session available as 'spark'.
Welcome to
      ____              __
     / __/__  ___ _____/ /__

## Benchmark-results.txt
End-to-end Latency

0.0543 ms (median)
0.003125 ms (99th percentile)
5  ms (99.9th percentile)

Producer and consumer

Producer - 1431170.2 records/sec (136.49 MB/sec)
Consumer - 3276754.7021 records/sec (312.4957 MB/sec)
	private void createTable(String tableName, List<String> cfList)
	throws IOException {
	final String table = tableName;
	final List<String> cfs = cfList;

	try {
	ugi.doAs(new PrivilegedExceptionAction<Void>() {
	@Override
	public Void run() throws Exception {
	if (!admin.tableExists(table)) {
	#wget http://download.redis.io/releases/redis-3.0.2.tar.gz
	# tar xzf redis-3.0.2.tar.gz
	# cd redis-3.0.2
	# make

	Run Redis Server
	src/redis-server
	// Build parquet-tools
	git clone https://github.com/Parquet/parquet-mr.git
	cd parquet-mr/parquet-tools/
	mvn clean package -Plocal

	// Print the schema of the parquet file
	java -jar parquet-tools-1.6.0rc3-SNAPSHOT.jar schema sample.parquet

	// Read parquet file
	java -jar parquet-tools-1.6.0rc3-SNAPSHOT.jar cat sample.parquet
	import net.neoremind.sshxcute.core.SSHExec;
	import net.neoremind.sshxcute.core.ConnBean;
	import net.neoremind.sshxcute.task.CustomTask;
	import net.neoremind.sshxcute.task.impl.ExecCommand;

	public class RunSqoopCommand {

	public static void main(String args[]) throws Exception{
	mkdir spark-streaming-example
	cd spark-streaming-example/
	mkdir -p src/main/scala
	cd src/main/scala
	vim TestStreaming.scala

	Add the following lines of code to TestStreaming.scala:

	import org.apache.spark.streaming.StreamingContext
	import org.apache.spark.streaming.StreamingContext._
	[root@rksnode ~]# curl http://rksnode:21000/api/atlas/admin/version
	{"Version":"0.5.0.2.4.2.0-258-r375e15d6e3442c484b3a095a80127e41abef40b5","Name":"apache-atlas","Description":"Metadata Management and Data Governance Platform over Hadoop"}[root@rksnode ~]#
	[root@rksnode ~]#
	[root@rksnode ~]#
	[root@rksnode ~]# curl http://rksnode:21000/api/atlas/types
	{"results":["DataSet","hive_order","Process","hive_table","hive_db","hive_process","hive_principal_type","hive_resource_type","hive_object_type","Infrastructure","hive_index","hive_column","hive_resourceuri","hive_storagedesc","hive_role","hive_partition","hive_serde","hive_type"],"count":18,"requestId":"qtp1286783232-60 - 0128be6a-076e-4ad3-972a-58783a1f7180"}[root@rksnode ~]#
	[root@rksnode ~]#
	[root@rksnode ~]# curl http://rksnode:21000/api/atlas/types/hive_process
	{"typeName":"hive_process","definition":"{\n \"enumTypes\":[\n \n ],\n \"structTypes\":[\n \n ],\n \"traitTypes\":[\n \n ],\n \"classTypes\":[\n {\n \"superTypes\":[\n
	mkdir Spark2StarterApp
	cd Spark2StarterApp/
	mkdir -p src/main/scala
	cd src/main/scala
	vim Spark2Example.scala

	import org.apache.spark.sql.SparkSession

	object Spark2Example {
	[root@rkk1 Spark2StarterApp]# /usr/hdp/current/spark2-client/bin/spark-shell
	Setting default log level to "WARN".
	To adjust logging level use sc.setLogLevel(newLevel).
	16/11/30 18:01:48 WARN SparkContext: Use an existing SparkContext, some configuration may not take effect.
	Spark context Web UI available at http://172.26.81.127:4040
	Spark context available as 'sc' (master = local[*], app id = local-1480528906336).
	Spark session available as 'spark'.
	Welcome to
	____ __
	/ __/__ ___ _____/ /__
	End-to-end Latency

	0.0543 ms (median)
	0.003125 ms (99th percentile)
	5 ms (99.9th percentile)

	Producer and consumer

	Producer - 1431170.2 records/sec (136.49 MB/sec)
	Consumer - 3276754.7021 records/sec (312.4957 MB/sec)