Skip to content

Instantly share code, notes, and snippets.

@meyarivan
meyarivan / stream.py
Created June 9, 2015 22:57
Decode Kafka messages submitted by Mypipe
#!/usr/bin/env python2
from __future__ import print_function
import os, sys
from kafka import KafkaConsumer
import avro.schema
from avro.datafile import DataFileReader, DataFileWriter
from avro.io import DatumReader, DatumWriter
@meyarivan
meyarivan / mysql_mariadb.py
Created August 7, 2015 13:11
mysql_mariadb.py
# stdlib
import subprocess
import os
import sys
import re
import traceback
# project
from checks import AgentCheck
from utils.platform import Platform
#!/bin/bash
# Dump the `DESC FORMATTED` output of every table in every Hive database
# into one file per table, named desc.<database>.<table>, written to the
# current working directory.
#
# Database and table names come from the whitespace-split output of the
# hive CLI, so each name is assumed to be a single word.
for DB in $(hive -e "SHOW DATABASES;"); do
    for tbl in $(hive -e "USE ${DB}; SHOW TABLES"); do
        # Quote the redirection target so the file name is used verbatim
        # (no word splitting or glob expansion on the expanded names).
        hive -e "DESC FORMATTED ${DB}.${tbl};" > "desc.${DB}.${tbl}"
    done
done
@meyarivan
meyarivan / Hive+S3 Tuning
Last active May 4, 2016 12:15
Hive + S3 tuning
Tunables:
- mapreduce.input.fileinputformat.list-status.num-threads (hive-site.xml)
- fs.s3a.block.size
JIRAs:
- https://issues.apache.org/jira/browse/HADOOP-12810
- https://issues.apache.org/jira/browse/HADOOP-9565
- https://issues.apache.org/jira/browse/HADOOP-12878