Install Homebrew on your Mac if you don't already have it.
Install highlight by running "brew install highlight". (This also pulls in Lua and Boost as dependencies.)
# Read the raw text file into a character vector, one element per line.
# Each line is expected to hold one Python-dict-style record, as in the
# examples below.
py_dict = readLines('python_dictionary.txt')
# e.g.
#{"cat_name": "Ella", "dwell_status": "tree_dweller", "coat_color": "gray, white, orange", "is_from_hell": "Y"}
#{"cat_name": "Billie", "dwell_status": "bush_dweller", "coat_color": "gray, white", "is_from_hell": "N"}
dict_to_df = function(dict) { | |
require(plyr) | |
df = data.frame() | |
df_temp = list() |
clean_headers = function(headers) { | |
# Make lowercase | |
headers = tolower(headers) | |
# Replace symbols | |
headers = gsub(' ', '', headers, fixed = TRUE) | |
headers = gsub('.', '_', headers, fixed = TRUE) | |
headers = gsub('[^[:alnum:]_]', '', headers) # remove all symbols except '_' | |
headers = gsub('__', '_', headers, fixed = TRUE) |
# Presentation-oriented ggplot2 theme.
#
# Starts from theme_minimal() and overrides a handful of elements so plots
# stay legible on slides: larger axis text and titles, no axis ticks, and the
# legend placed below the plot.
#
# Args:
#   base_size:   base font size passed through to theme_minimal() (default 12).
#   base_family: base font family passed through to theme_minimal()
#                (default "").
#
# Returns:
#   The theme object produced by theme_minimal(...) %+replace% theme(...),
#   suitable for adding to a ggplot with `+`.
#
# Requires ggplot2 to be attached (theme_minimal, theme, element_text,
# element_blank and %+replace% all come from it).
theme_presentation = function (base_size = 12, base_family = "") {
  # NOTE(review): %+replace% swaps each listed element wholesale rather than
  # merging it with theme_minimal()'s version, so element_text() properties
  # not given here are not inherited from the base element -- confirm this is
  # the intended behaviour versus a plain `+`.
  theme_minimal(base_size = base_size, base_family = base_family) %+replace%
    theme(
      axis.text.x = element_text(size = 15),
      axis.text.y = element_text(size = 15),
      title = element_text(size = 20),
      axis.title = element_text(size = 18),
      axis.ticks = element_blank(),
      legend.position = 'bottom')
}
Install Homebrew on your Mac if you don't already have it.
Install highlight by running "brew install highlight". (This also pulls in Lua and Boost as dependencies.)
# Upgrade the packages already installed on the machine.
sudo yum upgrade
# Install tmux via yum.
sudo yum install tmux
# Start a new tmux session named "session_name".
tmux new -s session_name
I hereby claim:
To claim this, I am signing this object:
// spark-shell --jars /home/otto/algebird-core_2.10-0.9.0.jar,/home/mforns/refinery-core-0.0.9.jar | |
import java.util.Date | |
import java.text.SimpleDateFormat | |
import org.wikimedia.analytics.refinery.core.PageviewDefinition | |
import org.wikimedia.analytics.refinery.core.Webrequest | |
import scala.math.pow | |
import org.apache.spark.rdd.RDD | |
import com.twitter.algebird.QTree |
multiread.delim = function(path, header = TRUE, sep = '\t') { | |
# multiread.delim is a function to read in all the files in a given directory | |
# and rbind them into one data frame. Input files need to be of the same | |
# structure. Headers will be labeled according to the headers in the first file. | |
file_names = paste(path, list.files(path), sep = '/') | |
for (file in file_names) { | |
if (!exists('combined_df')) { |
libs = c('arm', | |
'biglm', | |
'car', | |
'doParallel', | |
'dplyr', | |
'gclus', | |
'ggplot2', | |
'gplots', | |
'ggthemes', | |
'lpSolveAPI', |