Gabe gdbassett

## gist:97e9df660269db098db8
### Keybase proof

I hereby claim:

  * I am gdbassett on github.
  * I am gdbassett (https://keybase.io/gdbassett) on keybase.
  * I have a public key whose fingerprint is 8F47 6E59 65B3 9C92 428C  5A8C C609 81ED D4FA 1957

To claim this, I am signing this object:

## robustTau.py
from scipy import stats as scistats
import numpy as np

# Implementation of Tau from http://amstat.tandfonline.com/doi/abs/10.1198/004017002188618509#.VDgKhdR4rEh
# blatantly transposed from the R robustbase library at http://r-forge.r-project.org/scm/?group_id=59, OGK.R
def scaleTau2(x, c1 = 4.5, c2 = 3.0, consistency = True, mu_too = False, *xargs, **kargs):
	## NOTA BENE: This is *NOT* consistency corrected
	x = np.asarray(x)
	n = len(x)
	medx = np.median(x)

## gist:6438b4036a501eba9f5e
> df <- df[!names(df) %in% c('root.victim.region',
+ 'root.victim.country',
+ 'root.summary',
+ 'root.summary=Source_Category',
+ 'root.victim.industry',
+ 'root.timeline.incident.year',
+ 'root.plus.dbir_year',
+ 'root.action.social.notes',
+ 'root.victim.secondary.notes',
+ 'root.action.hacking.notes',

## linearKMeans.R
#' @param df Dataframe with x and y columns.  (Hopefully in the future this can be x)
#' @param nlines The number of clusters.
#' @param ab A data frame with 'slopes' and 'intercepts' columns and one row per initial line.  Dimensions must match nlines.
#' @param maxiter The maximum number of iterations to do
#' @export
#' @examples
linearKMeans <- function(df, ab=NULL, nlines=0, maxiter=1000) {
  # default number of lines
  nlines_default <- 5


## test_GENERIC.Rmd
---
title: "Test"
author: "Gabe"
date: "November 03, 2016"
output: html_document
params:
  df: data.frame()
  a: ""
  b: ""
  c: "FALSE"

## livesplit.R
speedrun <- XML::xmlParse("/livesplit.lss")
speedrun <- XML::xmlToList(speedrun)

chunk <- do.call(rbind, lapply(speedrun[['Segments']], function(segments) {

    segments.df <- do.call(rbind, lapply(segments[['SegmentHistory']], function(segment) {
        if ('RealTime' %in% names(segment))
        data.frame(`attemptID` = segment$.attrs['id'], RealTime = segment$RealTime)
    }))
    segments.df$name <- rep(segments$Name, nrow(segments.df))

## bayesian_credible_intervals.R
# pick an enumeration
enum <- "action.*.variety"
# establish filter criteria (easier than a complex standard-eval  filter_ line)
df <- vcdb %>%
  dplyr::filter(plus.dbir_year == 2016, subset.2017dbir) %>%
  dplyr::filter(attribute.confidentiality.data_disclosure.Yes) %>%
  dplyr::filter(victim.industry2.92)

# establish priors from previous year
priors <- df %>%

## two_barcharts.json
{
  "$schema": "https://vega.github.io/schema/vega-lite/v2.json",
  "vconcat": [
    {
      "data": {
        "values": [
          {
            "enum": "victim.industry2.52",
            "x": 471,
            "n": 1935,

## schema_to_graph.py
import networkx as nx # NOTE: written against dev networkx 2.0
import logging
import inspect
import json

logger = logging.getLogger()
fileLogger = logging.FileHandler("~/Documents/Development/tmp/vega.log")
fileLogger.setLevel(logging.DEBUG)
logger.addHandler(fileLogger)

## flip.R
#' Flip the x and y axis
#'
#' This is accomplished by updating the x & y marks, flipping the
#' scales, and updating the axis labels.
#'
#' WARNING: This currently works for rectangular layer figures.  It may not work with
#' multiple-layer figures, other marks, or signals.
#'
#' WARNING: No tests currently exist for this function
#'
	### Keybase proof

	I hereby claim:

	* I am gdbassett on github.
	* I am gdbassett (https://keybase.io/gdbassett) on keybase.
	* I have a public key whose fingerprint is 8F47 6E59 65B3 9C92 428C 5A8C C609 81ED D4FA 1957

	To claim this, I am signing this object:
	from scipy import stats as scistats
	import numpy as np

	# Implementation of Tau from http://amstat.tandfonline.com/doi/abs/10.1198/004017002188618509#.VDgKhdR4rEh
	# blatantly transposed from the R robustbase library at http://r-forge.r-project.org/scm/?group_id=59, OGK.R
	def scaleTau2(x, c1 = 4.5, c2 = 3.0, consistency = True, mu_too = False, *xargs, **kargs):
	## NOTA BENE: This is *NOT* consistency corrected
	x = np.asarray(x)
	n = len(x)
	medx = np.median(x)
	> df <- df[!names(df) %in% c('root.victim.region',
	+ 'root.victim.country',
	+ 'root.summary',
	+ 'root.summary=Source_Category',
	+ 'root.victim.industry',
	+ 'root.timeline.incident.year',
	+ 'root.plus.dbir_year',
	+ 'root.action.social.notes',
	+ 'root.victim.secondary.notes',
	+ 'root.action.hacking.notes',
	#' @param df Dataframe with x and y columns. (Hopefully in the future this can be x)
	#' @param nlines The number of clusters.
	#' @param ab A data frame with 'slopes' and 'intercepts' columns and one row per initial line. Dimensions must match nlines.
	#' @param maxiter The maximum number of iterations to do
	#' @export
	#' @examples
	linearKMeans <- function(df, ab=NULL, nlines=0, maxiter=1000) {
	# default number of lines
	nlines_default <- 5
	---
	title: "Test"
	author: "Gabe"
	date: "November 03, 2016"
	output: html_document
	params:
	df: data.frame()
	a: ""
	b: ""
	c: "FALSE"
	speedrun <- XML::xmlParse("/livesplit.lss")
	speedrun <- XML::xmlToList(speedrun)

	chunk <- do.call(rbind, lapply(speedrun[['Segments']], function(segments) {

	segments.df <- do.call(rbind, lapply(segments[['SegmentHistory']], function(segment) {
	if ('RealTime' %in% names(segment))
	data.frame(`attemptID` = segment$.attrs['id'], RealTime = segment$RealTime)
	}))
	segments.df$name <- rep(segments$Name, nrow(segments.df))
	# pick an enumeration
	enum <- "action.*.variety"
	# establish filter criteria (easier than a complex standard-eval filter_ line)
	df <- vcdb %>%
	dplyr::filter(plus.dbir_year == 2016, subset.2017dbir) %>%
	dplyr::filter(attribute.confidentiality.data_disclosure.Yes) %>%
	dplyr::filter(victim.industry2.92)

	# establish priors from previous year
	priors <- df %>%
	{
	"$schema": "https://vega.github.io/schema/vega-lite/v2.json",
	"vconcat": [
	{
	"data": {
	"values": [
	{
	"enum": "victim.industry2.52",
	"x": 471,
	"n": 1935,
	import networkx as nx # NOTE: written against dev networkx 2.0
	import logging
	import inspect
	import json

	logger = logging.getLogger()
	fileLogger = logging.FileHandler("~/Documents/Development/tmp/vega.log")
	fileLogger.setLevel(logging.DEBUG)
	logger.addHandler(fileLogger)
	#' Flip the x and y axis
	#'
	#' This is accomplished by updating the x & y marks, flipping the
	#' scales, and updating the axis labels.
	#'
	#' WARNING: This currently works for rectangular layer figures. It may not work with
	#' multiple-layer figures, other marks, or signals.
	#'
	#' WARNING: No tests currently exist for this function
	#'