Aman amanahuja

## keybase.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              1 star
            
          
                amanahuja
                / keybase.md
            
            
              Created
              October 5, 2020 17:11
            
              
                keybase.md
              
          
    Keybase proof

I hereby claim:

I am amanahuja on github.
I am amanqa (https://keybase.io/amanqa) on keybase.
I have a public key ASASllH9sUL7cRzrWMq-nIMWp7iil-P5Y3I_7ec4VcBSXwo

To claim this, I am signing this object:

  
## shoutbase_client.py
# From Shoutbase team
# 2018 June 04

import requests
import time
import urllib
import csv

try:
    # for Python 2.x

## gini_coefficient_metric.py
"""
Calculation of gini coefficient metric
via https://www.kaggle.com/c/ClaimPredictionChallenge/forums/t/703/code-to-calculate-normalizedgini?forumMessageId=5897#post5897
I'm not the author; that would be Kaggle user Patrick
See http://www.rhinorisk.com/Publications/Gini%20Coefficients.pdf
"""
def gini(actual, pred, cmpcol = 0, sortcol = 1):
  assert( len(actual) == len(pred) )
  all = np.asarray(np.c_[ actual, pred, np.arange(len(actual)) ], dtype=np.float)
  all = all[ np.lexsort((all[:,2], -1*all[:,1])) ]

## womens_stats_2015.ipynb

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                amanahuja
                / womens_stats_2015.ipynb
            
            
              Created
              May 26, 2015 22:35
            
              
                Women's stats #d1natties (temp)
              
          
      Loading

      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## plotting_categorical_variables.py
"""

Plotting a categorical variable
----------------------------------
`df` is a pandas dataframe with a timeseries index.
`df` has a column `categorical` of dtype object, strings and nans, which is a categorical variable representing events

----------------------------------
>>> print df[:5]
                        categorical

## andrews_curve_column_order.py
import pandas as pd
import statsmodels.api as sm

#Change next two lines for dataset, such as in
#http://vincentarelbundock.github.io/Rdatasets/

data = sm.datasets.get_rdataset('airquality').data
class_column = 'Month'

fig, (ax1, ax2) = plt.subplots(nrows=2, ncols=1, sharex=True)

## cancer_data_expore.ipynb

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                amanahuja
                / cancer_data_expore.ipynb
            
            
              Created
              September 2, 2013 22:28
            
              
                Age-adjusted Urinary Bladder cancer occurrence, by state:
              
          
      Loading

      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## sklearn-MAPE.py
from sklearn.utils import check_arrays

def mean_absolute_percentage_error(y_true, y_pred):
    """
    Use of this metric is not recommended; for illustration only.
    See other regression metrics on sklearn docs:
      http://scikit-learn.org/stable/modules/classes.html#regression-metrics

    Use like any other metric
    >>> y_true = [3, -0.5, 2, 7]; y_pred = [2.5, -0.3, 2, 8]

## news_01.py
import feedparser
import nltk
from collections import defaultdict

#Some useful parameters
nitemstoparse = 5
new_words = []

feedurls = [
  'http://www.nytimes.com/services/xml/rss/nyt/GlobalHome.xml',

## load-clean.py
# -*- coding: utf-8 -*-
"""
Created on Thu May 22 20:30:36 2012

http://www.meetup.com/r-enthusiasts/events/65306492/
   Mirroring the work that we do in Python.
   This is the code to import the sales and query data into a Py-Pandas
   dataframe (with conversion to time series).

Author (twitter): @amanqa
	# From Shoutbase team
	# 2018 June 04

	import requests
	import time
	import urllib
	import csv

	try:
	# for Python 2.x
	"""
	Calculation of gini coefficient metric
	via https://www.kaggle.com/c/ClaimPredictionChallenge/forums/t/703/code-to-calculate-normalizedgini?forumMessageId=5897#post5897
	I'm not the author; that would be Kaggle user Patrick
	See http://www.rhinorisk.com/Publications/Gini%20Coefficients.pdf
	"""
	def gini(actual, pred, cmpcol = 0, sortcol = 1):
	assert( len(actual) == len(pred) )
	all = np.asarray(np.c_[ actual, pred, np.arange(len(actual)) ], dtype=np.float)
	all = all[ np.lexsort((all[:,2], -1*all[:,1])) ]
	"""

	Plotting a categorical variable
	----------------------------------
	`df` is a pandas dataframe with a timeseries index.
	`df` has a column `categorical` of dtype object, strings and nans, which is a categorical variable representing events

	----------------------------------
	>>> print df[:5]
	categorical
	import pandas as pd
	import statsmodels.api as sm

	#Change next two lines for dataset, such as in
	#http://vincentarelbundock.github.io/Rdatasets/

	data = sm.datasets.get_rdataset('airquality').data
	class_column = 'Month'

	fig, (ax1, ax2) = plt.subplots(nrows=2, ncols=1, sharex=True)
	from sklearn.utils import check_arrays

	def mean_absolute_percentage_error(y_true, y_pred):
	"""
	Use of this metric is not recommended; for illustration only.
	See other regression metrics on sklearn docs:
	http://scikit-learn.org/stable/modules/classes.html#regression-metrics

	Use like any other metric
	>>> y_true = [3, -0.5, 2, 7]; y_pred = [2.5, -0.3, 2, 8]
	import feedparser
	import nltk
	from collections import defaultdict

	#Some useful parameters
	nitemstoparse = 5
	new_words = []

	feedurls = [
	'http://www.nytimes.com/services/xml/rss/nyt/GlobalHome.xml',
	# -*- coding: utf-8 -*-
	"""
	Created on Thu May 22 20:30:36 2012

	http://www.meetup.com/r-enthusiasts/events/65306492/
	Mirroring the work that we do in Python.
	This is the code to import the sales and query data into a Py-Pandas
	dataframe (with conversion to time series).

	Author (twitter): @amanqa