Jaya Zenchenko sigma23

## 2017 Fantasy Football Projections.ipynb

      
              1 file
            
          
              16 forks
            
          
              5 comments
            
          
              65 stars
            
          
                seanjtaylor
                / 2017 Fantasy Football Projections.ipynb
            
            
              Created
              September 4, 2017 01:38
            
          
        Loading

      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## dash_simple_example_pandas_datareader.py
# See official docs at https://dash.plotly.com
# pip install dash pandas

from dash import Dash, dcc, html, Input, Output
import plotly.express as px

import pandas as pd

df = pd.read_csv('https://raw.githubusercontent.com/plotly/datasets/master/gapminderDataFiveYear.csv')

## Spark apply function on multiple columns at once
You can use select with varargs including *:

import spark.implicits._

df.select($"*" +: Seq("A", "B", "C").map(c =>
  sum(c).over(Window.partitionBy("ID").orderBy("time")).alias(s"cum$c")
): _*)
This:

Maps column names to window expressions with Seq("A", ...).map(...)

## alb.sql
CREATE EXTERNAL TABLE IF NOT EXISTS alb_logs (
	type string,
	timestamp string,
	elb string,
	client_ip string,
	client_port int,
	target_ip string,
	target_port int,
	request_processing_time double,
	target_processing_time double,

## demo_faster_rcnn_notebook.ipynb

      
              1 file
            
          
              7 forks
            
          
              0 comments
            
          
              5 stars
            
          
                bigsnarfdude
                / demo_faster_rcnn_notebook.ipynb
            
            
              Created
              November 7, 2016 04:12
            
              
                faster rcnn notebook
              
          
        Loading

      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## export_reveal.py
# -*- coding: utf-8 -*-

## EXPORTING TO PDF FROM revealjs OR jupyter notebook slides

## using nbconvert and decktape (https://github.com/astefanutti/decktape)
## to export pdf and/or html(revealjs)
## from jupyter notebook / revealjs html
## phantomjs must be on the PATH, and the decktape directory must be placed beside this export_reveal.py file
## for more detail, please check:
## nbconvert - https://github.com/jupyter/nbconvert

## fimp_xgboost.py
# credits @mmueller     https://www.kaggle.com/mmueller/liberty-mutual-group-property-inspection-prediction/xgb-feature-importance-python/code
import pandas as pd
import xgboost as xgb
import operator
from matplotlib import pylab as plt

def ceate_feature_map(features):
    outfile = open('xgb.fmap', 'w')
    i = 0
    for feat in features:

## README.md

      
              9 files
            
          
              1 fork
            
          
              0 comments
            
          
              3 stars
            
          
                rbren
                / README.md
            
            
              Created
              January 25, 2016 23:36
            
              
                Sync GitHub Issues to Trello
              
          
    DataFire Daemon: Sync GitHub Issues to Trello

Create a Trello list for every Milestone, and a card for every Issue
View on DataFire
[metadata]: ./ '{"links":[{"connection":"564cb90e2a034b0e0f1255fe","operation":{"method":"get","path":"/members/{idMember}/boards"}},{"connection":"563b9b84ea9ad5f345e97505","operation":{"method":"get","path":"/repos/{ownerId}/{repoId}/issues"}},{"connection":"564cb90e2a034b0e0f1255fe","operation":{"method":"get","path":"/boards/{idBoard}/cards"}},{"connection":"564cb90e2a034b0e0f1255fe","operation":{"method":"get","path":"/boards/{idBoard}/lists"}},{"connection":"563b9b84ea9ad5f345e97505","operation":{"method":"get","path":"/repos/{ownerId}/{repoId}/milestones"}},{"connection":"564cb90e2a034b0e0f1255fe","operation":{"method":"post","path":"/lists"}},{"connection":"564cb90e2a034b0e0f1255fe","operation":{"method":"post","path":"/cards"}},{"connection":"564cb90e2a034b0e0f1255fe","operation":{"method":"put","path":"/cards/{i

  
## K-Means.ipynb

      
              1 file
            
          
              13 forks
            
          
              9 comments
            
          
              53 stars
            
          
                narphorium
                / K-Means.ipynb
            
            
              Last active
              August 3, 2021 06:40
            
          
        Loading

      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## Spark_OnlineLDA_wikipedia_example.scala
import org.apache.spark.ml.feature.{CountVectorizer, RegexTokenizer, StopWordsRemover}
import org.apache.spark.mllib.clustering.{LDA, OnlineLDAOptimizer}
import org.apache.spark.mllib.linalg.Vector

import sqlContext.implicits._

val numTopics: Int = 100
val maxIterations: Int = 100
val vocabSize: Int = 10000
	# See official docs at https://dash.plotly.com
	# pip install dash pandas

	from dash import Dash, dcc, html, Input, Output
	import plotly.express as px

	import pandas as pd

	df = pd.read_csv('https://raw.githubusercontent.com/plotly/datasets/master/gapminderDataFiveYear.csv')
	You can use select with varargs including *:

	import spark.implicits._

	df.select($"*" +: Seq("A", "B", "C").map(c =>
	sum(c).over(Window.partitionBy("ID").orderBy("time")).alias(s"cum$c")
	): _*)
	This:

	Maps column names to window expressions with Seq("A", ...).map(...)
	CREATE EXTERNAL TABLE IF NOT EXISTS alb_logs (
	type string,
	timestamp string,
	elb string,
	client_ip string,
	client_port int,
	target_ip string,
	target_port int,
	request_processing_time double,
	target_processing_time double,
	# -*- coding: utf-8 -*-

	## EXPORTING TO PDF FROM revealjs OR jupyter notebook slides

	## using nbconvert and decktape (https://github.com/astefanutti/decktape)
	## to export pdf and/or html(revealjs)
	## from jupyter notebook / revealjs html
	## phantomjs must be on the PATH, and the decktape directory must be placed beside this export_reveal.py file
	## for more detail, please check:
	## nbconvert - https://github.com/jupyter/nbconvert
	# credits @mmueller https://www.kaggle.com/mmueller/liberty-mutual-group-property-inspection-prediction/xgb-feature-importance-python/code
	import pandas as pd
	import xgboost as xgb
	import operator
	from matplotlib import pylab as plt

	def ceate_feature_map(features):
	outfile = open('xgb.fmap', 'w')
	i = 0
	for feat in features:
	import org.apache.spark.ml.feature.{CountVectorizer, RegexTokenizer, StopWordsRemover}
	import org.apache.spark.mllib.clustering.{LDA, OnlineLDAOptimizer}
	import org.apache.spark.mllib.linalg.Vector

	import sqlContext.implicits._

	val numTopics: Int = 100
	val maxIterations: Int = 100
	val vocabSize: Int = 10000