Christopher Fox cdfox

## reproduce_roblox_distilbert.py
# Reproducing Roblox DistilBERT Medium Post
# https://blog.roblox.com/2020/05/scaled-bert-serve-1-billion-daily-requests-cpus/
#
# 1. Launch C5 12xlarge with Deep Learning AMI (Ubuntu 18.04) Version 32.0 (ami-0dc2264cd927ca9eb)
# 2. pip install transformers[torch]
# 3. python reproduce_roblox_distilbert.py

import timeit
from transformers import DistilBertTokenizerFast, \
    DistilBertForSequenceClassification

## tuple_equality.py
class foo:
    """Object that reports itself unequal to everything, itself included."""

    def __eq__(self, o):
        # Unconditionally unequal, even when ``o`` is this very instance.
        return False


# Two separately built tuples that wrap the *same* foo instance.
t = (foo(),)
t2 = (t[0],)

# Tuple comparison accepts identical elements as equal without relying on
# __eq__, so the containers match although their sole element never does.
t == t2  # True
t[0] == t2[0]  # False
t[0] is t2[0]  # True

## out_of_memory_in_web_server.go
package main

import (
    "fmt"
    "log"
    "net/http"
)

func main() {
    http.HandleFunc("/", func(w http.ResponseWriter, r *http.Request) {

## gist:6857081
from itertools import permutations

# Iterator over every ordering of the integers 0 through 5.
perms = permutations(range(6))

def check(p):
    # Each flag records whether one value sits earlier in p than another,
    # using p.index() to look up each value's position.
    # Presumably p is one of the orderings produced by perms -- TODO confirm.
    # NOTE(review): this listing is cut off after i5; how the flags are
    # combined or returned is not visible here.
    i1 = p.index(0) < p.index(3)  # 0 comes before 3
    i2 = p.index(1) < p.index(4)  # 1 comes before 4
    i3 = p.index(2) < p.index(1)  # 2 comes before 1
    i4 = p.index(2) < p.index(5)  # 2 comes before 5
    i5 = p.index(3) < p.index(4)  # 3 comes before 4

## preprocess.go
// For each line of the input file, remove nonalphanumeric characters,
// lowercase all letters, remove stopwords, and write the result to the output
// file. I used the answer here as a template for reading/writing files:
// http://stackoverflow.com/questions/1821811/how-to-read-write-from-to-file/9739903#9739903

package main

import (
	"bufio"
	"fmt"

## gist:2910560
# Flatten all reviews into one list of their period-delimited pieces.
sentences = [
    piece
    for review in reviews
    for piece in review.split(".")
]

## gist:2830517
# Call form of print: valid on Python 3 and, with a single string argument,
# produces the same output on Python 2 as the old print statement did.
print('hello world')

## gist:2560930
import requests
import codecs

# Request the Instapaper page, passing the article address as the 'u'
# query parameter.
url = 'http://www.instapaper.com/m'
params = {'u': 'http://techcrunch.com/2012/04/30/bn-8-k-microsoft-paying-180m-advance-on-nook-for-windows-8-125m-for-content-tech-acquisition/'}
r = requests.get(url, params=params)

# r.text holds the response from the server. It appears to be unicode in this
# case, so it is written through a UTF-8 encoding writer. The with-block
# closes (and therefore flushes) the file as soon as the write finishes
# instead of leaving the handle open until the interpreter exits.
with codecs.open("foo.html", mode="w", encoding="UTF-8") as f:
    f.write(r.text)

## gist:1037261

import json
import urllib
import urllib2
from gensim import corpora, models, similarities
import logging
import sys

# First 20 Twitter search results for "python"
tweets = [u'Long Integer Objects \u2014 Python v2.7.2 documentation http://bit.ly/jEzUVi',

## gist:1031054
Topic 0:

ICFP Programming Contest 2011 (Lambda: The Gathering) http://bit.ly/mfpZk6 #fp #fsharp #ocaml #haskell #scala #lisp #racket #scheme
[(0, 0.95871468032041129), (1, 0.079066183724039785)]

RT @rickasaurus: ICFP Programming Contest 2011 (Lambda: The Gathering) http://bit.ly/mfpZk6 #fp #fsharp #ocaml #haskell #scala #lisp #racket #scheme
[(0, 0.99229220887802994), (1, 0.062785061633268899)]

RT @rickasaurus: ICFP Programming Contest 2011 (Lambda: The Gathering) http://bit.ly/mfpZk6 #fp #fsharp #ocaml #haskell #scala #lisp #racket #scheme
[(0, 0.99229220887802994), (1, 0.062785061633268899)]
	# Reproducing Roblox DistilBERT Medium Post
	# https://blog.roblox.com/2020/05/scaled-bert-serve-1-billion-daily-requests-cpus/
	#
	# 1. Launch C5 12xlarge with Deep Learning AMI (Ubuntu 18.04) Version 32.0 (ami-0dc2264cd927ca9eb)
	# 2. pip install transformers[torch]
	# 3. python reproduce_roblox_distilbert.py

	import timeit
	from transformers import DistilBertTokenizerFast, \
	DistilBertForSequenceClassification
	class foo:
	def __eq__(self, o):
	return False

	t = (foo(),)
	t2 = (t[0],)

	t == t2 # True
	t[0] == t2[0] # False
	t[0] is t2[0] # True
	package main

	import (
	"fmt"
	"log"
	"net/http"
	)

	func main() {
	http.HandleFunc("/", func(w http.ResponseWriter, r *http.Request) {
	from itertools import permutations

	perms = permutations(range(6))

	def check(p):
	i1 = p.index(0) < p.index(3)
	i2 = p.index(1) < p.index(4)
	i3 = p.index(2) < p.index(1)
	i4 = p.index(2) < p.index(5)
	i5 = p.index(3) < p.index(4)
	// For each line of the input file, remove nonalphanumeric characters,
	// lowercase all letters, remove stopwords, and write the result to the output
	// file. I used the answer here as a template for reading/writing files:
	// http://stackoverflow.com/questions/1821811/how-to-read-write-from-to-file/9739903#9739903

	package main

	import (
	"bufio"
	"fmt"
	import requests
	import codecs

	url = 'http://www.instapaper.com/m'
	params = {'u': 'http://techcrunch.com/2012/04/30/bn-8-k-microsoft-paying-180m-advance-on-nook-for-windows-8-125m-for-content-tech-acquisition/'}
	r = requests.get(url, params=params)

	# r.text holds the response from the server. It appears to be unicode in this case.
	f = codecs.open("foo.html", mode="w", encoding="UTF-8")
	f.write(r.text)

	import json
	import urllib
	import urllib2
	from gensim import corpora, models, similarities
	import logging
	import sys

	# First 20 Twitter search results for "python"
	tweets = [u'Long Integer Objects \u2014 Python v2.7.2 documentation http://bit.ly/jEzUVi',
	Topic 0:

	ICFP Programming Contest 2011 (Lambda: The Gathering) http://bit.ly/mfpZk6 #fp #fsharp #ocaml #haskell #scala #lisp #racket #scheme
	[(0, 0.95871468032041129), (1, 0.079066183724039785)]

	RT @rickasaurus: ICFP Programming Contest 2011 (Lambda: The Gathering) http://bit.ly/mfpZk6 #fp #fsharp #ocaml #haskell #scala #lisp #racket #scheme
	[(0, 0.99229220887802994), (1, 0.062785061633268899)]

	RT @rickasaurus: ICFP Programming Contest 2011 (Lambda: The Gathering) http://bit.ly/mfpZk6 #fp #fsharp #ocaml #haskell #scala #lisp #racket #scheme
	[(0, 0.99229220887802994), (1, 0.062785061633268899)]