Skip to content

Instantly share code, notes, and snippets.

@TATABOX42
TATABOX42 / nlp_lib.py
Created September 17, 2019 00:10
Built this module in Python 3 to process and clean strings. It removes emojis, words that are shorter than a given length, etc.
import re
from string import digits, punctuation
from nltk.stem import SnowballStemmer
from nltk.tokenize import word_tokenize
class ProcessTextMethods:
def __init__(self):
self.stemmer = SnowballStemmer("english")
self.emoji_pattern = re.compile("["
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
@TATABOX42
TATABOX42 / server.py
Last active August 29, 2015 14:28 — forked from christianroman/server.py
Rompiendo Captcha de CURP usando Python, OpenCV, Tesseract OCR y Tornado
import tornado.ioloop
import tornado.web
import urllib2 as urllib
from PIL import Image
from cStringIO import StringIO
import numpy as np
import tesserwrap
import cv2
class MainHandler(tornado.web.RequestHandler):
# ***********************************************
# ***********************************************
# Author: Benjamin Tovar
# Date: April 20, 2015
# Post: http://btovar.com/2015/04/introduction-to-k-means-in-r/
# ***********************************************
# ***********************************************
library(ggplot2)
library(reshape)
# **********************************
# Author: Benjamin Tovar
# Date: March 25, 2015
# Post: Using Neural Networks to fit equations in R
# Post url: http://btovar.com/2015/03/neural-networks-fit-eq/
# **********************************
# load libraries
library(RSNNS
library(ggplot2)
>gi|1620934|emb|Z80230.1| Calliphora vicina trp gene
AAAAGTTTAAATTGGATAAATTGCAAAAGGACAATTAAGGATACGGAATATATGCGTAGTTTGTGTAAAA
TGCGCTTATAGAAACACAGAAAAAAAAAATAAAAACGGATAAATCTTTAGAAACAATAAACACTAGCTTA
AAAATTAAAAGCAAAACAAACAATAAAACATGGCAACTGATCCGGAAAAAGGGAAAAATGAGGAAGAAAA
CTATAATATACAGTTTGCAGATGAATACGTGTTGACGGAGACAGAGAAAACCTTTATATTGGCTTGTGAG
CGCGGTGACATAGCAAGTGTCAAGGTAATAATTGAGGAAAATAAAGGTGCACCGGAAAAGTTTAATATTA
ATTGTGTTGATCCCATGAATCGTTCGGCCTTAATATCAGCCATTGAAAATGAAAATTTTGATTTAATGAT
TGTACTGTTGGAGGAAGGCATAGATGTGGGCGATGCATTGTTGCATGCTATTTCTGAAGAATATGTGGAG
GCTGTGGAGGAACTGTTGCAATGGGAAGAAACGCATCATAAGGAGGGTACACCATATAGTTGGGAGGCAG
TTGATCGTTCGAAATCGACATTTACGCCTGATATAACGCCTCTAATATTGGCAGCACATCGTAACAATTA
# ******************************************************************************
# FUNCTION: extract.five.utr.sequence | JULY/29/2012 | BENJAMIN TOVAR
# ******************************************************************************
extract.five.utr.sequence <- function(gene.list.refseq,
number.bases.upstream=1000){
# Author: Benjamin Tovar
# Date: July 29, 2012
# Post: http://btovar.com/2015/03/extracting-upstream-regions/
# Author: Benjamin Tovar
# Date: March 14, 2015
# Post: http://btovar.com/2015/03/markov-chains-in-r
#
# Example of a Markov Chain of zero order (the current nucleotide is
# totally independent of the previous nucleotide).
# ***********************************************************************
# ***********************************************************************
#
# PREDICTING LONG TERM CUSTOMER VALUE WITH BTYD PACKAGE
# Pareto/NBD (negative binomial distribution) modeling of
# repeat-buying behavior in a noncontractual setting
#
# Matthew Baggott, matt@baggott.net
#
# Accompanying slides at:
# http://www.slideshare.net/mattbagg/baggott-predict-customerinrpart1#
#
@TATABOX42
TATABOX42 / BirdMan
Last active August 29, 2015 14:13 — forked from anonymous/BirdMan
package crappyBird;
import java.awt.Graphics;
import java.awt.Rectangle;
import java.awt.event.ActionEvent;
import java.awt.event.ActionListener;
import java.awt.image.BufferedImage;
import java.io.IOException;
import java.net.URL;