Akshay jha akshayjh

## sources.list
# APT package sources, all served from the kali.cs.nctu.edu.tw mirror.
# NOTE(review): the next two entries have a space between the mirror URL and
# the path ("/kali", "/wheezy"), so the path lands in the suite field of the
# "deb uri suite component..." format. This looks like a typo - confirm
# against the mirror layout before relying on these two lines.
deb http://kali.cs.nctu.edu.tw/ /kali main contrib non-free
deb http://kali.cs.nctu.edu.tw/ /wheezy main contrib non-free
# kali-dev suite: binary packages, debian-installer component, and sources.
deb http://kali.cs.nctu.edu.tw/kali kali-dev main contrib non-free
deb http://kali.cs.nctu.edu.tw/kali kali-dev main/debian-installer
deb-src http://kali.cs.nctu.edu.tw/kali kali-dev main contrib non-free
# kali suite: binary packages, debian-installer component, and sources.
deb http://kali.cs.nctu.edu.tw/kali kali main contrib non-free
deb http://kali.cs.nctu.edu.tw/kali kali main/debian-installer
deb-src http://kali.cs.nctu.edu.tw/kali kali main contrib non-free
# kali/updates suite from the kali-security archive: binaries and sources.
deb http://kali.cs.nctu.edu.tw/kali-security kali/updates main contrib non-free
deb-src http://kali.cs.nctu.edu.tw/kali-security kali/updates main contrib non-free

## taxes.py
import sys, re
from string import join
import requests

# Request the Treasurer.aspx page for the parcel number passed as the first
# command-line argument and keep the response body as text.
r = requests.get("http://www.co.kane.il.us/TaxAssessment/Treasurer.aspx?parcelnumber=" + sys.argv[1])
text = r.text

# Regular-expression patterns for fields in the returned HTML.
# They are raw strings so that `\d` reaches the regex engine untouched instead
# of being treated as an (invalid) string escape; the pattern values are
# byte-for-byte what the non-raw literals produced.
# ADDRESS: one group capturing the address text. Inside the character class,
# `,-.` is a range that covers exactly ',', '-' and '.'.
ADDRESS = r"""<span id="lblPropertyAddress[0-9]" style="display:inline-block;">([A-Za-z0-9 ,-.]*)</span><br />"""
# TAXES: groups are (year in the link target, link text that is either a
# four-digit year or "Current Year", numeric amount in the next table cell).
TAXES = r"""TaxYear=(\d\d\d\d)">(\d\d\d\d|Current Year)</a></td><td>([0-9.]*)</td>"""
# RATE: one group capturing the numeric text of the lblTaxRate span.
RATE = r"""<span id="lblTaxRate" style="display:inline-block;"><font face="Arial">([0-9.]*)</font></span><br />"""

## WebScrape.R
# NOTE(review): wiping the global environment from inside a script is
# discouraged because it clobbers the caller's session; it is kept here only
# to preserve the script's existing behaviour.
# `all.names` is spelled out in full instead of relying on partial matching
# of `all`; it makes ls() include names that start with a dot.
rm(list = ls(all.names = TRUE)) # CLEAR WORKSPACE
library(quantmod)
library(XML)

# Scrape data from the website: parse the HTML tables found on the page.
rawPMI <- readHTMLTable("http://www.ism.ws/ISMReport/content.cfm?ItemNumber=10752")
# Fail with a clear message instead of "subscript out of bounds" when the
# page yielded no tables.
if (length(rawPMI) == 0) {
  stop("No HTML tables found on the ISM report page", call. = FALSE)
}
# Keep the first table and label its first column.
PMI <- data.frame(rawPMI[[1]])
names(PMI)[1] <- "Year"

#Reshape

## FacebookFromR.r
###############################################################################################
##                                                                                           ##
##           Setup                                                                           ##
##                                                                                           ##
###############################################################################################

# install.packages("Rfacebook")  # from CRAN
# install.packages("Rook")  # from CRAN
# install.packages("igraph") # from CRAN

## ml-with-c50-credits.R
# Download data set via:
#   http://archive.ics.uci.edu/ml/datasets/Statlog+%28German+Credit+Data%29
#
# Note, the example below uses the pre-processed data that is used in the book 'Machine Learning with R' by Brett Lantz

library(C50)

# Load the credit data; character columns are read in as factors.
df <- read.csv("credit.csv", stringsAsFactors = TRUE)
# Fix the RNG seed so the shuffle below is reproducible.
set.seed(12345)
# Shuffle the rows by ordering on one uniform random draw per row.
# nrow(df) replaces the literal 1000: the result is identical for a 1000-row
# file, and other sizes no longer produce NA rows or silently drop rows.
df_rand <- df[order(runif(nrow(df))), ]

## example1.py
import nltk

# Read the whole sample document into memory.
with open('sample.txt', 'r') as f:
    sample = f.read()

# Pipeline: split the text into sentences, tokenize each sentence into words,
# tag each token list, then pass the tagged sentences to nltk.ne_chunk_sents.
sentences = nltk.sent_tokenize(sample)
tokenized_sentences = list(map(nltk.word_tokenize, sentences))
tagged_sentences = list(map(nltk.pos_tag, tokenized_sentences))
chunked_sentences = nltk.ne_chunk_sents(tagged_sentences, binary=True)

## pos_tagging.py
#Script tags POS and NER[Named Entity Recognition] for a supplied text file.
#Date: Nov 2 2012
#Author: Hota Sobhan

import nltk

# Read every line of the input file into a list.
# The path is a raw string so the backslashes of the Windows path stay literal
# rather than being parsed as (invalid) escape sequences; the `with` block
# closes the file handle once the lines have been read.
with open(r'C:\Python27\Test_File.txt') as f:
    data = f.readlines()

#Parse the text file for NER with POS Tagging

## nltk_tokenize_tag_chunk.rst

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                akshayjh
                / nltk_tokenize_tag_chunk.rst
            
            
              Created
              March 22, 2017 03:57
                — forked from japerk/nltk_tokenize_tag_chunk.rst
            
              
                NLTK Tokenization, Tagging, Chunking, Treebank
              
          
    Sentence Tokenization

>>> from nltk import tokenize
>>> para = "Hello. My name is Jacob. Today you'll be learning NLTK."
>>> sents = tokenize.sent_tokenize(para)
>>> sents
['Hello.', 'My name is Jacob.', "Today you'll be learning NLTK."]

  
## convert_csv_to_json
def convertCSVtoJSON(input): #pass the name of the input csv file
	"""Convert a CSV file to newline-delimited JSON.

	Every row of the CSV (including the first one, since the field names
	are supplied here rather than read from the file) becomes a dict keyed
	by field1, field2, field3 and is written as one JSON object per line
	to the file '.tempJSON' in the current working directory. That file is
	opened in write mode, so any previous content is replaced.

	Args:
		input: path of the CSV file to read.

	Returns:
		None.
	"""
	# Local imports keep the function usable even if the enclosing module
	# does not import these at the top.
	import csv
	import json

	# DictReader needs a sequence of names. The previous single string
	# "field1,field2,field3" was iterated character by character, so rows
	# were keyed by 'f', 'i', 'e', ... instead of the intended names.
	fieldnames = ("field1", "field2", "field3")
	# Context managers close both files even if reading or dumping fails.
	with open(input, 'r') as f, open('.tempJSON', 'w') as j:
		reader = csv.DictReader(f, fieldnames)
		for row in reader:
			json.dump(row, j)
			j.write('\n')

## gist:aa8cda2a287fc3dff34a2f04cdcc525f

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                akshayjh
                / gist:aa8cda2a287fc3dff34a2f04cdcc525f
            
            
              Created
              May 11, 2017 10:27
                — forked from folkengine/gist:f019c2dee3f6c3ab6345
            
              
                Neo4j Linked Data Links
              
          
    http://www.neo4j.org/develop/linked_data
http://neo4j.com/blog/and-now-for-something-completely-different-using-owl-with-neo4j/?_ga=1.82889430.1907739431.1411998329
http://losangelesindustries.tumblr.com/post/41701508265/loading-dbpedia-into-neo4j-with-clojure
http://michaelbloggs.blogspot.de/2013/05/importing-ttl-turtle-ontologies-in-neo4j.html
http://www.neo4j.org/develop/clojure
	# APT package sources, all served from the kali.cs.nctu.edu.tw mirror.
	# NOTE(review): the next two entries have a space between the mirror URL
	# and the path ("/kali", "/wheezy"), so the path lands in the suite field.
	# This looks like a typo - confirm against the mirror layout.
	deb http://kali.cs.nctu.edu.tw/ /kali main contrib non-free
	deb http://kali.cs.nctu.edu.tw/ /wheezy main contrib non-free
	# kali-dev suite: binary packages, debian-installer component, and sources.
	deb http://kali.cs.nctu.edu.tw/kali kali-dev main contrib non-free
	deb http://kali.cs.nctu.edu.tw/kali kali-dev main/debian-installer
	deb-src http://kali.cs.nctu.edu.tw/kali kali-dev main contrib non-free
	# kali suite: binary packages, debian-installer component, and sources.
	deb http://kali.cs.nctu.edu.tw/kali kali main contrib non-free
	deb http://kali.cs.nctu.edu.tw/kali kali main/debian-installer
	deb-src http://kali.cs.nctu.edu.tw/kali kali main contrib non-free
	# kali/updates suite from the kali-security archive: binaries and sources.
	deb http://kali.cs.nctu.edu.tw/kali-security kali/updates main contrib non-free
	deb-src http://kali.cs.nctu.edu.tw/kali-security kali/updates main contrib non-free
	import sys, re
	from string import join
	import requests

	# Request the Treasurer.aspx page for the parcel number passed as the first
	# command-line argument and keep the response body as text.
	r = requests.get("http://www.co.kane.il.us/TaxAssessment/Treasurer.aspx?parcelnumber=" + sys.argv[1])
	text = r.text

	# Regular-expression patterns for fields in the returned HTML, written as
	# raw strings so `\d` is not treated as an (invalid) string escape.
	# ADDRESS: one group capturing the address text. Inside the character
	# class, `,-.` is a range that covers exactly ',', '-' and '.'.
	ADDRESS = r"""<span id="lblPropertyAddress[0-9]" style="display:inline-block;">([A-Za-z0-9 ,-.]*)</span><br />"""
	# TAXES: the second group is an alternation between a four-digit year and
	# "Current Year". The pipe must be unescaped: `\|` matched a literal '|'
	# character, so the pattern could never match the link text.
	TAXES = r"""TaxYear=(\d\d\d\d)">(\d\d\d\d|Current Year)</a></td><td>([0-9.]*)</td>"""
	# RATE: one group capturing the numeric text of the lblTaxRate span.
	RATE = r"""<span id="lblTaxRate" style="display:inline-block;"><font face="Arial">([0-9.]*)</font></span><br />"""
	# NOTE(review): wiping the global environment from inside a script is
	# discouraged because it clobbers the caller's session; it is kept here
	# only to preserve the script's existing behaviour.
	# `all.names` is spelled out in full instead of relying on partial
	# matching of `all`; it makes ls() include names that start with a dot.
	rm(list = ls(all.names = TRUE)) # CLEAR WORKSPACE
	library(quantmod)
	library(XML)

	# Scrape data from the website: parse the HTML tables found on the page.
	rawPMI <- readHTMLTable("http://www.ism.ws/ISMReport/content.cfm?ItemNumber=10752")
	# Fail with a clear message instead of "subscript out of bounds" when the
	# page yielded no tables.
	if (length(rawPMI) == 0) {
	  stop("No HTML tables found on the ISM report page", call. = FALSE)
	}
	# Keep the first table and label its first column.
	PMI <- data.frame(rawPMI[[1]])
	names(PMI)[1] <- "Year"

	#Reshape
	###############################################################################################
	## ##
	## Setup ##
	## ##
	###############################################################################################

	# install.packages("Rfacebook") # from CRAN
	# install.packages("Rook") # from CRAN
	# install.packages("igraph") # from CRAN
	# Download data set via:
	# http://archive.ics.uci.edu/ml/datasets/Statlog+%28German+Credit+Data%29
	#
	# Note, the example below uses the pre-processed data that is used in the book 'Machine Learning with R' by Brett Lantz

	library(C50)

	# Load the credit data; character columns are read in as factors.
	df <- read.csv("credit.csv", stringsAsFactors = TRUE)
	# Fix the RNG seed so the shuffle below is reproducible.
	set.seed(12345)
	# Shuffle the rows by ordering on one uniform random draw per row.
	# nrow(df) replaces the literal 1000: identical for a 1000-row file, and
	# other sizes no longer produce NA rows or silently drop rows.
	df_rand <- df[order(runif(nrow(df))), ]
	import nltk

	# Read the whole sample document into memory. The read must be indented
	# under the `with` statement; at the same level it is a syntax error.
	with open('sample.txt', 'r') as f:
	    sample = f.read()

	# Pipeline: split the text into sentences, tokenize each sentence into
	# words, tag each token list, then pass the tagged sentences to
	# nltk.ne_chunk_sents.
	sentences = nltk.sent_tokenize(sample)
	tokenized_sentences = [nltk.word_tokenize(sentence) for sentence in sentences]
	tagged_sentences = [nltk.pos_tag(sentence) for sentence in tokenized_sentences]
	chunked_sentences = nltk.ne_chunk_sents(tagged_sentences, binary=True)
	#Script tags POS and NER[Named Entity Recognition] for a supplied text file.
	#Date: Nov 2 2012
	#Author: Hota Sobhan

	import nltk

	# Read every line of the input file into a list.
	# The path is a raw string so the backslashes of the Windows path stay
	# literal rather than being parsed as (invalid) escape sequences; the
	# `with` block closes the file handle once the lines have been read.
	with open(r'C:\Python27\Test_File.txt') as f:
	    data = f.readlines()

	#Parse the text file for NER with POS Tagging
	def convertCSVtoJSON(input): #pass the name of the input csv file
		"""Convert a CSV file to newline-delimited JSON.

		Every row of the CSV (including the first one, since the field
		names are supplied here rather than read from the file) becomes a
		dict keyed by field1, field2, field3 and is written as one JSON
		object per line to the file '.tempJSON' in the current working
		directory. That file is opened in write mode, so any previous
		content is replaced.

		Args:
			input: path of the CSV file to read.

		Returns:
			None.
		"""
		# Local imports keep the function usable even if the enclosing
		# module does not import these at the top.
		import csv
		import json

		# DictReader needs a sequence of names. The previous single string
		# "field1,field2,field3" was iterated character by character, so
		# rows were keyed by 'f', 'i', 'e', ... instead of the intended names.
		fieldnames = ("field1", "field2", "field3")
		# Context managers close both files even if reading or dumping
		# fails. The function and loop bodies are indented again here; the
		# flattened version was not valid Python.
		with open(input, 'r') as f, open('.tempJSON', 'w') as j:
			reader = csv.DictReader(f, fieldnames)
			for row in reader:
				json.dump(row, j)
				j.write('\n')