thomasjensen

## ebtrust.r
library(ggplot2)

setwd("/path/to/file/")

data <- read.csv("ebAll.csv")

# Parse the date column using the "%y/%m/%d" layout.
data$date <- as.Date(data$date, format = "%y/%m/%d")

# The three answer columns hold strings with a "%" sign; strip the sign and
# convert what is left to numbers.
percent_columns <- c("Tend.to.trust", "Tend.not.to.trust", "DK...Don.t.know")
data[percent_columns] <- lapply(
  data[percent_columns],
  function(column) as.numeric(gsub("%", "", column))
)

## textmining.r
##read in the libraries and set the working directory
library(tm)
library(corrplot)
setwd("/path/to/")

## Read the data (the file is read as latin1) and keep only the rows whose
## `kategori` is one of the four categories listed below.
data <- read.csv("indvandringPolitikken.csv", fileEncoding = "latin1")
## %in% never returns NA, so rows with a missing `kategori` are dropped rather
## than showing up as all-NA rows, which is what chained `==` tests produce.
data <- data[data$kategori %in% c("Politik", "Debat", "Kronikken", "Leder"), ]

##create the corpus and clean it

## rbloggerAnalysis.r
#read the libraries
library(plyr)
library(ggplot2)
library(xtable)

# Set the working directory to where you saved the output.csv file from the previous post
setwd("/.../")

# Read output.csv from the working directory into `data`
data <- read.csv("output.csv")

## extract.py
from BeautifulSoup import BeautifulSoup
import os
import re

path = "/Users/thomasjensen/Documents/RBloggersScrape/download"

# List the download directory and keep only the entries whose name contains
# "post<digits>.html".
listing = [
    name
    for name in os.listdir(path)
    if re.search(r"post\d+\.html", name) is not None
]

# Make the download directory the current working directory.
os.chdir(path)

## download.py
from BeautifulSoup import BeautifulSoup
import mechanize
import time

# Root URL of r-bloggers.com; this is the address opened below.
url = "http://www.r-bloggers.com/"

# Create the mechanize Browser object used to make the request.
br = mechanize.Browser()

# Open the URL with the browser and keep whatever br.open() returns in `page`.
page = br.open(url)

## ft.r
library(plyr)
library(ggplot2)
setwd("/.../")

# Load ft.csv from the working directory.
data <- read.csv("ft.csv")

# Split the rows on the Amendment flag: 1 goes to data.amendment,
# 0 goes to data.final.
data.amendment <- data[data$Amendment == 1, ]
data.final <- data[data$Amendment == 0, ]

# For every Year/Month combination in data.final, count the number of
# distinct Voteid values.
activity <- ddply(
  data.final,
  c("Year", "Month"),
  function(x) data.frame(count = length(unique(x$Voteid)))
)

## vectorize.r
data <- cbind(rnorm(100),rnorm(100),rnorm(100))

# For every row of a numeric matrix, find the entry that deviates most (in
# absolute value) from that row's mean.
#
# mat: a numeric matrix.
#
# Returns a numeric matrix with one row per row of `mat` and three columns:
#   row - the row index in `mat`
#   col - the column index of the largest absolute deviation in that row
#         (the first such column when several tie)
#   val - the size of that deviation
outlierMat <- function(mat) {
  # rowMeans() yields one value per row; because matrices are stored column by
  # column, recycling it in the subtraction pairs each entry with the mean of
  # its own row.
  devs <- abs(mat - rowMeans(mat))
  row <- seq_len(nrow(devs))
  # Search the deviations (not the raw values) and take exactly one column per
  # row, so that positions and values stay aligned row by row.
  col <- max.col(devs, ties.method = "first")
  # Indexing with a two-column (row, col) matrix picks one entry per row.
  val <- devs[cbind(row, col)]
  cbind(row = row, col = col, val = val)
}

## simconf.r
# Set the working directory and load the foreign library
setwd("/.../")
library(foreign)

# Read the Stata file and keep only the rows whose onset is not 4
data <- read.dta("repdata.dta")
data <- data[data$onset != 4, ]

# Estimate the model: a binomial GLM of onset on the covariates listed below
model <- glm(
  onset ~ warl + gdpenl + lpopl1 + lmtnest + ncontig + Oil + nwstate +
    instab + polity2l + ethfrac + relfrac,
  data = data,
  family = "binomial"
)

## applyexample.r
# 100 x 3 matrix of standard-normal draws, filled column by column.
data <- matrix(rnorm(300), ncol = 3)

# For a numeric vector, find the element lying furthest from the vector's mean.
#
# xrow: a numeric vector (for example one row of a matrix).
#
# Returns a length-two vector: the position of the largest absolute deviation
# from the mean, followed by the size of that deviation.
outlier <- function(xrow) {
  deviation <- abs(xrow - mean(xrow))
  furthest <- which.max(deviation)
  c(furthest, deviation[furthest])
}

## tikz.tex
\documentclass{article}

\usepackage{tikz}

\begin{document}

\begin{figure}[ht]
\input{test.tex}
\caption{Sample output from tikzDevice}
\end{figure}
	library(ggplot2)

	setwd("/path/to/file/")

	data <- read.csv("ebAll.csv")

	# Parse the date column using the "%y/%m/%d" layout.
	data$date <- as.Date(data$date, format = "%y/%m/%d")

	# The three answer columns hold strings with a "%" sign; strip the sign and
	# convert what is left to numbers.
	percent_columns <- c("Tend.to.trust", "Tend.not.to.trust", "DK...Don.t.know")
	data[percent_columns] <- lapply(
	  data[percent_columns],
	  function(column) as.numeric(gsub("%", "", column))
	)
	##read in the libraries and set the working directory
	library(tm)
	library(corrplot)
	setwd("/path/to/")

	## Read the data (the file is read as latin1) and keep only the rows whose
	## `kategori` is one of the four categories listed below.
	data <- read.csv("indvandringPolitikken.csv", fileEncoding = "latin1")
	## The category test is written with %in%: it replaces the backslash-escaped
	## pipes, which are not valid R, and it never returns NA, so rows with a
	## missing `kategori` are dropped instead of becoming all-NA rows.
	data <- data[data$kategori %in% c("Politik", "Debat", "Kronikken", "Leder"), ]

	##create the corpus and clean it
	#read the libraries
	library(plyr)
	library(ggplot2)
	library(xtable)

	# Set the working directory to where you saved the output.csv file from the previous post
	setwd("/.../")

	# Read output.csv from the working directory into `data`
	data <- read.csv("output.csv")
	from BeautifulSoup import BeautifulSoup
	import os
	import re

	path = "/Users/thomasjensen/Documents/RBloggersScrape/download"

	# List the download directory and keep only the entries whose name contains
	# "post<digits>.html".
	listing = [
	    name
	    for name in os.listdir(path)
	    if re.search(r"post\d+\.html", name) is not None
	]

	# Make the download directory the current working directory.
	os.chdir(path)
	from BeautifulSoup import BeautifulSoup
	import mechanize
	import time

	# Root URL of r-bloggers.com; this is the address opened below.
	url = "http://www.r-bloggers.com/"

	# Create the mechanize Browser object used to make the request.
	br = mechanize.Browser()

	# Open the URL with the browser and keep whatever br.open() returns in `page`.
	page = br.open(url)
	data <- cbind(rnorm(100),rnorm(100),rnorm(100))

	# For every row of a numeric matrix, find the entry that deviates most (in
	# absolute value) from that row's mean.
	#
	# mat: a numeric matrix.
	#
	# Returns a numeric matrix with one row per row of `mat` and three columns:
	#   row - the row index in `mat`
	#   col - the column index of the largest absolute deviation in that row
	#         (the first such column when several tie)
	#   val - the size of that deviation
	outlierMat <- function(mat) {
	  # rowMeans() yields one value per row; because matrices are stored column
	  # by column, recycling it in the subtraction pairs each entry with the
	  # mean of its own row.
	  devs <- abs(mat - rowMeans(mat))
	  row <- seq_len(nrow(devs))
	  # Search the deviations (not the raw values) and take exactly one column
	  # per row, so that positions and values stay aligned row by row.
	  col <- max.col(devs, ties.method = "first")
	  # Indexing with a two-column (row, col) matrix picks one entry per row.
	  val <- devs[cbind(row, col)]
	  cbind(row = row, col = col, val = val)
	}
	# Set the working directory and load the foreign library
	setwd("/.../")
	library(foreign)

	# Read the Stata file and keep only the rows whose onset is not 4
	data <- read.dta("repdata.dta")
	data <- data[data$onset != 4, ]

	# Estimate the model: a binomial GLM of onset on the covariates listed below
	model <- glm(
	  onset ~ warl + gdpenl + lpopl1 + lmtnest + ncontig + Oil + nwstate +
	    instab + polity2l + ethfrac + relfrac,
	  data = data,
	  family = "binomial"
	)
	# 100 x 3 matrix of standard-normal draws, filled column by column.
	data <- matrix(rnorm(300), ncol = 3)

	# For a numeric vector, find the element lying furthest from the vector's
	# mean.
	#
	# xrow: a numeric vector (for example one row of a matrix).
	#
	# Returns a length-two vector: the position of the largest absolute
	# deviation from the mean, followed by the size of that deviation.
	outlier <- function(xrow) {
	  deviation <- abs(xrow - mean(xrow))
	  furthest <- which.max(deviation)
	  c(furthest, deviation[furthest])
	}
	\documentclass{article}

	\usepackage{tikz}

	\begin{document}

	\begin{figure}[ht]
	\input{test.tex}
	\caption{Sample output from tikzDevice}
	\end{figure}