Jodie Burchell t-redactyl

## loading_in_depression_data.do
* Load the depress dataset from the UCLA server, replacing any data in memory.
use http://www.ats.ucla.edu/stat/stata/library/depress, clear

* Go from wide to long on the dep* variables, one row per subj and occasion.
* j(time) names the occasion index "time" directly instead of the default _j.
reshape long dep, i(subj) j(time)

* Discard the pre variable.
drop pre

## perm_alt_sample_plots.R
# Load required packages.
# library() stops with an error when a package is not installed, whereas
# require() only warns and returns FALSE, letting the script run on and fail
# later at the first ggplot2/gridExtra call.
library(ggplot2)
library(gridExtra)

# Set the colours for the graphs
barfill <- "#4271AE"
barlines <- "#1F3552"
line1 <- "black"
line2 <- "#FF3721"

# Plotting histogram of sample 1

## generate_95CI_around_t_value.R
# Generate the 95% confidence interval: the upper bound is the 97.5th
# percentile of the t distribution with 78 degrees of freedom, and the lower
# bound is its negation.
uci <- qt(0.975, df = 78)
lci <- -uci

## cat_class_1_method.py
def name_print(cat):
    '''Print the name of the cat.

    `cat` is any object exposing a `name` attribute. The sentence is written
    to standard output followed by a newline.
    '''
    # Call form of print: with a single argument this behaves the same on
    # Python 2 and Python 3, while the bare print statement is a SyntaxError
    # on Python 3.
    print("The cat is called %s." % cat.name)

name_print(felix)

## web-scraping.py
import lxml.html
from lxml.cssselect import CSSSelector
import requests

def get_title(node):
    '''
    Extracts the movie title from the URL http://www.timeout.com/london/film/the-50-best-christmas-movies
    taking into account that some titles are tagged as h3, and some as h3 a.
    '''
    h3_elem = node.cssselect('div.feature-item__text h3')[0]

## mysql_setup.sql
-- Create tables

-- ratingsdata: rebuilt from scratch on every run; at most one row per
-- (userid, itemid) pair, enforced by the composite primary key.
DROP TABLE IF EXISTS `ratingsdata`;
CREATE TABLE `ratingsdata` (
    `userid`    INT,
    `itemid`    INT,
    `rating`    INT,
    `timestamp` INT,
    PRIMARY KEY (`userid`, `itemid`)
);

DROP TABLE IF EXISTS movies;

## data_extraction.py
import urllib2
import json
import math

import numpy as np
from pandas import Series, DataFrame
import pandas as pd
import matplotlib.pyplot as plt

def expired_listings(site, searchterm):

## gohan.go
package main

import (
	"fmt"
)

type Saiyan struct {
	Name   string
	Power  int
	Father *Saiyan

## Analyses of resolutions.R
library(ggplot2)

# Resolution categories.
# NOTE(review): presumably used to fix the display order of categories in the
# plots - confirm against the full script.
positions <- c(
  "Travel and Holidays",
  "Finances",
  "Learning and Career",
  "Mental Wellbeing",
  "Relationships",
  "Physical Health"
)

# What are the most popular resolutions?
p1 <- ggplot(twitter_df[twitter_df$Resolution.type != "",], aes(x = Resolution.type, fill = Resolution.type)) +
        geom_bar() +
        coord_flip() +
        ggtitle("Number of tweets by resolution type") +

## remove_numbers.py
# Function designed to strip out all numbers (alphabetic - English only - and numeric) from a string as part of a
# text normalisation process.

# Based on the text2num package (https://github.com/ghewgill/text2num) and using code from
# here (http://stackoverflow.com/questions/25346058/removing-list-of-words-from-a-string)

from string import digits

# List of number terms
nums = ['zero', 'one', 'two', 'three', 'four', 'five', 'six', 'seven', 'eight', 'nine', 'ten', 'eleven',
	use http://www.ats.ucla.edu/stat/stata/library/depress, clear
	reshape long dep, i(subj)
	rename _j time
	drop pre
	# Load required packages
	require(ggplot2); require(gridExtra)

	# Set the colours for the graphs
	barfill <- "#4271AE"
	barlines <- "#1F3552"
	line1 <- "black"
	line2 <- "#FF3721"

	# Plotting histogram of sample 1
	# Generate the 95% confidence interval.
	lci <- -1 * qt(c(.975), 78)
	uci <- qt(c(.975), 78)
	def name_print(cat):
	'''Print the name of the cat.'''
	print "The cat is called %s." % cat.name

	name_print(felix)
	import lxml.html
	from lxml.cssselect import CSSSelector
	import requests

	def get_title(node):
	'''
	Extracts the movie title from the URL http://www.timeout.com/london/film/the-50-best-christmas-movies
	taking into account that some titles are tagged as h3, and some as h3 a.
	'''
	h3_elem = node.cssselect('div.feature-item__text h3')[0]
	-- Create tables
	DROP TABLE IF EXISTS ratingsdata;
	CREATE TABLE ratingsdata (
	userid INT,
	itemid INT,
	rating INT,
	timestamp INT,
	PRIMARY KEY (userid, itemid));

	DROP TABLE IF EXISTS movies;
	import urllib2
	import json
	import math

	import numpy as np
	from pandas import Series, DataFrame
	import pandas as pd
	import matplotlib.pyplot as plt

	def expired_listings(site, searchterm):
	package main

	import (
	"fmt"
	)

	type Saiyan struct {
	Name string
	Power int
	Father *Saiyan
	library(ggplot2)

	positions = c("Travel and Holidays", "Finances", "Learning and Career", "Mental Wellbeing",
	"Relationships", "Physical Health")

	# What are the most popular resolutions?
	p1 <- ggplot(twitter_df[twitter_df$Resolution.type != "",], aes(x = Resolution.type, fill = Resolution.type)) +
	geom_bar() +
	coord_flip() +
	ggtitle("Number of tweets by resolution type") +
	# Function designed to strip out all numbers (alphabetic - English only - and numeric) from a string as part of a
	# text normalisation process.

	# Based on the text2num package (https://github.com/ghewgill/text2num) and using code from
	# here (http://stackoverflow.com/questions/25346058/removing-list-of-words-from-a-string)

	from string import digits

	# List of number terms
	nums = ['zero', 'one', 'two', 'three', 'four', 'five', 'six', 'seven', 'eight', 'nine', 'ten', 'eleven',