Skip to content

Instantly share code, notes, and snippets.

@shuozhang1985
Created August 22, 2016 00:26
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save shuozhang1985/df2bdcb3ee74827de0cd02e530072ddf to your computer and use it in GitHub Desktop.
Save shuozhang1985/df2bdcb3ee74827de0cd02e530072ddf to your computer and use it in GitHub Desktop.
# Session setup.
# The read.csv() calls further down use bare file names, so they are resolved
# against the working directory chosen here.
# NOTE(review): this path is specific to the author's machine -- adjust it (or
# launch R from the data folder) before running the script elsewhere.
setwd("~/Desktop/web scraping")
library(ggplot2)     # NOTE(review): not referenced in the visible part of the script
library(data.table)  # dcast() for the long-to-wide reshapes below
library(dygraphs)    # dygraph() / dyOptions() for the interactive charts
library(dplyr)       # %>%, filter(), group_by(), summarise(), arrange(), desc()
# ---- Swimming ---------------------------------------------------------------
# Load the swimming results. The code below relies on the columns Country,
# Score and year being present in the file.
swimming <- read.csv("swimming.txt", header = TRUE, stringsAsFactors = FALSE)
nrow(swimming)
# View() opens a data viewer, which only makes sense in an interactive session;
# skip it when the script is run non-interactively (e.g. via Rscript).
if (interactive()) {
  View(swimming)
}
summary(swimming)

# Mean score per country, highest first; the top 20 are printed for inspection.
ss <- swimming %>%
  dplyr::group_by(Country) %>%
  dplyr::summarise(avgscore = mean(Score)) %>%
  arrange(desc(avgscore))
head(ss, 20)

# Keep only the 15 countries selected for the chart.
swimming1 <- filter(
  swimming,
  Country %in% c(
    "United States", "Australia", "Greece",
    "China", "Ireland", "Japan", "Ukraine",
    "Zimbabwe", "Germany", "Russia", "Hungary",
    "Netherlands", "Bulgaria", "Canada",
    "Great Britain"
  )
)

# Reshape long -> wide: one row per year, one column per country, cells = Score.
# The input is converted to a data.table explicitly so that data.table's own
# dcast method is used; calling dcast() on a plain data.frame depends on a
# redirect to reshape2 that newer data.table releases may no longer perform.
# The result is turned back into a plain data.frame, which is what the
# original call produced.
swimming2 <- as.data.frame(
  data.table::dcast(
    data.table::as.data.table(swimming1[, c("Country", "Score", "year")]),
    year ~ Country,
    value.var = "Score"
  )
)
# Alternative reshape on the Percent column (kept disabled, as in the original):
# swimming3 <- dcast(swimming1[, c("Country", "Percent", "year")],
#                    year ~ Country, value.var = "Percent")
# Optional: treat missing country/year combinations as zero.
# swimming2[is.na(swimming2)] <- 0

# Shared 15-colour palette, one entry per plotted country; it is reused by the
# later charts in this script. Every entry must be a colour the browser can
# resolve:
#   * "amber" is not a CSS colour name, so it is given as a hex code
#     (presumably Material Design amber was intended -- confirm the shade).
#   * "gray" and "grey" are the same CSS colour, so the second one is replaced
#     with "silver" to keep the two series distinguishable.
color <- c(
  "red", "pink", "purple", "indigo", "blue",
  "black", "gray", "teal", "green", "silver",
  "lime", "yellow", "#FFC107", "orange", "brown"
)

# Interactive line chart: x axis = year (first column), one series per country.
dygraph(swimming2) %>%
  dyOptions(colors = color)
# dygraph(swimming3) %>%
#   dyOptions(colors = color)
# ---- Athletics --------------------------------------------------------------
# Load the athletics results. The code below relies on the columns Country,
# Score and year being present in the file.
athletics <- read.csv("athletics.txt", header = TRUE, stringsAsFactors = FALSE)
nrow(athletics)

# Mean score per country, highest first; the top 20 are printed for inspection.
ss1 <- athletics %>%
  dplyr::group_by(Country) %>%
  dplyr::summarise(avgscore = mean(Score)) %>%
  arrange(desc(avgscore))
head(ss1, 20)

# Keep only the 15 countries selected for the chart.
athletics1 <- filter(
  athletics,
  Country %in% c(
    "United States", "Russia", "Kenya", "Great Britain",
    "Germany", "Finland", "Jamaica", "Ethiopia",
    "Poland", "Sweden", "Belarus", "Cuba",
    "Australia", "Romania", "Greece"
  )
)

# Reshape long -> wide: one row per year, one column per country, cells = Score.
# The input is converted to a data.table explicitly so that data.table's own
# dcast method is used; calling dcast() on a plain data.frame depends on a
# redirect to reshape2 that newer data.table releases may no longer perform.
# The result is turned back into a plain data.frame, which is what the
# original call produced.
athletics2 <- as.data.frame(
  data.table::dcast(
    data.table::as.data.table(athletics1[, c("Country", "Score", "year")]),
    year ~ Country,
    value.var = "Score"
  )
)
# Optional: treat missing country/year combinations as zero.
# athletics2[is.na(athletics2)] <- 0

# Interactive line chart: x axis = year (first column), one series per country,
# drawn with the palette `color` defined earlier in this script.
dygraph(athletics2) %>%
  dyOptions(colors = color)
# ---- Gymnastics -------------------------------------------------------------
# Load the gymnastics results. The code below relies on the columns Country,
# Score and year being present in the file.
gymnastics <- read.csv("gymnastics.txt", header = TRUE, stringsAsFactors = FALSE)
nrow(gymnastics)

# Mean score per country, highest first; the top 20 are printed for inspection.
ss2 <- gymnastics %>%
  dplyr::group_by(Country) %>%
  dplyr::summarise(avgscore = mean(Score)) %>%
  arrange(desc(avgscore))
head(ss2, 20)

# Keep only the 15 countries selected for the chart.
gymnastics1 <- filter(
  gymnastics,
  Country %in% c(
    "China", "United States", "Japan", "Russia",
    "Romania", "Switzerland", "Germany", "Italy",
    "Hungary", "Austria", "Greece", "Belarus",
    "Ukraine", "France", "Finland"
  )
)

# Reshape long -> wide: one row per year, one column per country, cells = Score.
# The input is converted to a data.table explicitly so that data.table's own
# dcast method is used; calling dcast() on a plain data.frame depends on a
# redirect to reshape2 that newer data.table releases may no longer perform.
# The result is turned back into a plain data.frame, which is what the
# original call produced.
gymnastics2 <- as.data.frame(
  data.table::dcast(
    data.table::as.data.table(gymnastics1[, c("Country", "Score", "year")]),
    year ~ Country,
    value.var = "Score"
  )
)

# Interactive line chart: x axis = year (first column), one series per country,
# drawn with the palette `color` defined earlier in this script.
dygraph(gymnastics2) %>%
  dyOptions(colors = color)
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment