Skip to content

Instantly share code, notes, and snippets.

@njtierney
Created August 5, 2016 01:20
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save njtierney/e390b8880cec2f5cd787181c90f8773b to your computer and use it in GitHub Desktop.
Save njtierney/e390b8880cec2f5cd787181c90f8773b to your computer and use it in GitHub Desktop.
library(plyr)
library(dplyr)
library(tidyr)
library(visdat)
library(ggplot2)
library(readr)
# Load the public Bible quotations data and take a first look at it.
#
# `lccn` is read as character rather than left to readr's type guessing:
# in the original run it was guessed as an integer, and 857311 rows then
# failed to parse because identifiers such as "sn00063520" are not numeric
# (see the recorded log below). All other columns keep their guessed types.
bible_quote <- read_csv(
  "/Users/tierneyn/Downloads/public-bible-quotations.csv",
  col_types = cols(lccn = col_character())
)
# Log recorded from the original run, made BEFORE `lccn` was overridden
# (kept to document why the override is needed):
# Parsed with column specification:
# cols(
# page = col_character(),
# reference = col_character(),
# prediction = col_character(),
# probability = col_double(),
# book = col_character(),
# chapter = col_integer(),
# verse = col_integer(),
# version = col_character(),
# testament = col_character(),
# lccn = col_integer(),
# date = col_date(format = ""),
# year = col_integer(),
# month = col_integer(),
# state = col_character(),
# title = col_character(),
# url = col_character(),
# multiple_references = col_character()
# )
# |================================================================================| 100% 258 MB
# Warning: 857311 parsing failures.
# row col expected actual
# 8817 lccn an integer sn00063520
# 8818 lccn an integer sn00063520
# 8819 lccn an integer sn00063520
# 8820 lccn an integer sn00063520
# 8821 lccn an integer sn00063520
# .... .... .......... ..........
# See problems(...) for more details.

# Rows x columns of the loaded data.
dim(bible_quote)
# [1] 866127 17

# View(bible_quote)

# Compact per-column summary. The output below is from the original run,
# so `lccn` still appears as <int>; with the override above it is read as
# character instead.
glimpse(bible_quote)
# Observations: 866,127
# Variables: 17
# $ page <chr> "2003260222/18...
# $ reference <chr> "Matthew 11:28...
# $ prediction <chr> "quotation", "...
# $ probability <dbl> 0.8217737, 0.5...
# $ book <chr> "Matthew", "1 ...
# $ chapter <int> 11, 15, 8, 2, ...
# $ verse <int> 28, 46, 9, 14,...
# $ version <chr> "KJV", "KJV", ...
# $ testament <chr> "NT", "NT", "N...
# $ lccn <int> 2003260222, 20...
# $ date <date> 1890-12-20, 1...
# $ year <int> 1890, 1890, 18...
# $ month <int> 12, 12, 12, 12...
# $ state <chr> "Oregon", "Ore...
# $ title <chr> "The Dalles We...
# $ url <chr> "http://chroni...
# $ multiple_references <chr> NA, NA, NA, NA...

# Visual overview of the data frame; the warning below was emitted by this
# call in the original run.
vis_dat(bible_quote)
# Warning message:
# attributes are not identical across measure variables; they will be dropped
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment