Created
August 5, 2016 01:20
-
-
Save njtierney/e390b8880cec2f5cd787181c90f8773b to your computer and use it in GitHub Desktop.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# Exploratory look at the "public-bible-quotations" CSV: load it, check its
# dimensions and column types, then visualise the whole data frame with
# visdat.

# plyr is attached before dplyr so that dplyr's verbs are the ones on top.
library(plyr)
library(dplyr)
library(tidyr)
library(visdat)
library(ggplot2)
library(readr)

# `lccn` contains identifiers such as "sn00063520" alongside all-digit values.
# When readr was left to guess the type it chose integer, and the original run
# reported:
#
#   Warning: 857311 parsing failures.
#    row  col   expected     actual
#   8817 lccn an integer sn00063520
#   8818 lccn an integer sn00063520
#   8819 lccn an integer sn00063520
#   8820 lccn an integer sn00063520
#   8821 lccn an integer sn00063520
#   .... .... .......... ..........
#   See problems(...) for more details.
#
# Declaring `lccn` as character keeps those identifiers instead of failing to
# parse them. Every other column is still guessed; the original run guessed:
#
#   page = col_character(),       reference = col_character(),
#   prediction = col_character(), probability = col_double(),
#   book = col_character(),       chapter = col_integer(),
#   verse = col_integer(),        version = col_character(),
#   testament = col_character(),  date = col_date(format = ""),
#   year = col_integer(),         month = col_integer(),
#   state = col_character(),      title = col_character(),
#   url = col_character(),        multiple_references = col_character()
#
# The file is large (the original progress bar reported 258 MB).
bible_quote <- read_csv(
  "/Users/tierneyn/Downloads/public-bible-quotations.csv",
  col_types = cols(lccn = col_character())
)

# Show any parsing failures that remain after the `lccn` fix.
# NOTE(review): the original warning only displayed `lccn` rows; confirm that
# no other column contributes failures.
problems(bible_quote)

dim(bible_quote)
# [1] 866127     17

# View(bible_quote)

glimpse(bible_quote)
# Output recorded from the original run, in which `lccn` was still read as
# <int>; with the column type above it is read as <chr>.
#
# Observations: 866,127
# Variables: 17
# $ page                <chr> "2003260222/18...
# $ reference           <chr> "Matthew 11:28...
# $ prediction          <chr> "quotation", "...
# $ probability         <dbl> 0.8217737, 0.5...
# $ book                <chr> "Matthew", "1 ...
# $ chapter             <int> 11, 15, 8, 2, ...
# $ verse               <int> 28, 46, 9, 14,...
# $ version             <chr> "KJV", "KJV", ...
# $ testament           <chr> "NT", "NT", "N...
# $ lccn                <int> 2003260222, 20...
# $ date                <date> 1890-12-20, 1...
# $ year                <int> 1890, 1890, 18...
# $ month               <int> 12, 12, 12, 12...
# $ state               <chr> "Oregon", "Ore...
# $ title               <chr> "The Dalles We...
# $ url                 <chr> "http://chroni...
# $ multiple_references <chr> NA, NA, NA, NA...

vis_dat(bible_quote)
# Warning message recorded from the original run:
# attributes are not identical across measure variables; they will be dropped
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment