fauxneticien · November 29, 2022 19:20
diff --git a/reddit.R b/reddit.R
 library(httr)
 library(purrr)
 library(tibble)

 # See also https://bookdown.org/paul/apis_for_social_scientists/reddit-api.html

 # Listing of new posts in r/mentalhealth (limit=100 requested).
 # NOTE(review): `t=day` looks like the time filter Reddit documents for
 # top/controversial listings; it may be ignored by /new -- confirm.
 url <- 'https://www.reddit.com/r/mentalhealth/new.json?t=day&limit=100'

 response <- GET(url, user_agent('Extracting data from Reddit'))

 # Stop on HTTP 4xx/5xx rather than parsing an error body as a listing
 stop_for_status(response)

 # Parse the JSON body into nested R lists
 data <- content(response, type = 'application/json')

 # Figure out what you want to extract from sample (e.g. title).
 # NULL when no posts came back, instead of a subscript-out-of-bounds error.
 sample <- if (length(data$data$children) > 0) {
   data$data$children[[1]]$data
 } else {
   NULL
 }

 # Helpers:
 # sort(names(sample))
 # View(sample)

 # Build one tibble per listing child from its title, selftext and
 # num_comments fields; map_dfr row-binds them into a single data frame.
 df <- purrr::map_dfr(
   .x = data$data$children,
   .f = function(child) {
     fields <- child$data
     tibble(
       title = fields$title,
       text = fields$selftext,
       num_comments = fields$num_comments
     )
   }
 )

 # Preview the first rows
 head(df)
	library(httr)
	library(purrr)
	library(tibble)

	# See also https://bookdown.org/paul/apis_for_social_scientists/reddit-api.html

	# Listing of new posts in r/mentalhealth (limit=100 requested).
	# NOTE(review): `t=day` looks like the time filter Reddit documents for
	# top/controversial listings; it may be ignored by /new -- confirm.
	url <- 'https://www.reddit.com/r/mentalhealth/new.json?t=day&limit=100'

	response <- GET(url, user_agent('Extracting data from Reddit'))

	# Stop on HTTP 4xx/5xx rather than parsing an error body as a listing
	stop_for_status(response)

	# Parse the JSON body into nested R lists
	data <- content(response, type = 'application/json')

	# Figure out what you want to extract from sample (e.g. title).
	# NULL when no posts came back, instead of a subscript-out-of-bounds error.
	sample <- if (length(data$data$children) > 0) {
	  data$data$children[[1]]$data
	} else {
	  NULL
	}

	# Helpers:
	# sort(names(sample))
	# View(sample)

	# Build one tibble per listing child from its title, selftext and
	# num_comments fields; map_dfr row-binds them into a single data frame.
	df <- purrr::map_dfr(
	  .x = data$data$children,
	  .f = function(child) {
	    fields <- child$data
	    tibble(
	      title = fields$title,
	      text = fields$selftext,
	      num_comments = fields$num_comments
	    )
	  }
	)

	# Preview the first rows
	head(df)