I hereby claim:
- I am enkeboll on github.
- I am enkeboll (https://keybase.io/enkeboll) on keybase.
- I have a public key ASAFYSl9y480O-OPtLFBOEA-F5508UFKGk6G3p57BQGk7Qo
To claim this, I am signing this object:
// bookmarklet: prompts for the treasury password, "types" each character through the
// page's PasswordVK handler (presumably its virtual-keyboard function), then submits the form
javascript: (() => { let pw = prompt("Treasury password:"); for (const char of pw.toLowerCase()) { PasswordVK(char); } document.querySelector('input.action[value="Submit"]').click(); })();
# -*- coding: utf-8 -*-
"""Automation demo - Andy.ipynb

Automatically generated by Colaboratory.

Original file is located at
    https://colab.research.google.com/drive/1ehWn8-jcItWIFNFhKWUdZBOF0DAdMvll
"""

"""## Automating the process

First, two important things to do to follow along with the lecture:
"""
# This application computes the top 25 pages on Wikipedia for each of the Wikipedia sub-domains
import argparse
import csv
import datetime
import gzip
import os
import sys
from collections import defaultdict, namedtuple
from heapq import heappush, heappushpop
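
The gist's implementation is truncated after the imports; below is a minimal sketch of the heap-based top-25 selection those imports suggest. The pageviews line format ("domain page views bytes"), the `PageCount` name, and the `top_pages` function are assumptions for illustration, not taken from the gist.

# minimal sketch, assuming each line of a pageviews dump reads
# "<domain> <page> <views> <bytes>"; names here are illustrative
PageCount = namedtuple('PageCount', ['views', 'page'])

def top_pages(lines, n=25):
    heaps = defaultdict(list)  # domain -> bounded min-heap of PageCount entries
    for line in lines:
        domain, page, views, _ = line.split(' ')
        entry = PageCount(int(views), page)
        heap = heaps[domain]
        if len(heap) < n:
            heappush(heap, entry)       # heap not full yet: just add
        else:
            heappushpop(heap, entry)    # push, then evict the smallest of the n+1
    return {d: sorted(h, reverse=True) for d, h in heaps.items()}
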
import datetime
from operator import attrgetter

from ics import Calendar, Event

BREAK_BEGIN = datetime.date(2020, 12, 28)

def runs_over_break(start_date):
    # a course is assumed to span 15 weeks and 5 days from its start date
    return (BREAK_BEGIN > start_date and
            BREAK_BEGIN < start_date + datetime.timedelta(weeks=15, days=5))
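
The rest of the gist is cut off, so the imported `Calendar` and `Event` are never used. A hedged sketch of how they might be wired up with the `ics` package; the event name and output filename are purely hypothetical:

# illustrative only: emit a one-event calendar flagging the break start
c = Calendar()
e = Event()
e.name = "Winter break begins"        # hypothetical event name
e.begin = BREAK_BEGIN.isoformat()
c.events.add(e)
with open('break.ics', 'w') as f:     # hypothetical output file
    f.write(c.serialize())
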
-- redshift
-- COMMAND LINE CONNECT:
--   seatgeek:
--     psql "host=redshift-datawarehouse.service.seatgeek.prod dbname=sganalytic user=andy port=5439"
--   greenhouse:
--     psql "host=redshift.greenhouse.io dbname=greenhouse user=org_978 port=5439 sslmode=require"
-- CREDENTIALS LINE:
CREDENTIALS 'aws_iam_role=arn:aws:iam::093535234988:role/Production-RedshiftCopyUnload'
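
That CREDENTIALS clause plugs into Redshift COPY/UNLOAD statements. A hedged example of using it from Python; the table name and S3 path are placeholders, not from the notes:

# hypothetical COPY using the IAM-role credentials line above;
# `some_table` and the S3 bucket are placeholders
import psycopg2

conn = psycopg2.connect("host=redshift.greenhouse.io dbname=greenhouse "
                        "user=org_978 port=5439 sslmode=require")
with conn, conn.cursor() as cur:
    cur.execute("""
        COPY some_table
        FROM 's3://example-bucket/some_table/'
        CREDENTIALS 'aws_iam_role=arn:aws:iam::093535234988:role/Production-RedshiftCopyUnload'
        FORMAT AS CSV;
    """)
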
# from http://blogs.quovantis.com/how-to-convert-csv-to-parquet-files/
from pyspark import SparkContext
from pyspark.sql import SQLContext
from pyspark.sql.types import StructField, StructType, IntegerType, StringType, TimestampType

if __name__ == "__main__":
    sc = SparkContext(appName="CSV2Parquet")
    sqlContext = SQLContext(sc)
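
The gist stops after creating the SQLContext; a minimal sketch of the conversion step itself, where the schema, column layout, and file paths are assumptions rather than the gist's own:

    # illustrative continuation (not in the gist): schema and paths are assumed
    schema = StructType([
        StructField("id", IntegerType(), True),
        StructField("name", StringType(), True),
    ])
    rdd = (sc.textFile("input.csv")                 # hypothetical input path
             .map(lambda line: line.split(","))
             .map(lambda cols: (int(cols[0]), cols[1])))
    df = sqlContext.createDataFrame(rdd, schema)
    df.write.parquet("output.parquet")              # hypothetical output path
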
create_table = """
DROP TABLE IF EXISTS `dec_test`;
CREATE TABLE `dec_test` (
  `dec_2_2` decimal(4,2),
  `dec_4_2` decimal(6,2),
  `dec_8_4` decimal(8,4),
  `char_15` char(15)
) ENGINE=InnoDB DEFAULT CHARSET=utf8;
insert into dec_test values
  (12.34, 1234.56, 1234.5678, 'fifteen chars!!'),  -- illustrative rows (not in the gist), sized to fit each column
  (99.99, 9999.99, 9999.9999, 'x');
"""
import bisect
import datetime
import operator

import boto3

client = boto3.client('cloudwatch')

def get_metric(offset, metricname, threshold, oper='ge', stat='Average'):
    if offset >= 64:
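
The function body is truncated at that `if`. A hedged guess at its shape, based on the signature and CloudWatch's retention tiers (sub-hour datapoints age out after 63 days, so older offsets need a one-hour period); everything past the `if` is an assumption:

# sketch only: the original body is cut off after `if offset >= 64:`
def get_metric(offset, metricname, threshold, oper='ge', stat='Average'):
    period = 3600 if offset >= 64 else 300          # hourly resolution for old data
    end = datetime.datetime.utcnow() - datetime.timedelta(days=offset)
    resp = client.get_metric_statistics(
        Namespace='AWS/EC2',                        # hypothetical namespace
        MetricName=metricname,
        StartTime=end - datetime.timedelta(days=1),
        EndTime=end,
        Period=period,
        Statistics=[stat],
    )
    compare = getattr(operator, oper)               # e.g. operator.ge
    return [p for p in resp['Datapoints'] if compare(p[stat], threshold)]
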
import csv

import requests
from bs4 import BeautifulSoup

base_url = "http://www.pro-football-reference.com"
next_page = "/super-bowl/i.htm"

# this website doesn't have a "next" button to SB XLIX, for some reason
extra = ['/super-bowl/xlix.htm']

def pair(a, b):
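
The gist ends mid-definition of `pair`. A hedged sketch of the crawl loop that `base_url`, `next_page`, and `extra` imply: follow each page's "next" link and visit the listed extras. The CSS selector and the `crawl` function are illustrative assumptions, not from the gist:

# sketch under assumptions: the "next" link selector is a guess
def crawl(start, extras):
    queue = [start] + extras
    seen = set()
    while queue:
        path = queue.pop(0)
        if path in seen:
            continue
        seen.add(path)
        soup = BeautifulSoup(requests.get(base_url + path).text, 'html.parser')
        yield soup
        nxt = soup.select_one('a.button2.next')  # hypothetical selector
        if nxt:
            queue.append(nxt['href'])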