This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# Module-private file-name constants. Their consumers are outside this
# excerpt; presumably they are handed to readFile() -- TODO confirm.
_text = 'raw.txt'
_index = 'index.txt'
def readFile(F):
    '''Read a text file and return its lines, stripped of surrounding whitespace.

    F -- path of the file to open in text read mode.

    Returns a list holding one string per line, in file order. Blank lines
    are kept as empty strings; an empty file yields an empty list.
    '''
    with open(F, 'r') as f:
        # str.strip() drops the trailing newline along with any other
        # leading/trailing whitespace on each line.
        return [line.strip() for line in f]
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
""" | |
This script was written to illustrate libraries that could be used to improve upon
the efficiency of a script posted to /r/learnprogramming:

Original script:
https://github.com/aesptux/download-reddit-saved-images/blob/master/script.py

Reddit post:
http://www.reddit.com/r/learnprogramming/comments/14dojd/pythoncode_review_script_to_download_saved_images/
""" | |
from urllib2 import Request, urlopen |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
import praw | |
from collections import Counter | |
# Request options; presumably passed to PRAW listing calls further down
# the script (the consumer is outside this excerpt -- TODO confirm).
params = {'limit': None, 'url_data': {'limit': 100}}

# Running tally, starts empty.
memo = Counter()

# PRAW client constructed with a descriptive user-agent string.
r = praw.Reddit('investigating popular video domains, /u/shaggorama')

# Names of the subreddits iterated over by the loop that follows.
subreddits = ['videos', 'trailers', 'listentothis']
for sub_name in subreddits: | |
subr = r.get_subreddit(sub_name) |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#!/usr/bin/env python | |
import sys | |
import random | |
import argparse | |
import praw | |
import webbrowser | |
# Module-level PRAW client; the user_agent string names this tool, its
# version, its author and its project URL.
r = praw.Reddit(user_agent='AlienFeed v0.1.0 by u/jw989 as seen on Github http://github.com/jawerty/AlienFeed')
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
import praw | |
from collections import Counter | |
import pandas as pd | |
import matplotlib.pyplot as plt | |
# User-agent string handed to PRAW when the client is constructed.
useragent = 'investigating a RAOA post'

# Module-level PRAW client used by the functions defined below.
r = praw.Reddit(useragent)
def get_comments(subm_id='190wmg'): | |
subm=r.get_submission(submission_id=subm_id) |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
import time # just to time the preprocessing step | |
# Module-level containers, both starting empty. How they are filled is
# outside this excerpt; presumably during the preprocessing step that the
# `time` import is there to measure -- TODO confirm.
index = {}
WORDS = set()
map=[' ' #0 | |
,' ' #1 | |
,('a','b','c') #2 | |
,('d','e','f') #3 | |
,('g','h','i') #4 |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
import praw # simple interface to the reddit API, also handles rate limiting of requests | |
import re | |
from collections import deque | |
from time import sleep | |
# Placeholder settings: replace each string with real values before running.
# NOTE(review): avoid committing real credentials to source control.
USERNAME = "Your username here"
PASSWORD = "Your password here"
USERAGENT = "Your useragent string here. It should include your /u/username as a courtesy to reddit"

# Only USERAGENT is used to build the client here; USERNAME and PASSWORD
# are not referenced in the visible lines.
r = praw.Reddit(USERAGENT)
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# Width of the interval spanned by x.
#
# x: a vector accepted by max() and min().
# Returns max(x) - min(x), which is 0 for a single-element vector.
boundingRange <- function(x) {
  max(x) - min(x)
}
# Draw n uniform random values rescaled to the span of x.
#
# n: number of draws, passed straight to runif().
# x: vector whose minimum and width define the target interval.
# Returns runif(n) multiplied by boundingRange(x) and shifted by min(x).
runif_box <- function(n, x) {
  width <- boundingRange(x)
  u <- runif(n)
  u * width + min(x)
}
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
import praw | |
import time | |
import pandas as pd | |
import matplotlib.pyplot as plt | |
from collections import Counter | |
class UserScraper(object): | |
'''Generic utility for investigating redditors''' | |
def __init__(self | |
, username |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
import praw, csv | |
from collections import defaultdict, Counter | |
# your userlogin information here. If you don't provide, the script will prompt
# you for it at the terminal, so no big deal either way. Just a convenience.
USERNAME = ''
PASSWORD = ''

# User-agent string handed to PRAW when the client is constructed.
useragent = 'getting moderators graph by /u/shaggorama'
r = praw.Reddit(useragent)
OlderNewer