Christopher Grainger cigrainger

151 followers · 37 following

View GitHub Profile

Recently created

Least recently created

Recently updated

Least recently updated

cigrainger / BE_1.py

Created February 16, 2015 15:05

meanvar

	import numpy as np
	from numpy import random

	m = 1000
	tot_n = np.zeros(m)
	for i in list(range(m)):
	n = 1
	mcint = random.randn(n)
	mean = str(np.mean(mcint)).split('.')
	while mean[1][:3] != '000':

cigrainger / BE_1.py

Created February 16, 2015 15:03

mcint

	import numpy as np
	from numpy import random

	m = 1000
	tot_n = np.zeros(m)
	for i in list(range(m)):
	n = 1
	mcint = random.randn(n)
	mean = str(np.mean(mcint)).split('.')
	while mean[1][:3] != '000':

cigrainger / gist:435b4ec9b67ef7a96b65

Created January 31, 2015 14:35

	import pandas as pd
	import re, string
	import numpy as np
	from scipy.spatial.distance import pdist, squareform, euclidean

	def firmmeans(data,year,key):
	d = data[data['bvdid'].isin(key['bvdid'][key['year']==year].tolist())]
	d[['year']] = d[['year']].astype(int)
	d = d[d['year']<=year]
	cols = [col for col in d.columns.values if col not in ['year','appln_id']]

cigrainger / gist:96c177256f5594d5a444

Created January 13, 2015 19:23

	library(xlsx)
	library(reshape2)
	library(dplyr)
	options(xlsx.datetime.format="yyyy-mm-dd")
	df <- read.xlsx('SPLICE results full - xlsx.xlsx',sheetIndex=2,header=TRUE,stringsAsFactors=FALSE,startRow=3)
	df <- df[-72,]
	id <- df[,1:4]
	sheet1 <- select(df,ends_with('Potential.Contribution.of.Energy.System.Components'))
	sheet2 <- select(df,ends_with('Criticality.of.Energy.System.Components'))
	sheet3 <- select(df,ends_with('Persistence.of.Impacts'))

cigrainger / gist:f367e725e8f33d7e47da

Created December 5, 2014 16:03

	install.packages('stargazer')

	states <- state.name
	# states <- c(states,states)
	states <- rep(times=2,x=states)
	variable <- c(rep('x',50),rep('y',50))

	# Create a dataframe called df consisting of states and variable.
	df <- data.frame(states,variable)

cigrainger / gist:ed51eff3d96a3753a7f3

Created December 5, 2014 14:10

	install.packages('stargazer')

	# states <- state.name
	states <- rep(state.name,2)
	# states <- rep(2,state.name)
	# states1 <- rep(x=state.name,times=2)
	# states2 <- rep(times=2,x=state.name)
	# states1==states2
	variable <- c(rep('x',50),rep('y',50))

cigrainger / gist:ae481df20bac8dfb8b91

Created August 17, 2014 22:51

	import pandas as pd
	import pystan

	df = pd.read_csv('firms.csv')
	df = df.dropna()
	country = pd.Categorical(df.country)
	year = pd.Categorical(df.year)
	nace = pd.Categorical(df.nace)
	bvd_id = pd.Categorical(df.bvd_id)

cigrainger / gist:b04cac5fea921267ddc2

Created August 14, 2014 15:28

	for firm in pd.unique(firms.bvdid):
	firms.ix[((firms.bvdid==firm)&(firms.year==2004)),'stock'] = firms.stock[(firms.bvdid==firm)&(firms.year==2004)] + firms.patents[(firms.bvdid==firm)&(firms.year==2004)]
	for i in range(2005,2014):
	firms.ix[((firms.bvdid==firm)&(firms.year==i)),'stock'] = firms.stock[(firms.bvdid==firm)&(firms.year==i-1)] + firms.patents[(firms.bvdid==firm)&(firms.year==i)]

cigrainger / gist:713008c919c34360d959

Created August 1, 2014 17:22

	COPY (SELECT abstracts FROM patents
	WHERE lang = 'en'
	ORDER BY random()
	LIMIT 10000000)
	TO E'~/randomsample.txt';

cigrainger / gist:8ea5842e9773e57cbdfe

Created July 30, 2014 14:22

	turnover.columns = [x[-4:] if x.startswith('turnover')
	else x
	for x in turnover.columns.values]
	turnover = pd.melt(turnover,id_vars=['bvd_id'],var_name='year',value_name='turnover')
	turnover.year = turnover.year.astype('int')
	turnover.turnover = [np.nan if x == 'n.a.'
	else x
	for x in turnover.turnover]
	turnover.turnover = [str(x).replace(',','') if x != np.nan
	else x