michaelfeng michaelfeng

💭

Be Happy~

Geek

michaelfeng / suffix-change

Created July 7, 2017 04:41

change file suffix

	import glob, os
	for filename in glob.iglob(os.path.join('.', '*')):
	os.rename(filename, filename + '.jpg')

michaelfeng / bnlstm.py

Created June 20, 2017 09:11 — forked from spitis/bnlstm.py

Batch normalized LSTM Cell for Tensorflow

	"""adapted from https://github.com/OlavHN/bnlstm to store separate population statistics per state"""
	import tensorflow as tf, numpy as np
	RNNCell = tf.nn.rnn_cell.RNNCell

	class BNLSTMCell(RNNCell):
	'''Batch normalized LSTM as described in arxiv.org/abs/1603.09025'''
	def __init__(self, num_units, is_training_tensor, max_bn_steps, initial_scale=0.1, activation=tf.tanh, decay=0.95):
	"""
	* max bn steps is the maximum number of steps for which to store separate population stats
	"""

michaelfeng / pg-pong.py

Created June 15, 2017 09:26 — forked from karpathy/pg-pong.py

Training a Neural Network ATARI Pong agent with Policy Gradients from raw pixels

	""" Trains an agent with (stochastic) Policy Gradients on Pong. Uses OpenAI Gym. """
	import numpy as np
	import cPickle as pickle
	import gym

	# hyperparameters
	H = 200 # number of hidden layer neurons
	batch_size = 10 # every how many episodes to do a param update?
	learning_rate = 1e-4
	gamma = 0.99 # discount factor for reward