📈

Aditya Rastogi thunderInfy

📈

Exploring algorithms which make perception, reasoning and action possible

thunderInfy / problem_parameters.py

Last active October 9, 2019 15:38

thunderInfy / poisson.py

Created October 9, 2019 15:45

	class poisson_:

	def __init__(self, λ):
	self.λ = λ

	ε = 0.01

	# [α , β] is the range of n's for which the pmf value is above ε
	self.α = 0
	state = 1

thunderInfy / exampleλis3.py

Created October 9, 2019 15:55

thunderInfy / location.py

Created October 9, 2019 15:59

	#A class holding the properties of a location together

	class location:
		"""Hold the properties of a location together.

		Attributes set by ``__init__``:
			α: value of lambda for requests.
			β: value of lambda for returns.
			poissonα: ``poisson_`` object built from ``α``.
			poissonβ: ``poisson_`` object built from ``β``.
		"""

		def __init__(self, req, ret):
			"""Store both lambda values and build one ``poisson_`` object per value.

			req: value of lambda for requests.
			ret: value of lambda for returns.
			"""
			self.α = req  # value of lambda for requests
			self.β = ret  # value of lambda for returns
			self.poissonα = poisson_(self.α)
			self.poissonβ = poisson_(self.β)

thunderInfy / imports.py

Last active October 9, 2019 16:02

	#IMPORTS
	import numpy as np
	import matplotlib.pyplot as plt
	import seaborn as sns
	from scipy.stats import poisson
	import sys

	#Problem Parameters
	class jcp:
	@staticmethod

thunderInfy / initialization.py

Created October 9, 2019 17:59

	# Value and policy tables both start out as all zeros, i.e. the initial policy
	# is zero for every state. Each table is square, with jcp.max_cars() + 1
	# entries along each axis; the policy table holds integers.

	value = np.zeros(shape=(jcp.max_cars() + 1, jcp.max_cars() + 1))
	policy = np.zeros_like(value, dtype=int)

thunderInfy / policy_evaluation.py

Created October 9, 2019 19:01

	def expected_reward(state, action):
		"""
		state : It's a pair of integers, # of cars at A and at B
		action : # of cars transferred from A to B, -5 <= action <= 5

		NOTE(review): only the opening of this function is shown here; it
		initialises the reward accumulator and works out the car counts after
		the transfer. Confirm the remainder against the full gist.
		"""
		# The docstring must be the first statement to be picked up as __doc__,
		# so the global declaration comes after it.
		global value

		ψ = 0  # reward

		# Apply the transfer, then clamp each count into [0, jcp.max_cars()].
		new_state = [
			max(min(state[0] - action, jcp.max_cars()), 0),
			max(min(state[1] + action, jcp.max_cars()), 0),
		]

thunderInfy / policy_improvement.py

Created October 9, 2019 19:08

thunderInfy / policy_iteration_loop.py

Created October 9, 2019 19:10

thunderInfy / non_linearities.py

Created October 9, 2019 20:11

	# adding reward for moving cars from one location to another (which is negative)

	# For action > 0, one car is moved by one of Jack's employees for free, so only
	# (action - 1) cars are charged; otherwise all abs(action) cars are charged.
	ψ = ψ + jcp.moving_reward() * ((action - 1) if action > 0 else abs(action))

	# adding reward for second parking lot (which is also negative)

	if new_state[0] > 10: