g-leech · April 17, 2018 10:19
diff --git a/recursive_transition_crawler.py b/recursive_transition_crawler.py
 from ai_safety_gridworlds.environments.shared.safety_game import Actions
 from hashlib import sha1
 import numpy
 import time
 from IPython import display
 import copy

 env = sokoban_game(level=0)
 ACTIONS = [ a for a in Actions if a is not Actions.QUIT ]



 def get_frame(step, x, y):
  color_state = step.observation['RGB']
  return np.moveaxis(color_state, x, y)


 plt.ion()
 plt.axis('off')
 time_step = env.reset()
 im = plt.imshow(get_frame(time_step, 0, -1), animated=True)


 def refresh_screen(step, x=0, y=-1):
  time.sleep(0.6)
  frame = get_frame(step, x, y)
  im.set_data(frame)
  display.clear_output(wait=True)
  display.display(plt.gcf())

  
 def merge_two_dicts(x, y):
    z = x.copy() 
    z.update(y)  
    return z

  
 def hash_board(state) :
    return sha1(state.observation['RGB']).hexdigest()

 initialState = env.reset()


 """
  Returns 
  * transitions, a dict from (state, nextState) to 1 or 0.
  * hashMap, a dict from sha code to RGB state
 """
 def crawl_for_transitions(envir, lastState, hashMap) :
  transitions = {}
  
  for action in ACTIONS:
      frozenEnv = copy.deepcopy(envir)
      nextState = frozenEnv.step(action) 
      lastIndex = hash_board(lastState)
      index = hash_board(nextState)
      if index not in hashMap :
          hashMap[index] = nextState.observation['RGB']

          #refresh_screen(nextState)

          if not lastIndex == index :
              transitions[(lastIndex, action, index)] = 1
              lastState = nextState
              subtransitions, subhashes = crawl_for_transitions(frozenEnv, lastState, hashMap)
              transitions = merge_two_dicts(subtransitions, transitions)
              hashMap = merge_two_dicts(subhashes, hashMap)
          else :
              transitions[(lastIndex, action, index)] = 0
  
  return transitions, hashMap


 hashMap = {}
 transitions, hashMap = crawl_for_transitions(env, initialState, hashMap)
 print(transitions)
 len(hashMap)
	from ai_safety_gridworlds.environments.shared.safety_game import Actions
	from hashlib import sha1
	import numpy
	import time
	from IPython import display
	import copy

	env = sokoban_game(level=0)
	ACTIONS = [ a for a in Actions if a is not Actions.QUIT ]



	def get_frame(step, x, y):
	color_state = step.observation['RGB']
	return np.moveaxis(color_state, x, y)


	plt.ion()
	plt.axis('off')
	time_step = env.reset()
	im = plt.imshow(get_frame(time_step, 0, -1), animated=True)


	def refresh_screen(step, x=0, y=-1):
	time.sleep(0.6)
	frame = get_frame(step, x, y)
	im.set_data(frame)
	display.clear_output(wait=True)
	display.display(plt.gcf())


	def merge_two_dicts(x, y):
	z = x.copy()
	z.update(y)
	return z


	def hash_board(state) :
	return sha1(state.observation['RGB']).hexdigest()

	initialState = env.reset()


	"""
	Returns
	* transitions, a dict from (state, nextState) to 1 or 0.
	* hashMap, a dict from sha code to RGB state
	"""
	def crawl_for_transitions(envir, lastState, hashMap) :
	transitions = {}

	for action in ACTIONS:
	frozenEnv = copy.deepcopy(envir)
	nextState = frozenEnv.step(action)
	lastIndex = hash_board(lastState)
	index = hash_board(nextState)
	if index not in hashMap :
	hashMap[index] = nextState.observation['RGB']

	#refresh_screen(nextState)

	if not lastIndex == index :
	transitions[(lastIndex, action, index)] = 1
	lastState = nextState
	subtransitions, subhashes = crawl_for_transitions(frozenEnv, lastState, hashMap)
	transitions = merge_two_dicts(subtransitions, transitions)
	hashMap = merge_two_dicts(subhashes, hashMap)
	else :
	transitions[(lastIndex, action, index)] = 0

	return transitions, hashMap


	hashMap = {}
	transitions, hashMap = crawl_for_transitions(env, initialState, hashMap)
	print(transitions)
	len(hashMap)
No results found