Skip to content

Instantly share code, notes, and snippets.

View Shmuma's full-sized avatar

Max Lapan Shmuma

View GitHub Profile
Uses ptan library: https://github.com/Shmuma/rl/blob/ptan/ptan/samples/dqn_expreplay.py
Config for the run: https://github.com/Shmuma/rl/blob/ptan/ptan/samples/runs/dqn_exp_cartpole.ini
Cross-entropy method with dense NN 40+40
https://github.com/Shmuma/Practical_RL/blob/master/week1/MountainCar-xentropy.ipynb
Cross-entropy method
https://github.com/Shmuma/Practical_RL/blob/master/week1/taxi_crossentropy.ipynb
Genetic algorithm with mutation probability decay.
https://github.com/Shmuma/Practical_RL/blob/master/week0/frozen-8x8.ipynb
https://github.com/Shmuma/rl/blob/master/algos/a3c_async.py
Slow version: https://github.com/Shmuma/rl/blob/master/test-1/a3c_atari.py
@Shmuma
Shmuma / A3C
Created February 14, 2017 16:07
#!/usr/bin/env python
# Quick-n-dirty implementation of Advantage Actor-Critic method from https://arxiv.org/abs/1602.01783
import argparse
import logging
import numpy as np
from rl_lib.wrappers import HistoryWrapper
logger = logging.getLogger()
#!/usr/bin/env python
# Multi-layer perceptron inspired by this: https://gym.openai.com/evaluations/eval_P4KyYPwIQdSg6EqvHgYjiw
# https://gist.githubusercontent.com/anonymous/d829ec2f8bda088ac897aa2055dcd3a8/raw/d3fcdfdcc9038bf24385589e94939dcd3c198349/crossentropy_method.py
import gym
import argparse
from gym import wrappers
import numpy as np
from keras.models import Sequential
from keras.layers import Dense, Activation
#!/usr/bin/env python
# Multi-layer perceptron inspired by this: https://gym.openai.com/evaluations/eval_P4KyYPwIQdSg6EqvHgYjiw
# https://gist.githubusercontent.com/anonymous/d829ec2f8bda088ac897aa2055dcd3a8/raw/d3fcdfdcc9038bf24385589e94939dcd3c198349/crossentropy_method.py
import gym
import argparse
from gym import wrappers
import numpy as np
from keras.models import Sequential
from keras.layers import Dense, Activation
#!/usr/bin/env python
# Multi-layer perceptron inspired by this: https://gym.openai.com/evaluations/eval_P4KyYPwIQdSg6EqvHgYjiw
# https://gist.githubusercontent.com/anonymous/d829ec2f8bda088ac897aa2055dcd3a8/raw/d3fcdfdcc9038bf24385589e94939dcd3c198349/crossentropy_method.py
import gym
import argparse
from gym import wrappers
import numpy as np
from keras.models import Sequential
from keras.layers import Dense, Activation