# DQN (NIPS 2015)
import gym
import random
import numpy as np
import skimage
from skimage import transform, color, exposure
from collections import deque
import tensorflow as tf
from keras import backend as K
from keras.models import Sequential
from keras.layers.convolutional import Convolution2D
from keras.layers.core import Dense, Activation, Flatten
from keras.optimizers import Adam
# Module-level hyperparameters. The code that consumes them is outside this
# excerpt, so the notes below are inferred from the names only -- confirm
# each one against its actual use.
ACTIONS = 3  # presumably the number of discrete actions available
GAMMA = 0.99  # presumably the discount factor applied to future rewards
OBSERVE = 320  # presumably steps spent only observing before training
EXPLORE = 200000  # presumably steps over which epsilon is annealed
FINAL_EPSILON = 1e-4  # i.e. 0.0001; smaller of the two epsilon values
INITIAL_EPSILON = 5e-3  # i.e. 0.005; larger of the two epsilon values
REPLAY_M