DocVaughan
diff --git a/‎OpenAI Gym/openAI_montior_processing.py
+131 b/‎OpenAI Gym/openAI_montior_processing.py
+131
diff --git a/‎OpenAI Gym/openAI_planarCrane_episodeDataProcessing.py
+169 b/‎OpenAI Gym/openAI_planarCrane_episodeDataProcessing.py
+169
diff --git a/‎OpenAI Gym/openAI_planarCrane_test.py
+11-7 b/‎OpenAI Gym/openAI_planarCrane_test.py
+11-7
@@ -0,0 +1,131 @@
+#! /usr/bin/env python
+
+###############################################################################
+# openAI_montior_processing.py
+#
+# Script to process the json data generated by the monitoring wrapper on 
+# OpenAI gym environments.
+#
+# NOTE: Any plotting is set up for output, not viewing on screen.
+#       So, it will likely be ugly on screen. The saved PDFs should look
+#       better.
+#
+# Created: 07/12/17
+#   - Joshua Vaughan
+#   - [email protected]
+#   - http://www.ucs.louisiana.edu/~jev9637
+#
+# Modified:
+#   * 
+#
+# TODO:
+#   * 
+###############################################################################
+
+import numpy as np
+import matplotlib.pyplot as plt
+
+import json # the data files generated are json
+
+# TODO: 07/12/17 - JEV - Add GUI, argparse, or CLI for selecting file
+FILENAME = "example_data/duel_dqn_planar_crane-v0_monitor_2048_4_100000_2017-07-12_185754/openaigym.episode_batch.0.37814.stats.json"
+
+
+# Load the monitor statistics file; the parsed result is indexed by key below
+with open(FILENAME) as data_file:
+    data = json.load(data_file)
+
+# These are the key fields that we're interested in plotting. Call
+# data.keys() to see the others. Time is shifted so the first entry is zero.
+time = np.array(data['timestamps']) - data['timestamps'][0]
+rewards = np.array(data['episode_rewards'])
+episode_lengths = np.array(data['episode_lengths'])
+
+
+
+
+#----- Plot reward vs computation time -----
+# Create a 6x4 figure (3x2 aspect ratio is best) and grab its axes
+fig = plt.figure(figsize=(6,4))
+ax = plt.gca()
+plt.subplots_adjust(bottom=0.17, left=0.17, top=0.96, right=0.96)
+
+# Set the tick-label font size on both axes
+plt.setp(ax.get_ymajorticklabels(),fontsize=18)
+plt.setp(ax.get_xmajorticklabels(),fontsize=18)
+# Hide the right and top spines so only the left and bottom ones are drawn
+ax.spines['right'].set_color('none')
+ax.spines['top'].set_color('none')
+# Put the tick marks only on the two remaining spines
+ax.xaxis.set_ticks_position('bottom')
+ax.yaxis.set_ticks_position('left')
+
+# Turn on a dotted, light-gray grid and keep it below the plotted data
+ax.grid(True,linestyle=':', color='0.75')
+ax.set_axisbelow(True)
+
+# Define the X and Y axis labels
+plt.xlabel('Computation Time (s)', fontsize=22, weight='bold', labelpad=5)
+plt.ylabel('Reward', fontsize=22, weight='bold', labelpad=10)
+ 
+plt.plot(time, rewards, linewidth=2, linestyle='-', label=r'Data 1')
+
+# Uncomment below and set the axis limits if needed
+# plt.xlim(0,5)
+# plt.ylim(0,10)
+
+# Create the legend, then fix the fontsize (disabled; uncomment to enable)
+# leg = plt.legend(loc='upper right', ncol = 1, fancybox=True)
+# ltext  = leg.get_texts()
+# plt.setp(ltext,fontsize=18)
+# Tighten the layout to fill the figure (pad is a fraction of the font size).
+# NOTE(review): this likely supersedes the subplots_adjust margins set above.
+plt.tight_layout(pad=0.5)
+
+# Save the figure as a high-res pdf in the current folder (disabled)
+# plt.savefig('plot_filename.pdf')
+
+
+#----- Plot reward vs episode number -----
+# Create a 6x4 figure (3x2 aspect ratio is best) and grab its axes
+fig = plt.figure(figsize=(6,4))
+ax = plt.gca()
+plt.subplots_adjust(bottom=0.17, left=0.17, top=0.96, right=0.96)
+
+# Set the tick-label font size on both axes
+plt.setp(ax.get_ymajorticklabels(),fontsize=18)
+plt.setp(ax.get_xmajorticklabels(),fontsize=18)
+# Hide the right and top spines so only the left and bottom ones are drawn
+ax.spines['right'].set_color('none')
+ax.spines['top'].set_color('none')
+# Put the tick marks only on the two remaining spines
+ax.xaxis.set_ticks_position('bottom')
+ax.yaxis.set_ticks_position('left')
+
+# Turn on a dotted, light-gray grid and keep it below the plotted data
+ax.grid(True,linestyle=':', color='0.75')
+ax.set_axisbelow(True)
+
+# Define the X and Y axis labels
+plt.xlabel('Episode', fontsize=22, weight='bold', labelpad=5)
+plt.ylabel('Reward', fontsize=22, weight='bold', labelpad=10)
+ 
+plt.plot(rewards, linewidth=2, linestyle='-', label=r'Data 1')
+# No x data is passed above, so rewards are plotted against their array index
+# Uncomment below and set the axis limits if needed
+# plt.xlim(0,5)
+# plt.ylim(0,10)
+
+# Create the legend, then fix the fontsize (disabled; uncomment to enable)
+# leg = plt.legend(loc='upper right', ncol = 1, fancybox=True)
+# ltext  = leg.get_texts()
+# plt.setp(ltext,fontsize=18)
+# Tighten the layout to fill the figure (pad is a fraction of the font size).
+# NOTE(review): this likely supersedes the subplots_adjust margins set above.
+plt.tight_layout(pad=0.5)
+
+# Save the figure as a high-res pdf in the current folder (disabled)
+# plt.savefig('plot_filename.pdf')
+
+# Show every figure created above
+plt.show()
@@ -0,0 +1,169 @@
+#! /usr/bin/env python
+
+###############################################################################
+# openAI_planarCrane_episodeDataProcessing.py
+#
+# script to process the episode data saved in the CRAWLAB planar_crane
+# OpenAI gym environment
+#
+# NOTE: Any plotting is set up for output, not viewing on screen.
+#       So, it will likely be ugly on screen. The saved PDFs should look
+#       better.
+#
+# Created: 07/12/17
+#   - Joshua Vaughan
+#   - [email protected]
+#   - http://www.ucs.louisiana.edu/~jev9637
+#
+# Modified:
+#   * 
+#
+# TODO:
+#   * 
+###############################################################################
+
+import numpy as np
+import matplotlib.pyplot as plt
+
+FILENAME = 'example_data/EpisodeData_2017-07-12_142149.csv'
+CABLE_LENGTH = 2.0  # presumably meters, to match the position plot - TODO confirm
+
+# Files have data saved as comma-separated columns, in this order:
+# Time (s), Angle (rad), Angular Vel (rad/s), Trolley Pos (m), Trolley Vel (m/s), Trolley Accel (m/s^2), Reward
+# 
+# We'll unpack that data, one array per column, inline with opening the file
+t, theta, theta_dot, x, x_dot, x_ddot, reward = np.loadtxt(FILENAME, delimiter=',', unpack=True)
+
+
+# ---- Plot the payload angle -------------------------------------------------
+# Create a 6x4 figure (3x2 aspect ratio is best) and grab its axes
+fig = plt.figure(figsize=(6,4))
+ax = plt.gca()
+plt.subplots_adjust(bottom=0.17, left=0.17, top=0.96, right=0.96)
+
+# Set the tick-label font size on both axes
+plt.setp(ax.get_ymajorticklabels(),fontsize=18)
+plt.setp(ax.get_xmajorticklabels(),fontsize=18)
+# Hide the right and top spines so only the left and bottom ones are drawn
+ax.spines['right'].set_color('none')
+ax.spines['top'].set_color('none')
+# Put the tick marks only on the two remaining spines
+ax.xaxis.set_ticks_position('bottom')
+ax.yaxis.set_ticks_position('left')
+
+# Turn on a dotted, light-gray grid and keep it below the plotted data
+ax.grid(True,linestyle=':', color='0.75')
+ax.set_axisbelow(True)
+
+# Define the X and Y axis labels
+plt.xlabel('Time (s)', fontsize=22, weight='bold', labelpad=5)
+plt.ylabel('Angle (deg)', fontsize=22, weight='bold', labelpad=10)
+ 
+plt.plot(t, theta*180/np.pi, linewidth=2, linestyle='-', label=r'Data 1')  # rad -> deg
+# plt.plot(t, y2, linewidth=2, linestyle='--', label=r'Data 2')
+
+# Uncomment below and set the axis limits if needed
+# plt.xlim(0,5)
+# plt.ylim(0,10)
+
+# Create the legend, then fix the fontsize (disabled; uncomment to enable)
+# leg = plt.legend(loc='upper right', ncol = 1, fancybox=True)
+# ltext  = leg.get_texts()
+# plt.setp(ltext,fontsize=18)
+# Tighten the layout to fill the figure (pad is a fraction of the font size).
+# NOTE(review): this likely supersedes the subplots_adjust margins set above.
+plt.tight_layout(pad=0.5)
+
+# Save the figure as a high-res pdf in the current folder (disabled)
+# plt.savefig('OpenAI_planarCrane_angle.pdf')
+
+
+# ----- Plot the position of the payload --------------------------------------
+# Create a 6x4 figure (3x2 aspect ratio is best) and grab its axes
+fig = plt.figure(figsize=(6,4))
+ax = plt.gca()
+plt.subplots_adjust(bottom=0.17, left=0.17, top=0.96, right=0.96)
+
+# Set the tick-label font size on both axes
+plt.setp(ax.get_ymajorticklabels(),fontsize=18)
+plt.setp(ax.get_xmajorticklabels(),fontsize=18)
+# Hide the right and top spines so only the left and bottom ones are drawn
+ax.spines['right'].set_color('none')
+ax.spines['top'].set_color('none')
+# Put the tick marks only on the two remaining spines
+ax.xaxis.set_ticks_position('bottom')
+ax.yaxis.set_ticks_position('left')
+
+# Turn on a dotted, light-gray grid and keep it below the plotted data
+ax.grid(True,linestyle=':', color='0.75')
+ax.set_axisbelow(True)
+
+# Define the X and Y axis labels
+plt.xlabel('Time (s)', fontsize=22, weight='bold', labelpad=5)
+plt.ylabel('Position (m)', fontsize=22, weight='bold', labelpad=10)
+# NOTE(review): payload sign (x - L*sin(theta)) assumes the env's angle convention - confirm
+plt.plot(t, x, linewidth=2, linestyle='--', label=r'Trolley') 
+plt.plot(t, x - CABLE_LENGTH * np.sin(theta), linewidth=2, linestyle='-', label=r'Payload')
+
+# Uncomment below and set the axis limits if needed
+# plt.xlim(0,5)
+# plt.ylim(0,10)
+
+# Create the legend (location left to matplotlib), then fix the fontsize
+leg = plt.legend(ncol = 1, fancybox=True) #, loc='upper right')
+ltext  = leg.get_texts()
+plt.setp(ltext,fontsize=18)
+
+# Tighten the layout to fill the figure (pad is a fraction of the font size)
+plt.tight_layout(pad=0.5)
+
+# Save the figure as a high-res pdf in the current folder (disabled)
+# plt.savefig('OpenAI_planarCrane_position.pdf')
+
+
+
+
+
+# ----- Plot the acceleration input -------------------------------------------
+# Create a 6x4 figure (3x2 aspect ratio is best) and grab its axes
+fig = plt.figure(figsize=(6,4))
+ax = plt.gca()
+plt.subplots_adjust(bottom=0.17, left=0.17, top=0.96, right=0.96)
+
+# Set the tick-label font size on both axes
+plt.setp(ax.get_ymajorticklabels(),fontsize=18)
+plt.setp(ax.get_xmajorticklabels(),fontsize=18)
+# Hide the right and top spines so only the left and bottom ones are drawn
+ax.spines['right'].set_color('none')
+ax.spines['top'].set_color('none')
+# Put the tick marks only on the two remaining spines
+ax.xaxis.set_ticks_position('bottom')
+ax.yaxis.set_ticks_position('left')
+
+# Turn on a dotted, light-gray grid and keep it below the plotted data
+ax.grid(True,linestyle=':', color='0.75')
+ax.set_axisbelow(True)
+
+# Define the X and Y axis labels
+plt.xlabel('Time (s)', fontsize=22, weight='bold', labelpad=5)
+plt.ylabel('Accel. (m/s$^2$)', fontsize=22, weight='bold', labelpad=10)
+ 
+plt.plot(t, x_ddot, linewidth=2, linestyle='-', label=r'Accel. Input')
+
+# Uncomment below and set the axis limits if needed
+# plt.xlim(0,5)
+# plt.ylim(0,10)
+
+# Create the legend, then fix the fontsize (disabled; uncomment to enable)
+# leg = plt.legend(loc='upper right', ncol = 1, fancybox=True)
+# ltext  = leg.get_texts()
+# plt.setp(ltext,fontsize=18)
+# Tighten the layout to fill the figure (pad is a fraction of the font size).
+# NOTE(review): this likely supersedes the subplots_adjust margins set above.
+plt.tight_layout(pad=0.5)
+
+# Save the figure as a high-res pdf in the current folder (disabled)
+# plt.savefig('OpenAI_planarCrane_Accelcommand.pdf')
+
+# Show every figure created above
+plt.show()
@@ -43,19 +43,23 @@
 ENV_NAME = 'planar_crane-v0'
 
 LAYER_SIZE = 2048
-NUM_HIDDEN_LAYERS = 8
-NUM_STEPS = 50000
-DUEL_DQN = False
+NUM_HIDDEN_LAYERS = 4
+NUM_STEPS = 100000
+DUEL_DQN = True
+
 TRIAL_ID = datetime.datetime.now().strftime('%Y-%m-%d_%H%M%S')
 
 # TODO: Add file picker GUI - For now, look for files with the format below
 # FILENAME = 'weights/dqn_{}_weights_{}_{}_{}.h5f'.format(ENV_NAME, LAYER_SIZE, NUM_STEPS, TRIAL_ID)
 # FILENAME = 'weights/dqn_{}_weights_{}_{}.h5f'.format(ENV_NAME, LAYER_SIZE, NUM_STEPS)
-FILENAME = 'weights/dqn_planar_crane-v0_weights_2048_8_50000_2017-07-10_154335.h5f'
+FILENAME = 'weights/duel_dqn_planar_crane-v0_weights_2048_4_100000_2017-07-12_185754.h5f'
 
 # Get the environment and extract the number of actions.
 env = gym.make(ENV_NAME)
 
+# Record episode data?
+env.SAVE_DATA = True
+
 # uncomment to record data about the training session, including video if visualize is true
 if DUEL_DQN:
     MONITOR_FILENAME = 'example_data/duel_dqn_{}_monitor_{}_{}_{}_{}'.format(ENV_NAME,
@@ -69,7 +73,7 @@
                                                                  NUM_HIDDEN_LAYERS,
                                                                  NUM_STEPS,
                                                                  TRIAL_ID)
-env = gym.wrappers.Monitor(env, MONITOR_FILENAME, force=True)
+# env = gym.wrappers.Monitor(env, MONITOR_FILENAME, force=True)
 
 
 # np.random.seed(123)
@@ -99,7 +103,7 @@
 memory = SequentialMemory(limit=NUM_STEPS, window_length=1)
 # train_policy = BoltzmannQPolicy(tau=0.05)
 test_policy = EpsGreedyQPolicy()
-train_policy = EpsGreedyQPolicy()
+train_policy = GreedyQPolicy()
 
 if DUEL_DQN:
     dqn = DQNAgent(model=model, nb_actions=nb_actions, memory=memory, nb_steps_warmup=100,
@@ -120,4 +124,4 @@
 dqn.load_weights(FILENAME)
 
 # Finally, evaluate our algorithm for 1 episode.
-dqn.test(env, nb_episodes=5, visualize=True, nb_max_episode_steps=500)
+dqn.test(env, nb_episodes=5, visualize=True, nb_max_episode_steps=501)