.travis.yml
AUTHORS.rst
HISTORY.rst
LICENSE.txt
MANIFEST.in
README.rst
nosetests_details.txt
requirements.txt
setup.cfg
setup.py
tox.ini
introrl/.gitattributes
introrl/.gitignore
introrl/LICENSE
introrl/README.md
introrl/_TODO.txt
introrl/__init__.py
introrl/_version.py
introrl/action.py
introrl/action_coll.py
introrl/build_mdp.py
introrl/gridworld_policy.png
introrl/nose_w_coverge.bat
introrl/nosetests_details.txt
introrl/policy.py
introrl/reward.py
introrl/sample_gridworld_policy.png
introrl/state.py
introrl/state_actions.py
introrl/state_actions_coll.py
introrl/state_coll.py
introrl/state_values.py
introrl/transition.py
introrl/transition_coll.py
introrl.egg-info/PKG-INFO
introrl.egg-info/SOURCES.txt
introrl.egg-info/dependency_links.txt
introrl.egg-info/entry_points.txt
introrl.egg-info/not-zip-safe
introrl.egg-info/requires.txt
introrl.egg-info/top_level.txt
introrl/agent_supt/__init__.py
introrl/agent_supt/action_tracker.py
introrl/agent_supt/action_value_coll.py
introrl/agent_supt/action_value_run_ave_coll.py
introrl/agent_supt/alpha_calc.py
introrl/agent_supt/change_tracker.py
introrl/agent_supt/episode.py
introrl/agent_supt/episode_maker.py
introrl/agent_supt/episode_stats.py
introrl/agent_supt/episode_summ_print.py
introrl/agent_supt/epsilon_calc.py
introrl/agent_supt/learning_tracker.py
introrl/agent_supt/model.py
introrl/agent_supt/model_state_data.py
introrl/agent_supt/model_w_timestamp.py
introrl/agent_supt/nstep_sarsa_eval_walker.py
introrl/agent_supt/nstep_sarsa_qstar_walker.py
introrl/agent_supt/nstep_td_eval_walker.py
introrl/agent_supt/state_value_coll.py
introrl/agent_supt/state_value_run_ave_coll.py
introrl/agents/__init__.py
introrl/agents/dyna_q_agent.py
introrl/agents/dyna_qplus_agent.py
introrl/agents/priority_sweep_agent.py
introrl/agents/tabular_agent.py
introrl/black_box_sims/_TODO_.txt
introrl/black_box_sims/__init__.py
introrl/black_box_sims/blackjack_sim.py
introrl/black_box_sims/blocking_maze.py
introrl/black_box_sims/car_rental_sim.py
introrl/black_box_sims/car_rental_sim_const_rtn.py
introrl/black_box_sims/cliff_walking.py
introrl/black_box_sims/maximization_bias_mdp.py
introrl/black_box_sims/racetrack_1_sim.py
introrl/black_box_sims/racetrack_1_w_crash_sim.py
introrl/black_box_sims/racetrack_2_sim.py
introrl/black_box_sims/racetrack_legal_moves.py
introrl/black_box_sims/sample_sim.py
introrl/black_box_sims/sample_sim_policy.png
introrl/black_box_sims/sim_baseline.py
introrl/black_box_sims/blackjack_supt/__init__.py
introrl/black_box_sims/blackjack_supt/bj_p21_calc.py
introrl/black_box_sims/blackjack_supt/bj_policy.py
introrl/black_box_sims/blackjack_supt/blackjack.py
introrl/black_box_sims/blackjack_supt/make_bj_charts.py
introrl/dp_funcs/__init__.py
introrl/dp_funcs/dp_policy_eval.py
introrl/dp_funcs/dp_policy_improve.py
introrl/dp_funcs/dp_policy_iter.py
introrl/dp_funcs/dp_value_iter.py
introrl/environments/__init__.py
introrl/environments/define_state_moves.py
introrl/environments/env_baseline.py
introrl/examples/summ_print_example.py
introrl/examples/chapter_3/figure_3_2_5x5_gridworld.py
introrl/examples/chapter_3/figure_3_5_5x5_gridworld.py
introrl/examples/chapter_3/figure_3_5_policy.png
introrl/examples/chapter_4/car_rental_const_rtn.png
introrl/examples/chapter_4/car_rental_sim_to_env_const_rtn.png
introrl/examples/chapter_4/car_rental_var_rtn.png
introrl/examples/chapter_4/car_rental_var_rtn_v2.png
introrl/examples/chapter_4/car_rental_var_rtn_v3.png
introrl/examples/chapter_4/dp_car_rental_PI.py
introrl/examples/chapter_4/dp_car_rental_PI_const_rtn.py
introrl/examples/chapter_4/dp_gamblers_problem.py
introrl/examples/chapter_4/dp_sutton_ex4_1_gridworld.py
introrl/examples/chapter_4/fig_4_2_car_rental_value.png
introrl/examples/chapter_4/fig_4_2_car_rental_value_v3.png
introrl/examples/chapter_4/figure_4_3_gamblers_full_policy.png
introrl/examples/chapter_4/figure_4_3_gamblers_policy.png
introrl/examples/chapter_4/plot_car_rental_3d.py
introrl/examples/chapter_4/plot_car_rental_bbsim_data.py
introrl/examples/chapter_4/plot_car_rental_policy.py
introrl/examples/chapter_4/policy_car_rental_sim_to_env_const_rtn.png
introrl/examples/chapter_5/blackjack_policy.png
introrl/examples/chapter_5/blackjack_policy_g1.png
introrl/examples/chapter_5/dp_blackjack.py
introrl/examples/chapter_5/dp_blackjack_policy.png
introrl/examples/chapter_5/fig_5_1_noace_10000.png
introrl/examples/chapter_5/fig_5_1_noace_500000.png
introrl/examples/chapter_5/fig_5_1_w_ace_10000.png
introrl/examples/chapter_5/fig_5_1_w_ace_500000.png
introrl/examples/chapter_5/fig_5_2_noace_mc_es.png
introrl/examples/chapter_5/fig_5_2_w_ace_mc_es.png
introrl/examples/chapter_5/mc_blackjack_epsilon_greedy.py
introrl/examples/chapter_5/mc_blackjack_eval.py
introrl/examples/chapter_5/mc_blackjack_explore_starts.py
introrl/examples/chapter_5/mc_blackjack_explore_starts_g1.py
introrl/examples/chapter_5/mc_racetrack_1_epsilon_greedy.py
introrl/examples/chapter_5/mc_racetrack_1_explore_starts.py
introrl/examples/chapter_5/mc_racetrack_1_policy_plots.py
introrl/examples/chapter_5/mc_racetrack_1_w_crash_epsilon_greedy.py
introrl/examples/chapter_5/mc_racetrack_1_w_crash_explore_starts.py
introrl/examples/chapter_5/mc_racetrack_2_epsilon_greedy.py
introrl/examples/chapter_5/plot_blackjack_10000_eval.py
introrl/examples/chapter_5/plot_blackjack_500000_eval.py
introrl/examples/chapter_5/plot_blackjack_es.py
introrl/examples/chapter_6/build_ex_6_6_data.py
introrl/examples/chapter_6/example_6_6_cliff_walking_plot_compare.png
introrl/examples/chapter_6/fig_6_2_online_random_walk.png
introrl/examples/chapter_6/figure_6_2_on_line.py
introrl/examples/chapter_6/figure_6_5_maximization_bias_nb10.png
introrl/examples/chapter_6/plot_example_6_6.py
introrl/examples/chapter_6/plot_fig_6_5_maximization_bias.py
introrl/examples/chapter_6/cliff_walking/build_fig_6_3_data.py
introrl/examples/chapter_6/cliff_walking/build_fig_6_3_data_wtd0.py
introrl/examples/chapter_6/cliff_walking/build_fig_6_3_interim_data.py
introrl/examples/chapter_6/cliff_walking/example_6_6_cliff_walking.py
introrl/examples/chapter_6/cliff_walking/example_6_6_cliff_walking_alpha_0_5.png
introrl/examples/chapter_6/cliff_walking/example_6_6_cliff_walking_td0.py
introrl/examples/chapter_6/cliff_walking/example_6_6_cliff_walking_td0_ExS.py
introrl/examples/chapter_6/cliff_walking/figure_6_3_cliff_walking_interim.png
introrl/examples/chapter_6/cliff_walking/figure_6_3_cliff_walking_plot.png
introrl/examples/chapter_6/cliff_walking/plot_fig_6_3.py
introrl/examples/chapter_6/cliff_walking/plot_fig_6_3_interim.py
introrl/examples/chapter_6/cliff_walking/plot_fig_6_3_wtd0.py
introrl/examples/chapter_6/random_walk/example_6_2_mc_td_random_walk.png
introrl/examples/chapter_6/random_walk/example_6_2_random_walk.py
introrl/examples/chapter_6/random_walk/fig_6_2_mc_td_random_walk.png
introrl/examples/chapter_6/random_walk/fig_6_2_mc_td_random_walk_v2.png
introrl/examples/chapter_6/random_walk/figure_6_2_random_walk.py
introrl/examples/chapter_6/random_walk/figure_6_2_random_walk_v2.py
introrl/examples/chapter_6/random_walk/mc_ev_random_walk.png
introrl/examples/chapter_6/random_walk/mc_ev_random_walk_mrp.py
introrl/examples/chapter_6/random_walk/td0_random_walk.png
introrl/examples/chapter_6/random_walk/td0_random_walk_mrp.py
introrl/examples/chapter_6/windy_gridworld/dp_windy_gridworld.py
introrl/examples/chapter_6/windy_gridworld/dp_windy_kings_gridworld.py
introrl/examples/chapter_6/windy_gridworld/dp_windy_stoich_kings_gridworld.py
introrl/examples/chapter_6/windy_gridworld/example_6_5_policy.png
introrl/examples/chapter_6/windy_gridworld/example_6_5_windy_gridworld.png
introrl/examples/chapter_6/windy_gridworld/example_6_5_windy_gridworld_v2.png
introrl/examples/chapter_6/windy_gridworld/qlearning_windy_gridworld.py
introrl/examples/chapter_6/windy_gridworld/sarsa_windy_gridworld.py
introrl/examples/chapter_6/windy_gridworld/sarsa_windy_kings_gridworld.py
introrl/examples/chapter_6/windy_gridworld/td0_epsgreedy_windy_gridworld.py
introrl/examples/chapter_6/windy_gridworld/td0_windy_stoich_kings_gridworld.py
introrl/examples/chapter_7/chk_sarsa_qstar.py
introrl/examples/chapter_7/example_7.1_with_td0_random_walk_19.png
introrl/examples/chapter_7/example_7_1_w_td0.py
introrl/examples/chapter_7/figure_7_2.py
introrl/examples/chapter_7/figure_7_2_random_walk_19.png
introrl/examples/chapter_7/figure_7_2_random_walk_19_pi.png
introrl/examples/chapter_7/figure_7_2_test.py
introrl/examples/chapter_8/blocking_maze_dynaq.py
introrl/examples/chapter_8/blocking_maze_sarsa.py
introrl/examples/chapter_8/chk_dqplus.py
introrl/examples/chapter_8/chk_pqueue.py
introrl/examples/chapter_8/example_8_4_psweep.png
introrl/examples/chapter_8/example_8_4_psweep_data.png
introrl/examples/chapter_8/example_8_4_psweep_env_updates.png
introrl/examples/chapter_8/fig_8_2_dyna_maze.png
introrl/examples/chapter_8/fig_8_2_dyna_maze_xN.png
introrl/examples/chapter_8/fig_8_4_blocking_maze.png
introrl/examples/chapter_8/fig_8_5_shortcut_maze.png
introrl/examples/chapter_8/plot_example_8_4_pqueue.py
introrl/examples/chapter_8/plot_example_8_4_pqueue_data.py
introrl/examples/chapter_8/plot_fig_8_2.py
introrl/examples/chapter_8/plot_fig_8_2_xN.py
introrl/examples/chapter_8/plot_fig_8_4_blocking_maze.py
introrl/examples/chapter_8/plot_fig_8_5_shortcut_maze.py
introrl/examples/misc_dp/dp_fallen_robot.py
introrl/examples/misc_dp/dp_sample_gridworld.py
introrl/examples/misc_dp/dp_simple_gridworld.py
introrl/examples/misc_dp/dp_slippery_cleaning_robot.py
introrl/layouts/__init__.py
introrl/layouts/generic_layout.py
introrl/layouts/sample_gridworld.png
introrl/mc_funcs/__init__.py
introrl/mc_funcs/mc_ev_prediction.py
introrl/mc_funcs/mc_exploring_starts.py
introrl/mc_funcs/mc_fv_epsilon_greedy.py
introrl/mc_funcs/mc_fv_prediction.py
introrl/mdp_data/__init__.py
introrl/mdp_data/car_rental.py
introrl/mdp_data/car_rental_const_rtn.py
introrl/mdp_data/car_rental_const_rtn_diagram.png
introrl/mdp_data/fallen_3state_robot.py
introrl/mdp_data/gambler_diagram.png
introrl/mdp_data/gamblers_problem.py
introrl/mdp_data/random_walk_generic_mrp.py
introrl/mdp_data/random_walk_mrp.py
introrl/mdp_data/sample_diagram.png
introrl/mdp_data/sample_gridworld.py
introrl/mdp_data/simple_grid_world.py
introrl/mdp_data/six_states.py
introrl/mdp_data/slippery_cleaning_robot.py
introrl/mdp_data/sutton_5x5_gridworld.png
introrl/mdp_data/sutton_5x5_gridworld.py
introrl/mdp_data/sutton_dyna_grid.py
introrl/mdp_data/sutton_dyna_grid_xN.py
introrl/mdp_data/sutton_ex4_1_grid.py
introrl/mdp_data/windy_gridworld.py
introrl/mdp_data/windy_kings_gridworld.py
introrl/mdp_data/windy_stoch_kings_gridworld.py
introrl/td_funcs/__init__.py
introrl/td_funcs/dbl_qlearning_epsilon_greedy.py
introrl/td_funcs/expected_sarsa_eps_greedy.py
introrl/td_funcs/qlearning_epsilon_greedy.py
introrl/td_funcs/sarsa_epsilon_greedy.py
introrl/td_funcs/sarsa_prediction.py
introrl/td_funcs/td0_epsilon_greedy.py
introrl/td_funcs/td0_prediction.py
introrl/tests/__init__.py
introrl/tests/chk_gen_layout.py
introrl/tests/chk_gen_layout_v2.py
introrl/tests/chk_grid_io.py
introrl/tests/chk_sca.py
introrl/tests/test_action.py
introrl/tests/test_env.py
introrl/tests/test_policy.py
introrl/tests/test_reward.py
introrl/tests/test_state.py
introrl/tests/test_state_act_coll.py
introrl/tests/test_state_actions.py
introrl/tests/test_transition.py
introrl/tests/test_transition_coll.py
introrl/tk/__init__.py
introrl/tk/tk_grid_world.def
introrl/tk/tk_grid_world.py
introrl/utils/__init__.py
introrl/utils/banner.py
introrl/utils/circular_list.py
introrl/utils/fifo_queue.py
introrl/utils/functions.py
introrl/utils/gen_sort_key.py
introrl/utils/grid_funcs.py
introrl/utils/pickle_esp.py
introrl/utils/pylab_displays.py
introrl/utils/running_ave.py
introrl/utils/running_stats.py
introrl/utils/smoother.py
introrl/utils/sorteddict.py
introrl/utils/sortedlist.py
introrl/utils/sortedset.py
introrl/utils/sweep_priority_queue.py