/dqn-hfo

Primary language: C++ · License: MIT

dqn-hfo

This is a continuous-action deep reinforcement learning agent for the RoboCup 2D domain. The domain can be found and downloaded from https://github.com/mhauskn/HFO.

This repo is designed to work with Caffe at commit ff16f6e43dd718921e5203f640dd57c68f01cdb3 (the latest version at the time of writing), with the following minor changes applied to include/caffe/solver.hpp:

--- a/include/caffe/solver.hpp
+++ b/include/caffe/solver.hpp
@@ -67,6 +67,7 @@ class Solver {
     return test_nets_;
   }
   int iter() { return iter_; }
+  void set_iter(int new_iter) { iter_ = new_iter; }
 
   // Invoked at specific points during an iteration
   class Callback {
@@ -84,7 +85,6 @@ class Solver {
 
   void CheckSnapshotWritePermissions();
 
- protected:
   // Make and apply the update value for the current iteration.
   virtual void ApplyUpdate() = 0;
   // The Solver::Snapshot function implements the basic snapshotting utility
@@ -95,6 +95,7 @@ class Solver {
   string SnapshotFilename(const string extension);
   string SnapshotToBinaryProto();
   string SnapshotToHDF5();
+ protected:
   // The test routine
   void TestAll();
   void Test(const int test_net_id = 0);