diff options
Diffstat (limited to 'examples/pybullet/gym/pybullet_envs/minitaur/agents/tools/loop_test.py')
-rw-r--r-- | examples/pybullet/gym/pybullet_envs/minitaur/agents/tools/loop_test.py | 54 |
1 files changed, 33 insertions, 21 deletions
diff --git a/examples/pybullet/gym/pybullet_envs/minitaur/agents/tools/loop_test.py b/examples/pybullet/gym/pybullet_envs/minitaur/agents/tools/loop_test.py index d4d03c513..3245d26b7 100644 --- a/examples/pybullet/gym/pybullet_envs/minitaur/agents/tools/loop_test.py +++ b/examples/pybullet/gym/pybullet_envs/minitaur/agents/tools/loop_test.py @@ -11,7 +11,6 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. - """Tests for the training loop.""" from __future__ import absolute_import @@ -28,8 +27,7 @@ class LoopTest(tf.test.TestCase): def test_report_every_step(self): step = tf.Variable(0, False, dtype=tf.int32, name='step') loop = tools.Loop(None, step) - loop.add_phase( - 'phase_1', done=True, score=0, summary='', steps=1, report_every=3) + loop.add_phase('phase_1', done=True, score=0, summary='', steps=1, report_every=3) # Step: 0 1 2 3 4 5 6 7 8 # Report: x x x with self.test_session() as sess: @@ -45,15 +43,33 @@ class LoopTest(tf.test.TestCase): def test_phases_feed(self): score = tf.placeholder(tf.float32, []) loop = tools.Loop(None) - loop.add_phase( - 'phase_1', done=True, score=score, summary='', steps=1, report_every=1, - log_every=None, checkpoint_every=None, feed={score: 1}) - loop.add_phase( - 'phase_2', done=True, score=score, summary='', steps=3, report_every=1, - log_every=None, checkpoint_every=None, feed={score: 2}) - loop.add_phase( - 'phase_3', done=True, score=score, summary='', steps=2, report_every=1, - log_every=None, checkpoint_every=None, feed={score: 3}) + loop.add_phase('phase_1', + done=True, + score=score, + summary='', + steps=1, + report_every=1, + log_every=None, + checkpoint_every=None, + feed={score: 1}) + loop.add_phase('phase_2', + done=True, + score=score, + summary='', + steps=3, + report_every=1, + log_every=None, + checkpoint_every=None, + feed={score: 2}) + loop.add_phase('phase_3', + done=True, + score=score, + summary='', + steps=2, + report_every=1, + log_every=None, + checkpoint_every=None, + feed={score: 3}) with self.test_session() as sess: sess.run(tf.global_variables_initializer()) scores = list(loop.run(sess, saver=None, max_step=15)) @@ -61,10 +77,8 @@ class LoopTest(tf.test.TestCase): def test_average_score_over_phases(self): loop = tools.Loop(None) - loop.add_phase( - 'phase_1', done=True, score=1, summary='', steps=1, report_every=2) - loop.add_phase( - 'phase_2', done=True, score=2, summary='', steps=2, report_every=5) + loop.add_phase('phase_1', done=True, score=1, summary='', steps=1, report_every=2) + loop.add_phase('phase_2', done=True, score=2, summary='', steps=2, report_every=5) # Score: 1 2 2 1 2 2 1 2 2 1 2 2 1 2 2 1 2 # Report 1: x x x # Report 2: x x @@ -78,8 +92,7 @@ class LoopTest(tf.test.TestCase): done = tf.equal((step + 1) % 2, 0) score = tf.cast(step, tf.float32) loop = tools.Loop(None, step) - loop.add_phase( - 'phase_1', done, score, summary='', steps=1, report_every=3) + loop.add_phase('phase_1', done, score, summary='', steps=1, report_every=3) # Score: 0 1 2 3 4 5 6 7 8 # Done: x x x x # Report: x x x @@ -91,10 +104,9 @@ class LoopTest(tf.test.TestCase): def test_not_done_batch(self): step = tf.Variable(0, False, dtype=tf.int32, name='step') done = tf.equal([step % 3, step % 4], 0) - score = tf.cast([step, step ** 2], tf.float32) + score = tf.cast([step, step**2], tf.float32) loop = tools.Loop(None, step) - loop.add_phase( - 'phase_1', done, score, summary='', steps=1, report_every=8) + loop.add_phase('phase_1', done, score, summary='', steps=1, report_every=8) # Step: 0 2 4 6 # Score 1: 0 2 4 6 # Done 1: x x |