summaryrefslogtreecommitdiff
path: root/examples/pybullet/gym/pybullet_envs/minitaur/agents/tools/loop_test.py
diff options
context:
space:
mode:
Diffstat (limited to 'examples/pybullet/gym/pybullet_envs/minitaur/agents/tools/loop_test.py')
-rw-r--r--examples/pybullet/gym/pybullet_envs/minitaur/agents/tools/loop_test.py54
1 files changed, 33 insertions, 21 deletions
diff --git a/examples/pybullet/gym/pybullet_envs/minitaur/agents/tools/loop_test.py b/examples/pybullet/gym/pybullet_envs/minitaur/agents/tools/loop_test.py
index d4d03c513..3245d26b7 100644
--- a/examples/pybullet/gym/pybullet_envs/minitaur/agents/tools/loop_test.py
+++ b/examples/pybullet/gym/pybullet_envs/minitaur/agents/tools/loop_test.py
@@ -11,7 +11,6 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
-
"""Tests for the training loop."""
from __future__ import absolute_import
@@ -28,8 +27,7 @@ class LoopTest(tf.test.TestCase):
def test_report_every_step(self):
step = tf.Variable(0, False, dtype=tf.int32, name='step')
loop = tools.Loop(None, step)
- loop.add_phase(
- 'phase_1', done=True, score=0, summary='', steps=1, report_every=3)
+ loop.add_phase('phase_1', done=True, score=0, summary='', steps=1, report_every=3)
# Step: 0 1 2 3 4 5 6 7 8
# Report: x x x
with self.test_session() as sess:
@@ -45,15 +43,33 @@ class LoopTest(tf.test.TestCase):
def test_phases_feed(self):
score = tf.placeholder(tf.float32, [])
loop = tools.Loop(None)
- loop.add_phase(
- 'phase_1', done=True, score=score, summary='', steps=1, report_every=1,
- log_every=None, checkpoint_every=None, feed={score: 1})
- loop.add_phase(
- 'phase_2', done=True, score=score, summary='', steps=3, report_every=1,
- log_every=None, checkpoint_every=None, feed={score: 2})
- loop.add_phase(
- 'phase_3', done=True, score=score, summary='', steps=2, report_every=1,
- log_every=None, checkpoint_every=None, feed={score: 3})
+ loop.add_phase('phase_1',
+ done=True,
+ score=score,
+ summary='',
+ steps=1,
+ report_every=1,
+ log_every=None,
+ checkpoint_every=None,
+ feed={score: 1})
+ loop.add_phase('phase_2',
+ done=True,
+ score=score,
+ summary='',
+ steps=3,
+ report_every=1,
+ log_every=None,
+ checkpoint_every=None,
+ feed={score: 2})
+ loop.add_phase('phase_3',
+ done=True,
+ score=score,
+ summary='',
+ steps=2,
+ report_every=1,
+ log_every=None,
+ checkpoint_every=None,
+ feed={score: 3})
with self.test_session() as sess:
sess.run(tf.global_variables_initializer())
scores = list(loop.run(sess, saver=None, max_step=15))
@@ -61,10 +77,8 @@ class LoopTest(tf.test.TestCase):
def test_average_score_over_phases(self):
loop = tools.Loop(None)
- loop.add_phase(
- 'phase_1', done=True, score=1, summary='', steps=1, report_every=2)
- loop.add_phase(
- 'phase_2', done=True, score=2, summary='', steps=2, report_every=5)
+ loop.add_phase('phase_1', done=True, score=1, summary='', steps=1, report_every=2)
+ loop.add_phase('phase_2', done=True, score=2, summary='', steps=2, report_every=5)
# Score: 1 2 2 1 2 2 1 2 2 1 2 2 1 2 2 1 2
# Report 1: x x x
# Report 2: x x
@@ -78,8 +92,7 @@ class LoopTest(tf.test.TestCase):
done = tf.equal((step + 1) % 2, 0)
score = tf.cast(step, tf.float32)
loop = tools.Loop(None, step)
- loop.add_phase(
- 'phase_1', done, score, summary='', steps=1, report_every=3)
+ loop.add_phase('phase_1', done, score, summary='', steps=1, report_every=3)
# Score: 0 1 2 3 4 5 6 7 8
# Done: x x x x
# Report: x x x
@@ -91,10 +104,9 @@ class LoopTest(tf.test.TestCase):
def test_not_done_batch(self):
step = tf.Variable(0, False, dtype=tf.int32, name='step')
done = tf.equal([step % 3, step % 4], 0)
- score = tf.cast([step, step ** 2], tf.float32)
+ score = tf.cast([step, step**2], tf.float32)
loop = tools.Loop(None, step)
- loop.add_phase(
- 'phase_1', done, score, summary='', steps=1, report_every=8)
+ loop.add_phase('phase_1', done, score, summary='', steps=1, report_every=8)
# Step: 0 2 4 6
# Score 1: 0 2 4 6
# Done 1: x x