|
42 | 42 | "0.5": {"tensorflow": "1.11"},
|
43 | 43 | "0.6.5": {"tensorflow": "1.12"},
|
44 | 44 | "0.6": {"tensorflow": "1.12"},
|
45 |
| - "0.8.2":{"tensorflow": "2.1"}, |
46 |
| - "0.8.5":{"tensorflow": "2.1", "pytorch": "1.5"} |
| 45 | + "0.8.2": {"tensorflow": "2.1"}, |
| 46 | + "0.8.5": {"tensorflow": "2.1", "pytorch": "1.5"}, |
47 | 47 | },
|
48 | 48 | }
|
49 | 49 |
|
@@ -290,8 +290,8 @@ def train_image(self):
|
290 | 290 | self.train_instance_type,
|
291 | 291 | self._image_version(),
|
292 | 292 | py_version="py36",
|
293 |
| - account=DEFAULT_RL_ACCOUNT |
294 |
| - ) |
| 293 | + account=DEFAULT_RL_ACCOUNT, |
| 294 | + ) |
295 | 295 |
|
296 | 296 | return fw_utils.create_image_uri(
|
297 | 297 | self.sagemaker_session.boto_region_name,
|
@@ -506,7 +506,10 @@ def default_metric_definitions(cls, toolkit):
|
506 | 506 | float_regex = "[-+]?[0-9]*[.]?[0-9]+([eE][-+]?[0-9]+)?" # noqa: W605, E501
|
507 | 507 |
|
508 | 508 | return [
|
509 |
| - {"Name": "episode_reward_mean", "Regex": "episode_reward_mean: (%s)" % float_regex}, |
510 |
| - {"Name": "episode_reward_max", "Regex": "episode_reward_max: (%s)" % float_regex}, |
| 509 | + { |
| 510 | + "Name": "episode_reward_mean", |
| 511 | + "Regex": "episode_reward_mean: (%s)" % float_regex, |
| 512 | + }, |
| 513 | + {"Name": "episode_reward_max", "Regex": "episode_reward_max: (%s)" % float_regex, }, |
511 | 514 | ]
|
512 | 515 | raise ValueError("An unknown RLToolkit enum was passed in. toolkit: {}".format(toolkit))
|
0 commit comments