File tree (Expand file tree / Collapse file tree): 2 files changed, +13 -5 lines changed
ml-agents/mlagents/trainers (Expand file tree / Collapse file tree): 2 files changed, +13 -5 lines changed
Original file line number | Diff line number | Diff line change
@@ -216,9 +216,10 @@ def create_tf_policy(
216
216
create_graph : bool = False ,
217
217
) -> TFPolicy :
218
218
"""
219
- Creates a PPO policy to trainers list of policies.
219
+ Creates a policy with a Tensorflow backend and PPO hyperparameters
220
+ :param parsed_behavior_id:
220
221
:param behavior_spec: specifications for policy construction
221
- :param create_graph: whether to create the graph when policy is constructed
222
+ :param create_graph: whether to create the Tensorflow graph on construction
222
223
:return policy
223
224
"""
224
225
policy = TFPolicy (
@@ -234,9 +235,9 @@ def create_torch_policy(
234
235
self , parsed_behavior_id : BehaviorIdentifiers , behavior_spec : BehaviorSpec
235
236
) -> TorchPolicy :
236
237
"""
237
- Creates a PPO policy to trainers list of policies.
238
+ Creates a policy with a PyTorch backend and PPO hyperparameters
238
239
:param parsed_behavior_id:
239
- :param brain_parameters : specifications for policy construction
240
+ :param behavior_spec : specifications for policy construction
240
241
:return policy
241
242
"""
242
243
policy = TorchPolicy (
Original file line number | Diff line number | Diff line change
@@ -233,6 +233,13 @@ def create_tf_policy(
233
233
behavior_spec : BehaviorSpec ,
234
234
create_graph : bool = False ,
235
235
) -> TFPolicy :
236
+ """
237
+ Creates a policy with a Tensorflow backend and SAC hyperparameters
238
+ :param parsed_behavior_id:
239
+ :param behavior_spec: specifications for policy construction
240
+ :param create_graph: whether to create the Tensorflow graph on construction
241
+ :return policy
242
+ """
236
243
policy = TFPolicy (
237
244
self .seed ,
238
245
behavior_spec ,
@@ -248,7 +255,7 @@ def create_torch_policy(
248
255
self , parsed_behavior_id : BehaviorIdentifiers , behavior_spec : BehaviorSpec
249
256
) -> TorchPolicy :
250
257
"""
251
- Creates a PPO policy to trainers list of policies.
258
+ Creates a policy with a PyTorch backend and SAC hyperparameters
252
259
:param parsed_behavior_id:
253
260
:param behavior_spec: specifications for policy construction
254
261
:return policy
You can’t perform that action at this time.
0 commit comments