parser.add_argument("--nb-rollout-steps", type=int, default=100)  # per epoch cycle and MPI worker
parser.add_argument("--noise-type", type=str, default="adaptive-param_0.2")  # choices are adaptive-param_xx, ou_xx, normal_xx, none
boolean_flag(parser, "evaluation", default=False)
return vars(parser.parse_args())
# Script entry point: the guarded code runs only when this file is executed
# directly, not when it is imported as a module.
if __name__ == "__main__":
# Bind the result of parse_args() to `args`; parse_args is defined outside
# the lines visible here.
args = parse_args()
After Change
if args.num_timesteps is not None:
assert(args.num_timesteps == args.nb_epochs * args.nb_epoch_cycles * args.nb_rollout_steps)
dict_args = vars(args)
del dict_args["num_timesteps"]
return dict_args
if __name__ == "__main__":