notebooks/unit1/unit1.ipynb (9 lines):
- line 638: "# TODO: Define a PPO MlpPolicy architecture\n",
- line 694: "# TODO: Train it for 1,000,000 timesteps\n",
- line 696: "# TODO: Specify file name for model and save the model to file\n",
- line 750: "# TODO: Evaluate the agent\n",
- line 904: "## TODO: Define a repo_id\n",
- line 908: "# TODO: Define the name of the environment\n",
- line 915: "# TODO: Define the model architecture we used\n",
- line 918: "## TODO: Define the commit message\n",
- line 960: "# TODO: Define the model architecture we used\n",

notebooks/unit4/unit4.ipynb (6 lines):
- line 693: " state = # TODO: reset the environment\n",
- line 696: " action, log_prob = # TODO get the action\n",
- line 698: " state, reward, done, _ = # TODO: take an env step\n",
- line 739: " returns.appendleft( ) # TODO: complete here \n",
- line 1271: "repo_id = \"\" #TODO Define your repo id {username/Reinforce-{model-id}}\n",
- line 1524: "repo_id = \"\" #TODO Define your repo id {username/Reinforce-{model-id}}\n",

notebooks/unit6/unit6.ipynb (2 lines):
- line 429: "env = # TODO: Add the wrapper"
- line 779: " repo_id=f\"ThomasSimonini/a2c-{env_id}\", # TODO: Change the username\n",

notebooks/unit2/unit2.ipynb (1 line):
- line 364: "env = gym.make() # TODO use the correct parameters"