path # lines of code number of updates days since first update days since last update first updated last updated tf_agents/distributions/gumbel_softmax.py 36 2 848 424 2019-10-10 2020-12-07 tf_agents/distributions/reparameterized_sampling.py 19 2 848 424 2019-10-10 2020-12-07 tf_agents/distributions/shifted_categorical.py 48 3 1017 424 2019-04-24 2020-12-07 tf_agents/distributions/utils.py 246 23 1186 65 2018-11-06 2021-12-01 tf_agents/distributions/__init__.py 4 4 1186 424 2018-11-06 2020-12-07 tf_agents/distributions/masked.py 49 14 1186 56 2018-11-06 2021-12-10 tf_agents/distributions/tanh_bijector_stable.py 27 7 1120 424 2019-01-11 2020-12-07 tf_agents/replay_buffers/episodic_replay_buffer.py 726 4 841 424 2019-10-17 2020-12-07 tf_agents/replay_buffers/replay_buffer.py 104 18 1184 312 2018-11-08 2021-03-29 tf_agents/replay_buffers/reverb_replay_buffer.py 252 15 577 10 2020-07-07 2022-01-25 tf_agents/replay_buffers/reverb_utils.py 201 19 577 65 2020-07-07 2021-12-01 tf_agents/replay_buffers/__init__.py 11 6 1186 312 2018-11-06 2021-03-29 tf_agents/replay_buffers/tf_uniform_replay_buffer.py 276 29 1164 199 2018-11-28 2021-07-20 tf_agents/replay_buffers/episodic_table.py 122 4 841 424 2019-10-17 2020-12-07 tf_agents/replay_buffers/table.py 51 9 1186 424 2018-11-06 2020-12-07 tf_agents/replay_buffers/py_uniform_replay_buffer.py 127 12 1186 424 2018-11-06 2020-12-07 tf_agents/replay_buffers/py_hashed_replay_buffer.py 76 9 1158 221 2018-12-04 2021-06-28 tf_agents/trajectories/__init__.py 23 4 1029 312 2019-04-12 2021-03-29 tf_agents/trajectories/time_step.py 235 19 1029 65 2019-04-12 2021-12-01 tf_agents/trajectories/trajectory.py 349 23 1029 65 2019-04-12 2021-12-01 tf_agents/trajectories/policy_step.py 48 12 1029 65 2019-04-12 2021-12-01 tf_agents/bandits/multi_objective/multi_objective_scalarizer.py 187 9 588 65 2020-06-26 2021-12-01 tf_agents/bandits/multi_objective/__init__.py 1 2 588 424 2020-06-26 2020-12-07 tf_agents/bandits/replay_buffers/bandit_replay_buffer.py 2 1 60 60 2021-12-06 2021-12-06 tf_agents/bandits/drivers/driver_utils.py 17 5 876 65 2019-09-12 2021-12-01 tf_agents/bandits/drivers/__init__.py 1 2 876 424 2019-09-12 2020-12-07 tf_agents/bandits/environments/non_stationary_stochastic_environment.py 72 5 876 80 2019-09-12 2021-11-16 tf_agents/bandits/environments/movielens_py_environment.py 72 6 478 80 2020-10-14 2021-11-16 tf_agents/bandits/environments/stationary_stochastic_structured_py_environment.py 81 5 633 80 2020-05-12 2021-11-16 tf_agents/bandits/environments/random_bandit_environment.py 58 5 876 80 2019-09-12 2021-11-16 tf_agents/bandits/environments/movielens_per_arm_py_environment.py 103 5 431 80 2020-11-30 2021-11-16 tf_agents/bandits/environments/piecewise_stochastic_environment.py 133 5 876 80 2019-09-12 2021-11-16 tf_agents/bandits/environments/piecewise_bernoulli_py_environment.py 57 4 876 80 2019-09-12 2021-11-16 tf_agents/bandits/environments/classification_environment.py 100 10 876 80 2019-09-12 2021-11-16 tf_agents/bandits/environments/dataset_utilities.py 70 4 463 340 2020-10-29 2021-03-01 tf_agents/bandits/environments/environment_utilities.py 158 8 876 424 2019-09-12 2020-12-07 tf_agents/bandits/environments/stationary_stochastic_per_arm_py_environment.py 80 12 676 80 2020-03-30 2021-11-16 tf_agents/bandits/environments/__init__.py 17 8 876 424 2019-09-12 2020-12-07 tf_agents/bandits/environments/bernoulli_action_mask_tf_environment.py 74 7 828 80 2019-10-30 2021-11-16 tf_agents/bandits/environments/drifting_linear_environment.py 138 5 876 80 2019-09-12 2021-11-16 tf_agents/bandits/environments/stationary_stochastic_py_environment.py 70 7 876 80 2019-09-12 2021-11-16 tf_agents/bandits/environments/bernoulli_py_environment.py 40 5 876 74 2019-09-12 2021-11-22 tf_agents/bandits/environments/wheel_py_environment.py 104 5 876 80 2019-09-12 2021-11-16 tf_agents/bandits/environments/bandit_tf_environment.py 69 7 876 80 2019-09-12 2021-11-16 tf_agents/bandits/environments/bandit_py_environment.py 43 8 876 80 2019-09-12 2021-11-16 tf_agents/bandits/metrics/__init__.py 1 2 876 424 2019-09-12 2020-12-07 tf_agents/bandits/metrics/tf_metrics.py 98 8 876 65 2019-09-12 2021-12-01 tf_agents/bandits/networks/global_and_arm_feature_network.py 162 14 675 65 2020-03-31 2021-12-01 tf_agents/bandits/networks/heteroscedastic_q_network.py 77 7 784 65 2019-12-13 2021-12-01 tf_agents/bandits/networks/__init__.py 2 3 784 424 2019-12-13 2020-12-07 tf_agents/bandits/policies/greedy_reward_prediction_policy.py 149 24 876 65 2019-09-12 2021-12-01 tf_agents/bandits/policies/neural_linucb_policy.py 241 20 876 65 2019-09-12 2021-12-01 tf_agents/bandits/policies/linear_thompson_sampling_policy.py 39 9 876 65 2019-09-12 2021-12-01 tf_agents/bandits/policies/categorical_policy.py 49 6 876 65 2019-09-12 2021-12-01 tf_agents/bandits/policies/greedy_multi_objective_neural_policy.py 209 12 574 65 2020-07-10 2021-12-01 tf_agents/bandits/policies/lin_ucb_policy.py 40 11 876 65 2019-09-12 2021-12-01 tf_agents/bandits/policies/constraints.py 280 7 525 65 2020-08-28 2021-12-01 tf_agents/bandits/policies/linear_bandit_policy.py 276 15 798 65 2019-11-29 2021-12-01 tf_agents/bandits/policies/__init__.py 9 6 876 322 2019-09-12 2021-03-19 tf_agents/bandits/policies/bernoulli_thompson_sampling_policy.py 103 2 81 73 2021-11-15 2021-11-23 tf_agents/bandits/policies/boltzmann_reward_prediction_policy.py 207 3 249 65 2021-05-31 2021-12-01 tf_agents/bandits/policies/linalg.py 80 7 876 65 2019-09-12 2021-12-01 tf_agents/bandits/policies/mixture_policy.py 77 10 749 65 2020-01-17 2021-12-01 tf_agents/bandits/policies/loss_utils.py 28 4 526 65 2020-08-27 2021-12-01 tf_agents/bandits/__init__.py 8 3 876 322 2019-09-12 2021-03-19 tf_agents/bandits/agents/greedy_multi_objective_neural_agent.py 201 14 561 80 2020-07-23 2021-11-16 tf_agents/bandits/agents/neural_linucb_agent.py 360 28 876 80 2019-09-12 2021-11-16 tf_agents/bandits/agents/exp3_agent.py 76 10 876 80 2019-09-12 2021-11-16 tf_agents/bandits/agents/linear_bandit_agent.py 369 18 798 80 2019-11-29 2021-11-16 tf_agents/bandits/agents/neural_epsilon_greedy_agent.py 59 19 876 80 2019-09-12 2021-11-16 tf_agents/bandits/agents/linear_thompson_sampling_agent.py 50 14 876 80 2019-09-12 2021-11-16 tf_agents/bandits/agents/neural_boltzmann_agent.py 64 3 248 80 2021-06-01 2021-11-16 tf_agents/bandits/agents/mixture_agent.py 111 7 722 80 2020-02-13 2021-11-16 tf_agents/bandits/agents/utils.py 73 13 876 80 2019-09-12 2021-11-16 tf_agents/bandits/agents/__init__.py 15 6 876 79 2019-09-12 2021-11-17 tf_agents/bandits/agents/greedy_reward_prediction_agent.py 225 39 876 80 2019-09-12 2021-11-16 tf_agents/bandits/agents/lin_ucb_agent.py 50 22 876 80 2019-09-12 2021-11-16 tf_agents/bandits/agents/static_mixture_agent.py 9 3 744 424 2020-01-22 2020-12-07 tf_agents/bandits/agents/exp3_mixture_agent.py 107 5 722 80 2020-02-13 2021-11-16 tf_agents/bandits/agents/dropout_thompson_sampling_agent.py 87 17 876 80 2019-09-12 2021-11-16 tf_agents/bandits/agents/bernoulli_thompson_sampling_agent.py 97 3 80 73 2021-11-16 2021-11-23 tf_agents/experimental/distributed/reverb_variable_container.py 53 2 549 424 2020-08-04 2020-12-07 tf_agents/experimental/distributed/__init__.py 1 3 501 421 2020-09-21 2020-12-10 tf_agents/experimental/__init__.py 2 4 548 421 2020-08-05 2020-12-10 tf_agents/drivers/py_driver.py 53 15 1186 65 2018-11-06 2021-12-01 tf_agents/drivers/tf_driver.py 55 11 758 65 2020-01-08 2021-12-01 tf_agents/drivers/dynamic_step_driver.py 88 27 1186 289 2018-11-06 2021-04-21 tf_agents/drivers/dynamic_episode_driver.py 97 23 1186 424 2018-11-06 2020-12-07 tf_agents/drivers/__init__.py 4 4 1186 424 2018-11-06 2020-12-07 tf_agents/drivers/driver.py 26 8 1186 424 2018-11-06 2020-12-07 tf_agents/environments/tf_environment.py 39 7 1186 424 2018-11-06 2020-12-07 tf_agents/environments/batched_py_environment.py 113 19 1186 80 2018-11-06 2021-11-16 tf_agents/environments/atari_preprocessing.py 78 16 1165 80 2018-11-27 2021-11-16 tf_agents/environments/suite_bsuite.py 35 4 727 80 2020-02-08 2021-11-16 tf_agents/environments/random_tf_environment.py 61 6 961 161 2019-06-19 2021-08-27 tf_agents/environments/atari_wrappers.py 60 12 1186 80 2018-11-06 2021-11-16 tf_agents/environments/random_py_environment.py 103 14 1186 80 2018-11-06 2021-11-16 tf_agents/environments/py_environment.py 77 22 1186 80 2018-11-06 2021-11-16 tf_agents/environments/suite_pybullet.py 5 6 1186 424 2018-11-06 2020-12-07 tf_agents/environments/suite_gym.py 63 18 1186 80 2018-11-06 2021-11-16 tf_agents/environments/parallel_py_environment.py 253 29 1186 80 2018-11-06 2021-11-16 tf_agents/environments/utils.py 54 16 1186 80 2018-11-06 2021-11-16 tf_agents/environments/__init__.py 42 7 1186 312 2018-11-06 2021-03-29 tf_agents/environments/dm_control_wrapper.py 65 9 1186 424 2018-11-06 2020-12-07 tf_agents/environments/gym_wrapper.py 156 39 1186 80 2018-11-06 2021-11-16 tf_agents/environments/suite_mujoco.py 33 7 1164 80 2018-11-28 2021-11-16 tf_agents/environments/wrappers.py 586 48 1186 80 2018-11-06 2021-11-16 tf_agents/environments/tf_wrappers.py 62 3 841 424 2019-10-17 2020-12-07 tf_agents/environments/suite_dm_control.py 90 13 1186 80 2018-11-06 2021-11-16 tf_agents/environments/tf_py_environment.py 185 32 1186 80 2018-11-06 2021-11-16 tf_agents/environments/trajectory_replay.py 114 14 1163 424 2018-11-29 2020-12-07 tf_agents/environments/suite_atari.py 54 16 1186 80 2018-11-06 2021-11-16 tf_agents/metrics/batched_py_metric.py 61 6 1186 65 2018-11-06 2021-12-01 tf_agents/metrics/py_metric.py 101 13 1186 65 2018-11-06 2021-12-01 tf_agents/metrics/py_metrics.py 166 14 1186 65 2018-11-06 2021-12-01 tf_agents/metrics/tf_metric.py 111 15 1186 147 2018-11-06 2021-09-10 tf_agents/metrics/__init__.py 6 4 1186 424 2018-11-06 2020-12-07 tf_agents/metrics/tf_py_metric.py 57 9 1186 424 2018-11-06 2020-12-07 tf_agents/metrics/tf_metrics.py 283 20 1186 424 2018-11-06 2020-12-07 tf_agents/networks/value_network.py 49 22 1186 424 2018-11-06 2020-12-07 tf_agents/networks/q_network.py 64 14 1186 424 2018-11-06 2020-12-07 tf_agents/networks/q_rnn_network.py 51 18 1186 424 2018-11-06 2020-12-07 tf_agents/networks/nest_map.py 87 5 582 65 2020-07-02 2021-12-01 tf_agents/networks/mask_splitter_network.py 58 3 563 65 2020-07-21 2021-12-01 tf_agents/networks/sequential.py 158 13 589 65 2020-06-25 2021-12-01 tf_agents/networks/expand_dims_layer.py 31 5 1112 424 2019-01-19 2020-12-07 tf_agents/networks/categorical_q_network.py 48 6 961 424 2019-06-19 2020-12-07 tf_agents/networks/utils.py 114 21 1186 65 2018-11-06 2021-12-01 tf_agents/networks/encoding_network.py 157 40 1186 235 2018-11-06 2021-06-14 tf_agents/networks/__init__.py 21 9 1186 379 2018-11-06 2021-01-21 tf_agents/networks/lstm_encoding_network.py 122 29 1186 424 2018-11-06 2020-12-07 tf_agents/networks/network.py 311 45 1186 64 2018-11-06 2021-12-02 tf_agents/networks/value_rnn_network.py 54 22 1176 424 2018-11-16 2020-12-07 tf_agents/networks/categorical_projection_network.py 73 23 1186 424 2018-11-06 2020-12-07 tf_agents/networks/actor_distribution_rnn_network.py 85 29 1176 424 2018-11-16 2020-12-07 tf_agents/networks/actor_distribution_network.py 103 29 1186 282 2018-11-06 2021-04-28 tf_agents/networks/normal_projection_network.py 127 30 1186 246 2018-11-06 2021-06-03 tf_agents/policies/boltzmann_policy.py 41 16 1128 80 2019-01-03 2021-11-16 tf_agents/policies/q_policy.py 93 38 1186 80 2018-11-06 2021-11-16 tf_agents/policies/policy_info_updater_wrapper.py 49 6 693 424 2020-03-13 2020-12-07 tf_agents/policies/gaussian_policy.py 49 8 1031 80 2019-04-10 2021-11-16 tf_agents/policies/epsilon_greedy_policy.py 118 40 1186 80 2018-11-06 2021-11-16 tf_agents/policies/tf_policy.py 252 48 1186 80 2018-11-06 2021-11-16 tf_agents/policies/policy_loader.py 29 3 653 424 2020-04-22 2020-12-07 tf_agents/policies/tf_py_policy.py 86 21 1186 80 2018-11-06 2021-11-16 tf_agents/policies/py_policy.py 88 17 1186 80 2018-11-06 2021-11-16 tf_agents/policies/samplers/cem_actions_sampler_continuous.py 114 2 133 23 2021-09-24 2022-01-12 tf_agents/policies/samplers/cem_actions_sampler_hybrid.py 43 1 133 133 2021-09-24 2021-09-24 tf_agents/policies/samplers/cem_actions_sampler_continuous_and_one_hot.py 293 4 133 2 2021-09-24 2022-02-02 tf_agents/policies/samplers/cem_actions_sampler.py 30 2 133 23 2021-09-24 2022-01-12 tf_agents/policies/py_epsilon_greedy_policy.py 70 10 1186 80 2018-11-06 2021-11-16 tf_agents/policies/async_policy_saver.py 73 5 689 331 2020-03-17 2021-03-10 tf_agents/policies/random_tf_policy.py 143 31 1186 80 2018-11-06 2021-11-16 tf_agents/policies/greedy_policy.py 42 23 1186 80 2018-11-06 2021-11-16 tf_agents/policies/utils.py 161 4 322 80 2021-03-19 2021-11-16 tf_agents/policies/__init__.py 25 7 1186 312 2018-11-06 2021-03-29 tf_agents/policies/batched_py_policy.py 114 5 612 80 2020-06-02 2021-11-16 tf_agents/policies/temporal_action_smoothing.py 41 7 997 80 2019-05-14 2021-11-16 tf_agents/policies/categorical_q_policy.py 89 19 961 80 2019-06-19 2021-11-16 tf_agents/policies/ou_noise_policy.py 56 17 1186 80 2018-11-06 2021-11-16 tf_agents/policies/scripted_py_policy.py 55 12 1186 80 2018-11-06 2021-11-16 tf_agents/policies/random_py_policy.py 73 19 1186 80 2018-11-06 2021-11-16 tf_agents/policies/fixed_policy.py 61 20 1186 57 2018-11-06 2021-12-09 tf_agents/policies/qtopt_cem_policy.py 300 4 132 87 2021-09-25 2021-11-09 tf_agents/policies/policy_saver.py 387 46 1050 80 2019-03-22 2021-11-16 tf_agents/policies/py_tf_eager_policy.py 115 24 910 29 2019-08-09 2022-01-06 tf_agents/policies/py_tf_policy.py 148 24 1186 80 2018-11-06 2021-11-16 tf_agents/policies/actor_policy.py 101 30 1186 80 2018-11-06 2021-11-16 tf_agents/keras_layers/bias_layer.py 39 5 666 424 2020-04-09 2020-12-07 tf_agents/keras_layers/rnn_wrapper.py 107 5 589 65 2020-06-25 2021-12-01 tf_agents/keras_layers/permanent_variable_rate_dropout.py 24 1 238 238 2021-06-11 2021-06-11 tf_agents/keras_layers/__init__.py 5 6 631 394 2020-05-14 2021-01-06 tf_agents/keras_layers/dynamic_unroll_layer.py 248 8 631 423 2020-05-14 2020-12-08 tf_agents/keras_layers/inner_reshape.py 40 3 582 65 2020-07-02 2021-12-01 tf_agents/keras_layers/squashed_outer_wrapper.py 95 1 423 423 2020-12-08 2020-12-08 tf_agents/__init__.py 46 12 1186 421 2018-11-06 2020-12-10 tf_agents/utils/example_encoding.py 143 12 1052 221 2019-03-20 2021-06-28 tf_agents/utils/value_ops.py 63 9 1186 424 2018-11-06 2020-12-07 tf_agents/utils/tensor_normalizer.py 225 22 1186 269 2018-11-06 2021-05-11 tf_agents/utils/eager_utils.py 283 27 1186 160 2018-11-06 2021-08-28 tf_agents/utils/nest_utils.py 584 50 1186 65 2018-11-06 2021-12-01 tf_agents/utils/composite.py 99 4 903 424 2019-08-16 2020-12-07 tf_agents/utils/object_identity.py 121 2 704 424 2020-03-02 2020-12-07 tf_agents/utils/xla.py 43 3 956 424 2019-06-24 2020-12-07 tf_agents/utils/__init__.py 12 7 1186 424 2018-11-06 2020-12-07 tf_agents/utils/numpy_storage.py 91 4 1033 424 2019-04-08 2020-12-07 tf_agents/utils/common.py 627 81 1186 99 2018-11-06 2021-10-28 tf_agents/utils/lazy_loader.py 26 3 577 331 2020-07-07 2021-03-10 tf_agents/utils/timer.py 20 4 1186 424 2018-11-06 2020-12-07 tf_agents/utils/session_utils.py 21 6 1186 424 2018-11-06 2020-12-07 tf_agents/utils/example_encoding_dataset.py 117 15 1025 161 2019-04-16 2021-08-27 tf_agents/system/system_multiprocessing.py 128 5 627 126 2020-05-18 2021-10-01 tf_agents/system/__init__.py 1 3 639 424 2020-05-06 2020-12-07 tf_agents/system/default/__init__.py 1 2 639 424 2020-05-06 2020-12-07 tf_agents/system/default/multiprocessing_core.py 40 3 627 424 2020-05-18 2020-12-07 tf_agents/eval/__init__.py 1 3 1030 424 2019-04-11 2020-12-07 tf_agents/eval/metric_utils.py 85 6 1030 424 2019-04-11 2020-12-07 tf_agents/typing/types.py 75 23 639 65 2020-05-06 2021-12-01 tf_agents/typing/__init__.py 1 3 634 424 2020-05-11 2020-12-07 tf_agents/version.py 12 14 1164 81 2018-11-28 2021-11-15 tf_agents/benchmark/dqn_benchmark.py 28 4 395 227 2021-01-05 2021-06-22 tf_agents/benchmark/ppo_benchmark.py 45 4 395 87 2021-01-05 2021-11-09 tf_agents/benchmark/perfzero_benchmark.py 41 3 456 415 2020-11-05 2020-12-16 tf_agents/benchmark/distribution_strategy_utils.py 47 3 815 424 2019-11-12 2020-12-07 tf_agents/benchmark/utils.py 167 10 815 144 2019-11-12 2021-09-13 tf_agents/benchmark/__init__.py 1 2 815 424 2019-11-12 2020-12-07 tf_agents/benchmark/sac_benchmark.py 39 6 456 87 2020-11-05 2021-11-09 tf_agents/benchmark/cql_sac_benchmark.py 46 2 91 65 2021-11-05 2021-12-01 tf_agents/train/actor.py 127 7 428 174 2020-12-03 2021-08-14 tf_agents/train/ppo_learner_test_utils.py 74 1 330 330 2021-03-11 2021-03-11 tf_agents/train/interval_trigger.py 23 3 428 248 2020-12-03 2021-06-01 tf_agents/train/step_per_second_tracker.py 14 2 428 424 2020-12-03 2020-12-07 tf_agents/train/learner.py 238 18 428 57 2020-12-03 2021-12-09 tf_agents/train/__init__.py 5 3 428 421 2020-12-03 2020-12-10 tf_agents/train/triggers.py 131 12 428 37 2020-12-03 2021-12-29 tf_agents/train/utils/spec_utils.py 17 2 428 424 2020-12-03 2020-12-07 tf_agents/train/utils/train_utils.py 96 3 428 395 2020-12-03 2021-01-05 tf_agents/train/utils/strategy_utils.py 22 3 428 232 2020-12-03 2021-06-17 tf_agents/train/utils/__init__.py 1 2 428 424 2020-12-03 2020-12-07 tf_agents/train/utils/replay_buffer_utils.py 68 5 428 141 2020-12-03 2021-09-16 tf_agents/train/ppo_learner.py 138 8 330 186 2021-03-11 2021-08-02 tf_agents/agents/qtopt/qtopt_agent.py 382 3 128 65 2021-09-29 2021-12-01 tf_agents/agents/data_converter.py 303 9 557 65 2020-07-27 2021-12-01 tf_agents/agents/categorical_dqn/__init__.py 1 2 921 424 2019-07-29 2020-12-07 tf_agents/agents/categorical_dqn/categorical_dqn_agent.py 324 24 961 65 2019-06-19 2021-12-01 tf_agents/agents/sac/sac_agent.py 452 61 1115 65 2019-01-16 2021-12-01 tf_agents/agents/sac/__init__.py 1 3 1109 424 2019-01-22 2020-12-07 tf_agents/agents/sac/tanh_normal_projection_network.py 79 6 731 65 2020-02-04 2021-12-01 tf_agents/agents/behavioral_cloning/behavioral_cloning_agent.py 174 47 1152 65 2018-12-10 2021-12-01 tf_agents/agents/behavioral_cloning/__init__.py 1 4 1152 424 2018-12-10 2020-12-07 tf_agents/agents/__init__.py 23 10 1186 190 2018-11-06 2021-07-29 tf_agents/agents/ddpg/critic_rnn_network.py 147 18 1166 424 2018-11-26 2020-12-07 tf_agents/agents/ddpg/actor_rnn_network.py 98 17 1166 424 2018-11-26 2020-12-07 tf_agents/agents/ddpg/__init__.py 5 4 1186 424 2018-11-06 2020-12-07 tf_agents/agents/ddpg/actor_network.py 61 20 1173 274 2018-11-19 2021-05-06 tf_agents/agents/ddpg/ddpg_agent.py 252 44 1186 65 2018-11-06 2021-12-01 tf_agents/agents/ddpg/critic_network.py 79 20 1173 134 2018-11-19 2021-09-23 tf_agents/agents/td3/td3_agent.py 330 48 1186 65 2018-11-06 2021-12-01 tf_agents/agents/td3/__init__.py 1 4 1186 424 2018-11-06 2020-12-07 tf_agents/agents/dqn/__init__.py 1 4 1186 424 2018-11-06 2020-12-07 tf_agents/agents/dqn/dqn_agent.py 306 73 1186 65 2018-11-06 2021-12-01 tf_agents/agents/tf_agent.py 222 57 1186 65 2018-11-06 2021-12-01 tf_agents/agents/ppo/ppo_utils.py 109 22 1186 65 2018-11-06 2021-12-01 tf_agents/agents/ppo/ppo_policy.py 155 34 1186 65 2018-11-06 2021-12-01 tf_agents/agents/ppo/ppo_kl_penalty_agent.py 88 10 709 65 2020-02-26 2021-12-01 tf_agents/agents/ppo/__init__.py 6 10 1186 291 2018-11-06 2021-04-19 tf_agents/agents/ppo/ppo_agent.py 903 90 1186 62 2018-11-06 2021-12-04 tf_agents/agents/ppo/ppo_actor_network.py 62 3 303 282 2021-04-07 2021-04-28 tf_agents/agents/ppo/ppo_clip_agent.py 82 14 715 65 2020-02-20 2021-12-01 tf_agents/agents/cql/__init__.py 1 1 190 190 2021-07-29 2021-07-29 tf_agents/agents/cql/cql_sac_agent.py 454 4 218 65 2021-07-01 2021-12-01 tf_agents/agents/reinforce/reinforce_agent.py 276 45 1186 65 2018-11-06 2021-12-01 tf_agents/agents/reinforce/__init__.py 1 4 1186 424 2018-11-06 2020-12-07 tf_agents/agents/random/random_agent.py 30 4 721 65 2020-02-14 2021-12-01 tf_agents/agents/random/__init__.py 2 2 721 424 2020-02-14 2020-12-07 tf_agents/agents/random/fixed_policy_agent.py 44 7 721 65 2020-02-14 2021-12-01 MANIFEST.in 1 1 450 450 2020-11-11 2020-11-11 setup.py 242 51 1186 3 2018-11-06 2022-02-01 tools/graph_builder.py 146 3 467 424 2020-10-25 2020-12-07 tools/build_docs.py 52 2 546 424 2020-08-07 2020-12-07 tools/release_builder.py 130 2 564 424 2020-07-20 2020-12-07