|
8 | 8 | "on_sample_end": null,
|
9 | 9 | "on_train_result": null
|
10 | 10 | },
|
11 |
| - "clip_actions": false, |
| 11 | + "clip_actions": true, |
12 | 12 | "clip_param": 0.3,
|
13 | 13 | "clip_rewards": null,
|
14 | 14 | "collect_metrics_timeout": 180,
|
15 | 15 | "compress_observations": false,
|
16 | 16 | "custom_resources_per_worker": {},
|
| 17 | + "eager": false, |
| 18 | + "eager_tracing": false, |
17 | 19 | "entropy_coeff": 0.0,
|
18 | 20 | "entropy_coeff_schedule": null,
|
19 |
| - "env": "MultiWaveAttenuationPOEnv-v0", |
| 21 | + "env": "MultiAgentAccelPOEnv-v1", |
20 | 22 | "env_config": {
|
21 |
| - "flow_params": "{\n \"env\": {\n \"additional_params\": {\n \"max_accel\": 1,\n \"max_decel\": 1,\n \"ring_length\": [\n 230,\n 230\n ],\n \"target_velocity\": 4\n },\n \"clip_actions\": true,\n \"evaluate\": false,\n \"horizon\": 3000,\n \"sims_per_step\": 1,\n \"warmup_steps\": 750\n },\n \"env_name\": \"MultiWaveAttenuationPOEnv\",\n \"exp_tag\": \"lord_of_numrings1\",\n \"initial\": {\n \"additional_params\": {},\n \"bunching\": 20.0,\n \"edges_distribution\": \"all\",\n \"lanes_distribution\": Infinity,\n \"min_gap\": 0,\n \"perturbation\": 0.0,\n \"shuffle\": false,\n \"spacing\": \"custom\",\n \"x0\": 0\n },\n \"net\": {\n \"additional_params\": {\n \"lanes\": 1,\n \"length\": 230,\n \"num_rings\": 1,\n \"resolution\": 40,\n \"speed_limit\": 30\n },\n \"inflows\": {\n \"_InFlows__flows\": []\n },\n \"osm_path\": null,\n \"template\": null\n },\n \"network\": \"MultiRingNetwork\",\n \"sim\": {\n \"color_vehicles\": true,\n \"emission_path\": null,\n \"lateral_resolution\": null,\n \"no_step_log\": true,\n \"num_clients\": 1,\n \"overtake_right\": false,\n \"port\": null,\n \"print_warnings\": true,\n \"pxpm\": 2,\n \"render\": false,\n \"restart_instance\": false,\n \"save_render\": false,\n \"seed\": null,\n \"show_radius\": false,\n \"sight_radius\": 25,\n \"sim_step\": 0.1,\n \"teleport_time\": -1\n },\n \"simulator\": \"traci\",\n \"veh\": [\n {\n \"acceleration_controller\": [\n \"IDMController\",\n {\n \"noise\": 0.2\n }\n ],\n \"car_following_params\": {\n \"controller_params\": {\n \"accel\": 2.6,\n \"carFollowModel\": \"IDM\",\n \"decel\": 4.5,\n \"impatience\": 0.5,\n \"maxSpeed\": 30,\n \"minGap\": 2.5,\n \"sigma\": 0.5,\n \"speedDev\": 0.1,\n \"speedFactor\": 1.0,\n \"tau\": 1.0\n },\n \"speed_mode\": 25\n },\n \"initial_speed\": 0,\n \"lane_change_controller\": [\n \"SimLaneChangeController\",\n {}\n ],\n \"lane_change_params\": {\n \"controller_params\": {\n \"laneChangeModel\": \"LC2013\",\n \"lcCooperative\": \"1.0\",\n \"lcKeepRight\": \"1.0\",\n \"lcSpeedGain\": \"1.0\",\n \"lcStrategic\": \"1.0\"\n },\n \"lane_change_mode\": 512\n },\n \"num_vehicles\": 21,\n \"routing_controller\": [\n \"ContinuousRouter\",\n {}\n ],\n \"veh_id\": \"human_0\"\n },\n {\n \"acceleration_controller\": [\n \"RLController\",\n {}\n ],\n \"car_following_params\": {\n \"controller_params\": {\n \"accel\": 2.6,\n \"carFollowModel\": \"IDM\",\n \"decel\": 4.5,\n \"impatience\": 0.5,\n \"maxSpeed\": 30,\n \"minGap\": 2.5,\n \"sigma\": 0.5,\n \"speedDev\": 0.1,\n \"speedFactor\": 1.0,\n \"tau\": 1.0\n },\n \"speed_mode\": 25\n },\n \"initial_speed\": 0,\n \"lane_change_controller\": [\n \"SimLaneChangeController\",\n {}\n ],\n \"lane_change_params\": {\n \"controller_params\": {\n \"laneChangeModel\": \"LC2013\",\n \"lcCooperative\": \"1.0\",\n \"lcKeepRight\": \"1.0\",\n \"lcSpeedGain\": \"1.0\",\n \"lcStrategic\": \"1.0\"\n },\n \"lane_change_mode\": 512\n },\n \"num_vehicles\": 1,\n \"routing_controller\": [\n \"ContinuousRouter\",\n {}\n ],\n \"veh_id\": \"rl_0\"\n }\n ]\n}", |
| 23 | + "flow_params": "{\n \"env\": {\n \"additional_params\": {\n \"max_accel\": 3,\n \"max_decel\": 3,\n \"sort_vehicles\": false,\n \"target_velocity\": 20\n },\n \"clip_actions\": true,\n \"evaluate\": false,\n \"horizon\": 1500,\n \"sims_per_step\": 1,\n \"warmup_steps\": 0\n },\n \"env_name\": \"flow.envs.multiagent.ring.accel.MultiAgentAccelPOEnv\",\n \"exp_tag\": \"multiagent_figure_eight\",\n \"initial\": {\n \"additional_params\": {},\n \"bunching\": 0,\n \"edges_distribution\": \"all\",\n \"lanes_distribution\": Infinity,\n \"min_gap\": 0,\n \"perturbation\": 0.0,\n \"shuffle\": false,\n \"spacing\": \"uniform\",\n \"x0\": 0\n },\n \"net\": {\n \"additional_params\": {\n \"lanes\": 1,\n \"radius_ring\": 30,\n \"resolution\": 40,\n \"speed_limit\": 30\n },\n \"inflows\": {\n \"_InFlows__flows\": []\n },\n \"osm_path\": null,\n \"template\": null\n },\n \"network\": \"flow.networks.figure_eight.FigureEightNetwork\",\n \"sim\": {\n \"color_by_speed\": false,\n \"emission_path\": null,\n \"force_color_update\": false,\n \"lateral_resolution\": null,\n \"no_step_log\": true,\n \"num_clients\": 1,\n \"overtake_right\": false,\n \"port\": null,\n \"print_warnings\": true,\n \"pxpm\": 2,\n \"render\": false,\n \"restart_instance\": false,\n \"save_render\": false,\n \"seed\": null,\n \"show_radius\": false,\n \"sight_radius\": 25,\n \"sim_step\": 0.1,\n \"teleport_time\": -1,\n \"use_ballistic\": false\n },\n \"simulator\": \"traci\",\n \"veh\": [\n {\n \"acceleration_controller\": [\n \"IDMController\",\n {\n \"noise\": 0.2\n }\n ],\n \"car_following_params\": {\n \"controller_params\": {\n \"accel\": 2.6,\n \"carFollowModel\": \"IDM\",\n \"decel\": 1.5,\n \"impatience\": 0.5,\n \"maxSpeed\": 30,\n \"minGap\": 2.5,\n \"sigma\": 0.5,\n \"speedDev\": 0.1,\n \"speedFactor\": 1.0,\n \"tau\": 1.0\n },\n \"speed_mode\": 1\n },\n \"initial_speed\": 0,\n \"lane_change_controller\": [\n \"SimLaneChangeController\",\n {}\n ],\n \"lane_change_params\": {\n \"controller_params\": {\n \"laneChangeModel\": \"LC2013\",\n \"lcCooperative\": \"1.0\",\n \"lcKeepRight\": \"1.0\",\n \"lcSpeedGain\": \"1.0\",\n \"lcStrategic\": \"1.0\"\n },\n \"lane_change_mode\": 512\n },\n \"num_vehicles\": 6,\n \"routing_controller\": [\n \"ContinuousRouter\",\n {}\n ],\n \"veh_id\": \"human_0\"\n },\n {\n \"acceleration_controller\": [\n \"RLController\",\n {}\n ],\n \"car_following_params\": {\n \"controller_params\": {\n \"accel\": 3,\n \"carFollowModel\": \"IDM\",\n \"decel\": 3,\n \"impatience\": 0.5,\n \"maxSpeed\": 30,\n \"minGap\": 2.5,\n \"sigma\": 0.5,\n \"speedDev\": 0.1,\n \"speedFactor\": 1.0,\n \"tau\": 1.0\n },\n \"speed_mode\": 1\n },\n \"initial_speed\": 0,\n \"lane_change_controller\": [\n \"SimLaneChangeController\",\n {}\n ],\n \"lane_change_params\": {\n \"controller_params\": {\n \"laneChangeModel\": \"LC2013\",\n \"lcCooperative\": \"1.0\",\n \"lcKeepRight\": \"1.0\",\n \"lcSpeedGain\": \"1.0\",\n \"lcStrategic\": \"1.0\"\n },\n \"lane_change_mode\": 512\n },\n \"num_vehicles\": 1,\n \"routing_controller\": [\n \"ContinuousRouter\",\n {}\n ],\n \"veh_id\": \"rl_0\"\n },\n {\n \"acceleration_controller\": [\n \"IDMController\",\n {\n \"noise\": 0.2\n }\n ],\n \"car_following_params\": {\n \"controller_params\": {\n \"accel\": 2.6,\n \"carFollowModel\": \"IDM\",\n \"decel\": 1.5,\n \"impatience\": 0.5,\n \"maxSpeed\": 30,\n \"minGap\": 2.5,\n \"sigma\": 0.5,\n \"speedDev\": 0.1,\n \"speedFactor\": 1.0,\n \"tau\": 1.0\n },\n \"speed_mode\": 1\n },\n \"initial_speed\": 0,\n \"lane_change_controller\": [\n \"SimLaneChangeController\",\n {}\n ],\n \"lane_change_params\": {\n \"controller_params\": {\n \"laneChangeModel\": \"LC2013\",\n \"lcCooperative\": \"1.0\",\n \"lcKeepRight\": \"1.0\",\n \"lcSpeedGain\": \"1.0\",\n \"lcStrategic\": \"1.0\"\n },\n \"lane_change_mode\": 512\n },\n \"num_vehicles\": 6,\n \"routing_controller\": [\n \"ContinuousRouter\",\n {}\n ],\n \"veh_id\": \"human_1\"\n },\n {\n \"acceleration_controller\": [\n \"RLController\",\n {}\n ],\n \"car_following_params\": {\n \"controller_params\": {\n \"accel\": 3,\n \"carFollowModel\": \"IDM\",\n \"decel\": 3,\n \"impatience\": 0.5,\n \"maxSpeed\": 30,\n \"minGap\": 2.5,\n \"sigma\": 0.5,\n \"speedDev\": 0.1,\n \"speedFactor\": 1.0,\n \"tau\": 1.0\n },\n \"speed_mode\": 1\n },\n \"initial_speed\": 0,\n \"lane_change_controller\": [\n \"SimLaneChangeController\",\n {}\n ],\n \"lane_change_params\": {\n \"controller_params\": {\n \"laneChangeModel\": \"LC2013\",\n \"lcCooperative\": \"1.0\",\n \"lcKeepRight\": \"1.0\",\n \"lcSpeedGain\": \"1.0\",\n \"lcStrategic\": \"1.0\"\n },\n \"lane_change_mode\": 512\n },\n \"num_vehicles\": 1,\n \"routing_controller\": [\n \"ContinuousRouter\",\n {}\n ],\n \"veh_id\": \"rl_1\"\n }\n ]\n}", |
22 | 24 | "run": "PPO"
|
23 | 25 | },
|
24 | 26 | "evaluation_config": {},
|
25 | 27 | "evaluation_interval": null,
|
26 | 28 | "evaluation_num_episodes": 10,
|
27 | 29 | "gamma": 0.999,
|
28 | 30 | "grad_clip": null,
|
29 |
| - "horizon": 3000, |
| 31 | + "horizon": 1500, |
30 | 32 | "ignore_worker_failures": false,
|
31 | 33 | "input": "sampler",
|
32 | 34 | "input_evaluation": [
|
33 | 35 | "is",
|
34 | 36 | "wis"
|
35 | 37 | ],
|
36 | 38 | "kl_coeff": 0.2,
|
37 |
| - "kl_target": 0.01, |
38 |
| - "lambda": 1.0, |
| 39 | + "kl_target": 0.02, |
| 40 | + "lambda": 0.97, |
39 | 41 | "local_tf_session_args": {
|
40 | 42 | "inter_op_parallelism_threads": 8,
|
41 | 43 | "intra_op_parallelism_threads": 8
|
42 | 44 | },
|
43 |
| - "log_level": "INFO", |
| 45 | + "log_level": "WARN", |
44 | 46 | "log_sys_usage": true,
|
45 |
| - "lr": 1e-05, |
| 47 | + "lr": 5e-05, |
46 | 48 | "lr_schedule": null,
|
| 49 | + "memory": 0, |
| 50 | + "memory_per_worker": 0, |
47 | 51 | "metrics_smoothing_episodes": 100,
|
48 | 52 | "min_iter_time_s": 0,
|
49 | 53 | "model": {
|
50 | 54 | "conv_activation": "relu",
|
51 | 55 | "conv_filters": null,
|
| 56 | + "custom_action_dist": null, |
52 | 57 | "custom_model": null,
|
53 | 58 | "custom_options": {},
|
54 | 59 | "custom_preprocessor": null,
|
55 | 60 | "dim": 84,
|
56 | 61 | "fcnet_activation": "tanh",
|
57 | 62 | "fcnet_hiddens": [
|
| 63 | + 32, |
58 | 64 | 32,
|
59 | 65 | 32
|
60 | 66 | ],
|
|
75 | 81 | "policies": {
|
76 | 82 | "av": [
|
77 | 83 | "<class 'ray.rllib.policy.tf_policy_template.PPOTFPolicy'>",
|
78 |
| - "Box(3,)", |
| 84 | + "Box(6,)", |
79 | 85 | "Box(1,)",
|
80 | 86 | {}
|
81 | 87 | ]
|
82 | 88 | },
|
83 |
| - "policies_to_train": [ |
84 |
| - "av" |
85 |
| - ], |
86 |
| - "policy_mapping_fn": "tune.function(<function setup_exps.<locals>.policy_mapping_fn at 0x7fda132e6c80>)" |
| 89 | + "policies_to_train": null, |
| 90 | + "policy_mapping_fn": "<function policy_mapping_fn at 0x147740598>" |
87 | 91 | },
|
| 92 | + "no_done_at_end": false, |
| 93 | + "no_eager_on_workers": false, |
88 | 94 | "num_cpus_for_driver": 1,
|
89 | 95 | "num_cpus_per_worker": 1,
|
90 | 96 | "num_envs_per_worker": 1,
|
91 | 97 | "num_gpus": 0,
|
92 | 98 | "num_gpus_per_worker": 0,
|
93 |
| - "num_sgd_iter": 30, |
| 99 | + "num_sgd_iter": 10, |
94 | 100 | "num_workers": 2,
|
| 101 | + "object_store_memory": 0, |
| 102 | + "object_store_memory_per_worker": 0, |
95 | 103 | "observation_filter": "NoFilter",
|
96 | 104 | "optimizer": {},
|
97 | 105 | "output": null,
|
|
110 | 118 | "sgd_minibatch_size": 128,
|
111 | 119 | "shuffle_buffer_size": 0,
|
112 | 120 | "shuffle_sequences": true,
|
113 |
| - "simple_optimizer": true, |
| 121 | + "simple_optimizer": false, |
114 | 122 | "soft_horizon": false,
|
115 | 123 | "synchronize_filters": true,
|
116 | 124 | "tf_session_args": {
|
|
126 | 134 | "log_device_placement": false
|
127 | 135 | },
|
128 | 136 | "timesteps_per_iteration": 0,
|
129 |
| - "train_batch_size": 60000, |
| 137 | + "train_batch_size": 30000, |
130 | 138 | "use_gae": true,
|
131 | 139 | "vf_clip_param": 10.0,
|
132 | 140 | "vf_loss_coeff": 1.0,
|
|
0 commit comments