File size: 13,907 Bytes
571b03b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
{
    "policy_class": {
        ":type:": "<class 'abc.ABCMeta'>",
        ":serialized:": "gASVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
        "__module__": "stable_baselines3.common.policies",
        "__doc__": "\n    Policy class for actor-critic algorithms (has both policy and value prediction).\n    Used by A2C, PPO and the likes.\n\n    :param observation_space: Observation space\n    :param action_space: Action space\n    :param lr_schedule: Learning rate schedule (could be constant)\n    :param net_arch: The specification of the policy and value networks.\n    :param activation_fn: Activation function\n    :param ortho_init: Whether to use or not orthogonal initialization\n    :param use_sde: Whether to use State Dependent Exploration or not\n    :param log_std_init: Initial value for the log standard deviation\n    :param full_std: Whether to use (n_features x n_actions) parameters\n        for the std instead of only (n_features,) when using gSDE\n    :param sde_net_arch: Network architecture for extracting features\n        when using gSDE. If None, the latent features from the policy will be used.\n        Pass an empty list to use the states as features.\n    :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n        a positive standard deviation (cf paper). It allows to keep variance\n        above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n    :param squash_output: Whether to squash the output using a tanh function,\n        this allows to ensure boundaries when using gSDE.\n    :param features_extractor_class: Features extractor to use.\n    :param features_extractor_kwargs: Keyword arguments\n        to pass to the features extractor.\n    :param normalize_images: Whether to normalize images or not,\n         dividing by 255.0 (True by default)\n    :param optimizer_class: The optimizer to use,\n        ``th.optim.Adam`` by default\n    :param optimizer_kwargs: Additional keyword arguments,\n        excluding the learning rate, to pass to the optimizer\n    ",
        "__init__": "<function ActorCriticPolicy.__init__ at 0x7f109e1b87a0>",
        "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f109e1b8830>",
        "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f109e1b88c0>",
        "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f109e1b8950>",
        "_build": "<function ActorCriticPolicy._build at 0x7f109e1b89e0>",
        "forward": "<function ActorCriticPolicy.forward at 0x7f109e1b8a70>",
        "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f109e1b8b00>",
        "_predict": "<function ActorCriticPolicy._predict at 0x7f109e1b8b90>",
        "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f109e1b8c20>",
        "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f109e1b8cb0>",
        "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f109e1b8d40>",
        "__abstractmethods__": "frozenset()",
        "_abc_impl": "<_abc_data object at 0x7f109e18c360>"
    },
    "verbose": 1,
    "policy_kwargs": {},
    "observation_space": {
        ":type:": "<class 'gym.spaces.box.Box'>",
        ":serialized:": "gASVwwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBVudW1weS5jb3JlLm11bHRpYXJyYXmUjAxfcmVjb25zdHJ1Y3SUk5RoBowHbmRhcnJheZSTlEsAhZRDAWKUh5RSlChLAUsIhZRoColDIAAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/lHSUYowEaGlnaJRoEmgUSwCFlGgWh5RSlChLAUsIhZRoColDIAAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/lHSUYowNYm91bmRlZF9iZWxvd5RoEmgUSwCFlGgWh5RSlChLAUsIhZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYolDCAAAAAAAAAAAlHSUYowNYm91bmRlZF9hYm92ZZRoEmgUSwCFlGgWh5RSlChLAUsIhZRoKolDCAAAAAAAAAAAlHSUYowKX25wX3JhbmRvbZROdWIu",
        "dtype": "float32",
        "_shape": [
            8
        ],
        "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]",
        "high": "[inf inf inf inf inf inf inf inf]",
        "bounded_below": "[False False False False False False False False]",
        "bounded_above": "[False False False False False False False False]",
        "_np_random": null
    },
    "action_space": {
        ":type:": "<class 'gym.spaces.discrete.Discrete'>",
        ":serialized:": "gASVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu",
        "n": 4,
        "_shape": [],
        "dtype": "int64",
        "_np_random": null
    },
    "n_envs": 1,
    "num_timesteps": 500736,
    "_total_timesteps": 500000,
    "_num_timesteps_at_start": 0,
    "seed": null,
    "action_noise": null,
    "start_time": 1652403659.498233,
    "learning_rate": 0.0003,
    "tensorboard_log": null,
    "lr_schedule": {
        ":type:": "<class 'function'>",
        ":serialized:": "gASVXwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX2ZpbGxfZnVuY3Rpb26Uk5QoaACMD19tYWtlX3NrZWxfZnVuY5STlGgAjA1fYnVpbHRpbl90eXBllJOUjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlEsBfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEgvdXNyL2xvY2FsL2xpYi9weXRob24zLjcvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdYeUUpR9lCiMB2dsb2JhbHOUfZSMCGRlZmF1bHRzlE6MBGRpY3SUfZSMDmNsb3N1cmVfdmFsdWVzlF2URz8zqSowVTJhYYwGbW9kdWxllGgZjARuYW1llGgPjANkb2OUTowXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC2Fubm90YXRpb25zlH2UjAhxdWFsbmFtZZSMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjAprd2RlZmF1bHRzlE51dFIu"
    },
    "_last_obs": {
        ":type:": "<class 'numpy.ndarray'>",
        ":serialized:": "gASVqgAAAAAAAACMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMDF9yZWNvbnN0cnVjdJSTlIwFbnVtcHmUjAduZGFycmF5lJOUSwCFlEMBYpSHlFKUKEsBSwFLCIaUaAOMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiiUMg7fwmPsNlLDs2eui8rQIxPFbF9D14iWu9AACAPwAAgD+UdJRiLg=="
    },
    "_last_episode_starts": {
        ":type:": "<class 'numpy.ndarray'>",
        ":serialized:": "gASViQAAAAAAAACMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMDF9yZWNvbnN0cnVjdJSTlIwFbnVtcHmUjAduZGFycmF5lJOUSwCFlEMBYpSHlFKUKEsBSwGFlGgDjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYolDAQCUdJRiLg=="
    },
    "_last_original_obs": null,
    "_episode_num": 0,
    "use_sde": false,
    "sde_sample_freq": -1,
    "_current_progress_remaining": -0.0014719999999999178,
    "ep_info_buffer": {
        ":type:": "<class 'collections.deque'>",
        ":serialized:": "gASVgRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMI31M57ak5YUCUhpRSlIwBbJRN6AOMAXSUR0CRDS/IKc/ddX2UKGgGaAloD0MIs874vjjdbkCUhpRSlGgVTSADaBZHQJEUlb2USqV1fZQoaAZoCWgPQwhb6bXZ2ARsQJSGlFKUaBVNZgFoFkdAkRbji0fHP3V9lChoBmgJaA9DCLRYiuSrEHBAlIaUUpRoFU1NAWgWR0CRGQtDUmUodX2UKGgGaAloD0MIke18PzXbbUCUhpRSlGgVTTABaBZHQJEcGMir1dx1fZQoaAZoCWgPQwgVyOws+sluQJSGlFKUaBVNVwFoFkdAkR5iXt0FKXV9lChoBmgJaA9DCPOOU3Sk9XFAlIaUUpRoFU1NAWgWR0CRIFraufVadX2UKGgGaAloD0MI56vkY3cvckCUhpRSlGgVTWEBaBZHQJEjoR/ViF11fZQoaAZoCWgPQwjnUIaqGKRsQJSGlFKUaBVNQAFoFkdAkSWiW/rSmnV9lChoBmgJaA9DCNe9FYmJ629AlIaUUpRoFU1jAWgWR0CRJ/mSyMUAdX2UKGgGaAloD0MI4syv5gDPa0CUhpRSlGgVTTUBaBZHQJErJTqB3A51fZQoaAZoCWgPQwhRFVPppx9vQJSGlFKUaBVNeAFoFkdAkS17Fn7HhnV9lChoBmgJaA9DCPM5d7te025AlIaUUpRoFU28AWgWR0CRMZNvOyE+dX2UKGgGaAloD0MIE51lFqHHbkCUhpRSlGgVTcABaBZHQJE0ks8PnSx1fZQoaAZoCWgPQwjXUGovIgJuQJSGlFKUaBVNlQJoFkdAkTpa2v0ROHV9lChoBmgJaA9DCL98smL4nHFAlIaUUpRoFU1pAWgWR0CRPKh3qzJIdX2UKGgGaAloD0MIwW7Ytqi3bUCUhpRSlGgVTUIBaBZHQJE+kinpB5Z1fZQoaAZoCWgPQwjLSSh9IXJvQJSGlFKUaBVNEgNoFkdAkUWUGJN0vHV9lChoBmgJaA9DCLeZCvEIIXFAlIaUUpRoFU3oAmgWR0CRTF4iHIp6dX2UKGgGaAloD0MIqpog6j5vcUCUhpRSlGgVTU0BaBZHQJFOTr7fpEB1fZQoaAZoCWgPQwjWqfI9IwpuQJSGlFKUaBVNQgFoFkdAkVBLdrO7hHV9lChoBmgJaA9DCJfjFYieEm5AlIaUUpRoFU1hAWgWR0CRU9wUQCjldX2UKGgGaAloD0MIYVRSJyC0akCUhpRSlGgVTWcBaBZHQJFWE/pt78h1fZQoaAZoCWgPQwiZDwh0JtVhQJSGlFKUaBVN6ANoFkdAkWAcI7eVLXV9lChoBmgJaA9DCFlN1xPdC2pAlIaUUpRoFU1nAWgWR0CRYpFiay8jdX2UKGgGaAloD0MIDeNuEK1lMkCUhpRSlGgVTVkBaBZHQJFl6vFFUhp1fZQoaAZoCWgPQwjGFoIc1IhwQJSGlFKUaBVNYgFoFkdAkWhWS+xnnXV9lChoBmgJaA9DCJmCNc6m5GxAlIaUUpRoFU2bAWgWR0CRbDpJwsGxdX2UKGgGaAloD0MIDoXP1sEDbUCUhpRSlGgVTcgBaBZHQJFvd9lVcUx1fZQoaAZoCWgPQwheTZ6yGpJxQJSGlFKUaBVNZwFoFkdAkXHfBnBciXV9lChoBmgJaA9DCFhYcD9gnXBAlIaUUpRoFU2kAWgWR0CRdhuDBdledX2UKGgGaAloD0MIs7ES86xeQcCUhpRSlGgVTYMBaBZHQJF4mimEXch1fZQoaAZoCWgPQwjyzwziw65wQJSGlFKUaBVNQwJoFkdAkX3uLWI42nV9lChoBmgJaA9DCN4E3zR9FHBAlIaUUpRoFU3fAWgWR0CRgUZUDMePdX2UKGgGaAloD0MIknU4ukpqb0CUhpRSlGgVTaYBaBZHQJGFLk5p8F91fZQoaAZoCWgPQwiJljyelpNuQJSGlFKUaBVN3gFoFkdAkYjkhJRO13V9lChoBmgJaA9DCCwOZ351hnFAlIaUUpRoFU3DAWgWR0CRi9zDGcWkdX2UKGgGaAloD0MI2zNLAlRZYUCUhpRSlGgVTZoCaBZHQJGSHhl18st1fZQoaAZoCWgPQwgTZARU+DlwQJSGlFKUaBVNnAFoFkdAkZT4G2TgVHV9lChoBmgJaA9DCPPK9bYZH29AlIaUUpRoFU3EAWgWR0CRmS9Ba9sadX2UKGgGaAloD0MIOLu1TIbeb0CUhpRSlGgVTa0BaBZHQJGcJoRIz311fZQoaAZoCWgPQwjba0HvjUVxQJSGlFKUaBVNgwFoFkdAkZ/gQpWmxnV9lChoBmgJaA9DCHUGRl7Wdm5AlIaUUpRoFU2rAWgWR0CRopbT+ee4dX2UKGgGaAloD0MIE7u2t1uxbECUhpRSlGgVTaIBaBZHQJGmewPiDNB1fZQoaAZoCWgPQwj9TL1ukRFuQJSGlFKUaBVNswFoFkdAkakrv5P/JnV9lChoBmgJaA9DCDzB/uscWXBAlIaUUpRoFU2pAWgWR0CRrANyYG+sdX2UKGgGaAloD0MIlddK6K5sbUCUhpRSlGgVTcUBaBZHQJGwIh8pkPN1fZQoaAZoCWgPQwj+tidIbDtwQJSGlFKUaBVNhgFoFkdAkbKmkadc0XV9lChoBmgJaA9DCMe8jjjkqG5AlIaUUpRoFU1nAWgWR0CRtly44Ia+dX2UKGgGaAloD0MI/mDgufd4bkCUhpRSlGgVTZgBaBZHQJG5ROGj9GZ1fZQoaAZoCWgPQwif508blWBwQJSGlFKUaBVN2wFoFkdAkby0FKTSs3V9lChoBmgJaA9DCPJfIAiQo1lAlIaUUpRoFU3oA2gWR0CRxrH3Dej3dX2UKGgGaAloD0MI4V0u4jvmbECUhpRSlGgVTbgCaBZHQJHNB9y925h1fZQoaAZoCWgPQwgLCoMyDapqQJSGlFKUaBVNgQFoFkdAkc+pv1lGw3V9lChoBmgJaA9DCIyjchM1FWBAlIaUUpRoFU3oA2gWR0CR2CVuJk5IdX2UKGgGaAloD0MIpmH4iBhgcECUhpRSlGgVTbcBaBZHQJHcL2f02+B1fZQoaAZoCWgPQwgx73GmCfZsQJSGlFKUaBVNKwJoFkdAkeA2HDaXbHV9lChoBmgJaA9DCN82UyGerGxAlIaUUpRoFU3CAWgWR0CR5QUdq+JxdX2UKGgGaAloD0MIVtKKbygVYECUhpRSlGgVTegDaBZHQJHtG1twaR91fZQoaAZoCWgPQwj4wmSqYDpwQJSGlFKUaBVNzAFoFkdAkfBlOXVslHV9lChoBmgJaA9DCIMz+PtF9WpAlIaUUpRoFU0lAmgWR0CR9kMuvlltdX2UKGgGaAloD0MIAWpq2drhZUCUhpRSlGgVTegDaBZHQJH/3SPU8V51fZQoaAZoCWgPQwgo84++yWlhQJSGlFKUaBVN6ANoFkdAkgioiHIp6XV9lChoBmgJaA9DCDCca5ihqWpAlIaUUpRoFU3AAWgWR0CSC+CuU2UCdX2UKGgGaAloD0MIhBCQLyGdbkCUhpRSlGgVTd8BaBZHQJIQG+evpyJ1fZQoaAZoCWgPQwi2D3nLlWlwQJSGlFKUaBVNowFoFkdAkhMK64Ds+nV9lChoBmgJaA9DCPsD5bZ9/WpAlIaUUpRoFU2HAWgWR0CSFbjAzpHJdX2UKGgGaAloD0MILIApA4cKbkCUhpRSlGgVTSkCaBZHQJIbW2Dxsl91fZQoaAZoCWgPQwiJCtXNxQFxQJSGlFKUaBVNwQFoFkdAkh6bP6be/HV9lChoBmgJaA9DCI4EGmxqu3BAlIaUUpRoFU21AWgWR0CSIps/pt78dX2UKGgGaAloD0MIkgVM4JY7cUCUhpRSlGgVTb4BaBZHQJIlgqtozvZ1fZQoaAZoCWgPQwh3FOeoI+tvQJSGlFKUaBVNwwFoFkdAkimBXKbKBHV9lChoBmgJaA9DCIUjSKXYJG9AlIaUUpRoFU24AWgWR0CSLGrXlKbsdX2UKGgGaAloD0MIa9PYXgsYbkCUhpRSlGgVTb0BaBZHQJIwt19v0iB1fZQoaAZoCWgPQwjXTSmvFdFtQJSGlFKUaBVNoAFoFkdAkjPSprDZUXV9lChoBmgJaA9DCBHGT+Pe23BAlIaUUpRoFU3cAWgWR0CSNwtFKCg9dX2UKGgGaAloD0MINgNckK2EcUCUhpRSlGgVTZMBaBZHQJI65pnHvMN1fZQoaAZoCWgPQwjXMa64OH9vQJSGlFKUaBVNsgFoFkdAkj5ophF3IXV9lChoBmgJaA9DCERq2sU0PGpAlIaUUpRoFU3IAWgWR0CSQuA9mpVCdX2UKGgGaAloD0MIKxcq/1oabUCUhpRSlGgVTZwBaBZHQJJF/ojfNzN1fZQoaAZoCWgPQwgeF9UioqJrQJSGlFKUaBVNBQJoFkdAkkrcXWOIZnV9lChoBmgJaA9DCIEFMGVgf25AlIaUUpRoFU3EAWgWR0CSTfri2lVMdX2UKGgGaAloD0MINiOD3IVMcECUhpRSlGgVTbYBaBZHQJJR3KEFnqV1fZQoaAZoCWgPQwhLj6Z68olwQJSGlFKUaBVNhQFoFkdAklRR6Ww/xHV9lChoBmgJaA9DCGBWKNL92G9AlIaUUpRoFU3eAWgWR0CSV5qCpWFOdX2UKGgGaAloD0MIwVWeQNiocECUhpRSlGgVTWoBaBZHQJJbCOaOPvN1fZQoaAZoCWgPQwjrbwnA/41wQJSGlFKUaBVNgQFoFkdAkl1597Wuo3V9lChoBmgJaA9DCI21v7M92G9AlIaUUpRoFU3IAWgWR0CSYcwD/2kBdX2UKGgGaAloD0MIUrr0L0kfbUCUhpRSlGgVTYwBaBZHQJJkpOwgTyt1fZQoaAZoCWgPQwiCyvj3GVtvQJSGlFKUaBVN0wFoFkdAkmfSYsunM3V9lChoBmgJaA9DCGSWPQls019AlIaUUpRoFU3oA2gWR0CScCqveP7vdX2UKGgGaAloD0MICOOncS9ScECUhpRSlGgVTdwBaBZHQJJ0mgg5imV1fZQoaAZoCWgPQwjSj4ZTZgRtQJSGlFKUaBVNkQFoFkdAkncPKyOaOXV9lChoBmgJaA9DCHvBpzn5kGpAlIaUUpRoFU2UAWgWR0CSeuepXIU8dX2UKGgGaAloD0MIPZ6WH7gAcECUhpRSlGgVTcwBaBZHQJJ+Dh0hePd1fZQoaAZoCWgPQwgYmYBfo1RrQJSGlFKUaBVNpwFoFkdAkoC/m1YyPHV9lChoBmgJaA9DCO0MU1vqVW5AlIaUUpRoFU3bAWgWR0CShUkAPuohdX2UKGgGaAloD0MI1LfM6fKocECUhpRSlGgVTawBaBZHQJKIISYgJTl1fZQoaAZoCWgPQwjBjv8CARZwQJSGlFKUaBVNeQFoFkdAkouyyt3fRHV9lChoBmgJaA9DCOId4EkLYWxAlIaUUpRoFU24AWgWR0CSjqIRAbADdWUu"
    },
    "ep_success_buffer": {
        ":type:": "<class 'collections.deque'>",
        ":serialized:": "gASVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
    },
    "_n_updates": 1956,
    "n_steps": 1024,
    "gamma": 0.999,
    "gae_lambda": 0.98,
    "ent_coef": 0.01,
    "vf_coef": 0.5,
    "max_grad_norm": 0.5,
    "batch_size": 64,
    "n_epochs": 4,
    "clip_range": {
        ":type:": "<class 'function'>",
        ":serialized:": "gASVXwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX2ZpbGxfZnVuY3Rpb26Uk5QoaACMD19tYWtlX3NrZWxfZnVuY5STlGgAjA1fYnVpbHRpbl90eXBllJOUjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlEsBfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEgvdXNyL2xvY2FsL2xpYi9weXRob24zLjcvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdYeUUpR9lCiMB2dsb2JhbHOUfZSMCGRlZmF1bHRzlE6MBGRpY3SUfZSMDmNsb3N1cmVfdmFsdWVzlF2URz/JmZmZmZmaYYwGbW9kdWxllGgZjARuYW1llGgPjANkb2OUTowXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC2Fubm90YXRpb25zlH2UjAhxdWFsbmFtZZSMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjAprd2RlZmF1bHRzlE51dFIu"
    },
    "clip_range_vf": null,
    "normalize_advantage": true,
    "target_kl": null
}