{
  "battle_won_mean": [
    0.0,
    0.0,
    0.0
  ],
  "battle_won_mean_T": [
    190,
    20309,
    40443
  ],
  "ep_length_mean": [
    23.75,
    23.28587962962963,
    22.879545454545454
  ],
  "ep_length_mean_T": [
    190,
    20309,
    40443
  ],
  "episode": [
    864,
    1744
  ],
  "episode_T": [
    20119,
    40251
  ],
  "epsilon": [
    1.0,
    0.617739,
    0.23523100000000008
  ],
  "epsilon_T": [
    190,
    20309,
    40443
  ],
  "grad_norm": [
    15.953059992800439,
    2.724685948223765,
    1.590997387155217
  ],
  "grad_norm_T": [
    763,
    20883,
    40991
  ],
  "loss": [
    2.0028555393218994,
    0.08743997663259506,
    0.06634704023599625
  ],
  "loss_T": [
    763,
    20883,
    40991
  ],
  "q_taken_mean": [
    0.008163971273906369,
    0.43020190771065914,
    0.5808055622017865
  ],
  "q_taken_mean_T": [
    763,
    20883,
    40991
  ],
  "return_mean": [
    5.424197635135135,
    5.85646779592092,
    6.36121967137592
  ],
  "return_mean_T": [
    190,
    20309,
    40443
  ],
  "return_std": [
    0.4604345506038491,
    0.5803035025242452,
    0.6698600231190486
  ],
  "return_std_T": [
    190,
    20309,
    40443
  ],
  "target_mean": [
    0.20306575136863805,
    0.4524452715345907,
    0.5907033352231746
  ],
  "target_mean_T": [
    763,
    20883,
    40991
  ],
  "td_error_abs": [
    1.191874052875164,
    0.234304962364682,
    0.1996596091279336
  ],
  "td_error_abs_T": [
    763,
    20883,
    40991
  ],
  "test_battle_won_mean": [
    0.0,
    0.0,
    0.0
  ],
  "test_battle_won_mean_T": [
    190,
    20309,
    40443
  ],
  "test_ep_length_mean": [
    25.958333333333332,
    21.791666666666668,
    24.458333333333332
  ],
  "test_ep_length_mean_T": [
    190,
    20309,
    40443
  ],
  "test_return_mean": [
    7.6756756756756745,
    6.582207207207207,
    6.252604166666665
  ],
  "test_return_mean_T": [
    190,
    20309,
    40443
  ],
  "test_return_std": [
    0.7191424159810847,
    0.6201990757129011,
    0.8006676542389004
  ],
  "test_return_std_T": [
    190,
    20309,
    40443
  ]
}