Iteration: 1, Mean Reward: -269.72, Threshold: -203.86
Iteration: 2, Mean Reward: -214.88, Threshold: -174.57
Iteration: 3, Mean Reward: -193.35, Threshold: -163.07
Iteration: 4, Mean Reward: -181.44, Threshold: -150.71
Iteration: 5, Mean Reward: -179.10, Threshold: -150.28
Iteration: 6, Mean Reward: -164.94, Threshold: -146.30
Iteration: 7, Mean Reward: -166.23, Threshold: -143.38
Iteration: 8, Mean Reward: -164.63, Threshold: -142.32
Iteration: 9, Mean Reward: -158.53, Threshold: -137.96
Iteration: 10, Mean Reward: -151.76, Threshold: -135.14
Iteration: 11, Mean Reward: -146.64, Threshold: -131.94
Iteration: 12, Mean Reward: -143.42, Threshold: -128.11
Iteration: 13, Mean Reward: -141.43, Threshold: -125.82
Iteration: 14, Mean Reward: -137.67, Threshold: -121.26
Iteration: 15, Mean Reward: -134.23, Threshold: -119.86
Iteration: 16, Mean Reward: -136.16, Threshold: -120.03
Iteration: 17, Mean Reward: -136.39, Threshold: -120.20
Iteration: 18, Mean Reward: -133.29, Threshold: -117.34
Iteration: 19, Mean Reward: -129.45, Threshold: -111.65
Iteration: 20, Mean Reward: -116.96, Threshold: -102.58
Iteration: 21, Mean Reward: -111.81, Threshold: -97.48
Iteration: 22, Mean Reward: -106.67, Threshold: -91.14
Iteration: 23, Mean Reward: -103.95, Threshold: -87.00
Iteration: 24, Mean Reward: -99.29, Threshold: -85.47
Iteration: 25, Mean Reward: -97.34, Threshold: -80.83
Iteration: 26, Mean Reward: -92.53, Threshold: -72.83
Iteration: 27, Mean Reward: -86.11, Threshold: -69.51
Iteration: 28, Mean Reward: -80.60, Threshold: -63.33
Iteration: 29, Mean Reward: -75.42, Threshold: -58.15
Iteration: 30, Mean Reward: -70.59, Threshold: -50.97
Iteration: 31, Mean Reward: -68.76, Threshold: -49.85
Iteration: 32, Mean Reward: -61.13, Threshold: -42.77
Iteration: 33, Mean Reward: -51.18, Threshold: -33.70
Iteration: 34, Mean Reward: -43.07, Threshold: -28.81
Iteration: 35, Mean Reward: -39.56, Threshold: -23.69
Iteration: 36, Mean Reward: -36.65, Threshold: -23.10
Iteration: 37, Mean Reward: -33.14, Threshold: -21.38
Iteration: 38, Mean Reward: -29.72, Threshold: -17.45
Iteration: 39, Mean Reward: -33.77, Threshold: -18.18
Iteration: 40, Mean Reward: -32.35, Threshold: -17.26
Iteration: 41, Mean Reward: -31.75, Threshold: -13.29
Iteration: 42, Mean Reward: -24.68, Threshold: -10.19
Iteration: 43, Mean Reward: -25.64, Threshold: -8.92
Iteration: 44, Mean Reward: -23.88, Threshold: -8.31
Iteration: 45, Mean Reward: -23.91, Threshold: -8.06
Iteration: 46, Mean Reward: -20.34, Threshold: -1.55
Iteration: 47, Mean Reward: -17.85, Threshold: -5.08
Iteration: 48, Mean Reward: -14.60, Threshold: -2.69
Iteration: 49, Mean Reward: -15.16, Threshold: -1.01
Iteration: 50, Mean Reward: -13.45, Threshold: -0.35
Iteration: 51, Mean Reward: -11.53, Threshold: 1.86
Iteration: 52, Mean Reward: -7.97, Threshold: 12.26
Iteration: 53, Mean Reward: -6.37, Threshold: 6.34
Iteration: 54, Mean Reward: -7.71, Threshold: 8.11
Iteration: 55, Mean Reward: -6.05, Threshold: 14.80
Iteration: 56, Mean Reward: -10.54, Threshold: 18.15
Iteration: 57, Mean Reward: -12.18, Threshold: 11.31
Iteration: 58, Mean Reward: -9.79, Threshold: 14.14
Iteration: 59, Mean Reward: -5.03, Threshold: 16.74
Iteration: 60, Mean Reward: -1.74, Threshold: 27.77
Iteration: 61, Mean Reward: -0.54, Threshold: 29.65
Iteration: 62, Mean Reward: 2.07, Threshold: 34.06
Iteration: 63, Mean Reward: 3.84, Threshold: 36.15
Iteration: 64, Mean Reward: 14.03, Threshold: 44.41
Iteration: 65, Mean Reward: 15.56, Threshold: 50.69
Iteration: 66, Mean Reward: 16.35, Threshold: 50.72
Iteration: 67, Mean Reward: 26.99, Threshold: 56.30
Iteration: 68, Mean Reward: 17.75, Threshold: 47.04
Iteration: 69, Mean Reward: 8.56, Threshold: 46.65
Iteration: 70, Mean Reward: 13.78, Threshold: 49.92
Iteration: 71, Mean Reward: 17.87, Threshold: 50.34
Iteration: 72, Mean Reward: 26.04, Threshold: 56.95
Iteration: 73, Mean Reward: 20.07, Threshold: 58.79
Iteration: 74, Mean Reward: 24.12, Threshold: 60.84
Iteration: 75, Mean Reward: 32.86, Threshold: 62.61
Iteration: 76, Mean Reward: 20.36, Threshold: 59.52
Iteration: 77, Mean Reward: 25.65, Threshold: 58.96
Iteration: 78, Mean Reward: 19.73, Threshold: 53.70
Iteration: 79, Mean Reward: 30.65, Threshold: 65.19
Iteration: 80, Mean Reward: 30.73, Threshold: 64.52
Iteration: 81, Mean Reward: 26.07, Threshold: 62.50
Iteration: 82, Mean Reward: 27.76, Threshold: 71.62
Iteration: 83, Mean Reward: 29.18, Threshold: 69.42
Iteration: 84, Mean Reward: 34.19, Threshold: 67.37
Iteration: 85, Mean Reward: 31.08, Threshold: 67.35
Iteration: 86, Mean Reward: 32.46, Threshold: 65.26
Iteration: 87, Mean Reward: 25.25, Threshold: 67.23
Iteration: 88, Mean Reward: 32.50, Threshold: 65.15
Iteration: 89, Mean Reward: 33.05, Threshold: 68.15
Iteration: 90, Mean Reward: 33.94, Threshold: 62.61
Iteration: 91, Mean Reward: 34.96, Threshold: 62.65
Iteration: 92, Mean Reward: 35.79, Threshold: 67.68
Iteration: 93, Mean Reward: 35.53, Threshold: 62.79
Iteration: 94, Mean Reward: 34.33, Threshold: 61.85
Iteration: 95, Mean Reward: 26.08, Threshold: 54.09
Iteration: 96, Mean Reward: 28.57, Threshold: 55.93
Iteration: 97, Mean Reward: 29.68, Threshold: 56.43
Iteration: 98, Mean Reward: 28.07, Threshold: 54.67
Iteration: 99, Mean Reward: 40.48, Threshold: 68.97
Iteration: 100, Mean Reward: 37.26, Threshold: 63.06