-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathnohup.out
5628 lines (5628 loc) · 201 KB
/
nohup.out
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
'args'
{'action_scale': 1.0,
'advantages_per_action': False,
'adversary_accel': 3.0,
'adversary_max_speed': 1.0,
'adversary_size': 0.2,
'agent_size': 0.2,
'arena_size': 1.0,
'batch_size': 500,
'collaborative': True,
'comm_action_one': False,
'comm_init': 'uniform',
'comm_mask_zero': False,
'comm_mode': 'avg',
'comm_passes': 1,
'commnet': False,
'continuous': False,
'detach_gap': 10000,
'dim_actions': 1,
'display': True,
'entr': 0,
'env_name': 'simple_spread',
'epoch_size': 10,
'gamma': 1.0,
'good_accel': 1.0,
'good_max_speed': 0.5,
'good_size': 0.1,
'hard_attn': False,
'hid_size': 64,
'ic3net': False,
'landmark_size': 0.1,
'load': '',
'lrate': 0.001,
'max_steps': 100,
'mean_ratio': 1.0,
'naction_heads': [5],
'nactions': '1',
'nagents': 3,
'nfriendly': 3,
'normalize_rewards': False,
'nprocesses': 12,
'num_actions': [5],
'num_adversaries': 2,
'num_epochs': 1000,
'num_good_agents': 1,
'num_inputs': 18,
'num_landmarks': 3,
'plot': True,
'plot_env': 'main',
'random': False,
'record_video': False,
'recurrent': False,
'rnn_type': 'MLP',
'save': 'model_1g',
'save_every': 10,
'seed': 8376,
'share_weights': False,
'silent': True,
'tau': 1.0,
'value_coeff': 0.01,
'video_name': ''}
Setting up a new session...
Setting up a new session...
'args'
{'action_scale': 1.0,
'advantages_per_action': False,
'adversary_accel': 3.0,
'adversary_max_speed': 1.0,
'adversary_size': 0.2,
'agent_size': 0.2,
'arena_size': 1.0,
'batch_size': 500,
'collaborative': True,
'comm_action_one': False,
'comm_init': 'uniform',
'comm_mask_zero': False,
'comm_mode': 'avg',
'comm_passes': 1,
'commnet': False,
'continuous': False,
'detach_gap': 10000,
'dim_actions': 1,
'display': True,
'entr': 0,
'env_name': 'simple_spread',
'epoch_size': 10,
'gamma': 1.0,
'good_accel': 1.0,
'good_max_speed': 0.5,
'good_size': 0.1,
'hard_attn': False,
'hid_size': 64,
'ic3net': False,
'landmark_size': 0.1,
'load': '',
'lrate': 0.001,
'max_steps': 100,
'mean_ratio': 1.0,
'naction_heads': [5],
'nactions': '1',
'nagents': 3,
'nfriendly': 3,
'normalize_rewards': False,
'nprocesses': 1,
'num_actions': [5],
'num_adversaries': 2,
'num_epochs': 1000,
'num_good_agents': 1,
'num_inputs': 18,
'num_landmarks': 3,
'plot': True,
'plot_env': 'main',
'random': False,
'record_video': False,
'recurrent': False,
'rnn_type': 'MLP',
'save': 'model_1g_1pro',
'save_every': 10,
'seed': 128,
'share_weights': False,
'silent': True,
'tau': 1.0,
'value_coeff': 0.01,
'video_name': ''}
Epoch 1 Reward [-1600.6 -1600.6 -1600.6] Time 10.67s
Steps-taken: 100.00
Epoch 2 Reward [-1612.14 -1612.14 -1612.14] Time 10.66s
Steps-taken: 100.00
Epoch 3 Reward [-1221.26 -1221.26 -1221.26] Time 10.59s
Steps-taken: 100.00
Epoch 4 Reward [-1060.89 -1060.89 -1060.89] Time 10.51s
Steps-taken: 100.00
Epoch 5 Reward [-979.58 -979.58 -979.58] Time 10.72s
Steps-taken: 100.00
Epoch 6 Reward [-1065.03 -1065.03 -1065.03] Time 10.68s
Steps-taken: 100.00
Epoch 7 Reward [-955.37 -955.37 -955.37] Time 10.47s
Steps-taken: 100.00
Epoch 8 Reward [-1036.86 -1036.86 -1036.86] Time 10.45s
Steps-taken: 100.00
Epoch 9 Reward [-1145.26 -1145.26 -1145.26] Time 10.50s
Steps-taken: 100.00
Epoch 10 Reward [-1058.32 -1058.32 -1058.32] Time 10.49s
Steps-taken: 100.00
Epoch 11 Reward [-970.73 -970.73 -970.73] Time 10.54s
Steps-taken: 100.00
Epoch 12 Reward [-885.42 -885.42 -885.42] Time 10.53s
Steps-taken: 100.00
Epoch 13 Reward [-949.6 -949.6 -949.6] Time 10.53s
Steps-taken: 100.00
Epoch 14 Reward [-1016.4 -1016.4 -1016.4] Time 10.53s
Steps-taken: 100.00
Epoch 15 Reward [-871.6 -871.6 -871.6] Time 10.42s
Steps-taken: 100.00
Epoch 16 Reward [-881.55 -881.55 -881.55] Time 10.39s
Steps-taken: 100.00
Epoch 17 Reward [-924.96 -924.96 -924.96] Time 10.54s
Steps-taken: 100.00
Epoch 18 Reward [-989.98 -989.98 -989.98] Time 10.38s
Steps-taken: 100.00
Epoch 19 Reward [-1166.39 -1166.39 -1166.39] Time 10.53s
Steps-taken: 100.00
Epoch 20 Reward [-1399.64 -1399.64 -1399.64] Time 10.50s
Steps-taken: 100.00
Epoch 21 Reward [-1600.1 -1600.1 -1600.1] Time 10.62s
Steps-taken: 100.00
Epoch 22 Reward [-1538.72 -1538.72 -1538.72] Time 10.61s
Steps-taken: 100.00
Epoch 23 Reward [-1146.44 -1146.44 -1146.44] Time 10.53s
Steps-taken: 100.00
Epoch 24 Reward [-1093.18 -1093.18 -1093.18] Time 10.59s
Steps-taken: 100.00
Epoch 25 Reward [-1154.88 -1154.88 -1154.88] Time 10.53s
Steps-taken: 100.00
Epoch 26 Reward [-1150.45 -1150.45 -1150.45] Time 10.48s
Steps-taken: 100.00
Epoch 27 Reward [-1154.29 -1154.29 -1154.29] Time 10.29s
Steps-taken: 100.00
Epoch 28 Reward [-1147. -1147. -1147.] Time 10.49s
Steps-taken: 100.00
Epoch 29 Reward [-1153.57 -1153.57 -1153.57] Time 10.53s
Steps-taken: 100.00
Epoch 30 Reward [-1165.84 -1165.84 -1165.84] Time 10.46s
Steps-taken: 100.00
Epoch 31 Reward [-1307.84 -1307.84 -1307.84] Time 10.51s
Steps-taken: 100.00
Epoch 32 Reward [-1143. -1143. -1143.] Time 10.43s
Steps-taken: 100.00
Epoch 33 Reward [-1107.91 -1107.91 -1107.91] Time 10.42s
Steps-taken: 100.00
Epoch 34 Reward [-1165.31 -1165.31 -1165.31] Time 10.50s
Steps-taken: 100.00
Epoch 35 Reward [-1038.09 -1038.09 -1038.09] Time 10.51s
Steps-taken: 100.00
Epoch 36 Reward [-941.56 -941.56 -941.56] Time 10.53s
Steps-taken: 100.00
Epoch 37 Reward [-1004.49 -1004.49 -1004.49] Time 10.49s
Steps-taken: 100.00
Epoch 38 Reward [-1000.92 -1000.92 -1000.92] Time 10.37s
Steps-taken: 100.00
Epoch 39 Reward [-1069.01 -1069.01 -1069.01] Time 10.41s
Steps-taken: 100.00
Epoch 40 Reward [-932.43 -932.43 -932.43] Time 10.44s
Steps-taken: 100.00
Epoch 41 Reward [-1142.06 -1142.06 -1142.06] Time 10.48s
Steps-taken: 100.00
Epoch 42 Reward [-1134.19 -1134.19 -1134.19] Time 10.45s
Steps-taken: 100.00
Epoch 43 Reward [-1048.11 -1048.11 -1048.11] Time 10.20s
Steps-taken: 100.00
Epoch 44 Reward [-1279.76 -1279.76 -1279.76] Time 10.36s
Steps-taken: 100.00
Epoch 45 Reward [-1187.71 -1187.71 -1187.71] Time 10.43s
Steps-taken: 100.00
Epoch 46 Reward [-1123.9 -1123.9 -1123.9] Time 10.49s
Steps-taken: 100.00
Epoch 47 Reward [-1189.25 -1189.25 -1189.25] Time 10.46s
Steps-taken: 100.00
Epoch 48 Reward [-1225.61 -1225.61 -1225.61] Time 10.46s
Steps-taken: 100.00
Epoch 49 Reward [-1128.41 -1128.41 -1128.41] Time 10.26s
Steps-taken: 100.00
Epoch 50 Reward [-1149.76 -1149.76 -1149.76] Time 10.32s
Steps-taken: 100.00
Epoch 51 Reward [-1136.6 -1136.6 -1136.6] Time 10.44s
Steps-taken: 100.00
Epoch 52 Reward [-1176.42 -1176.42 -1176.42] Time 10.44s
Steps-taken: 100.00
Epoch 53 Reward [-1064.69 -1064.69 -1064.69] Time 10.33s
Steps-taken: 100.00
Epoch 54 Reward [-1131.38 -1131.38 -1131.38] Time 10.37s
Steps-taken: 100.00
Epoch 55 Reward [-1074.97 -1074.97 -1074.97] Time 10.33s
Steps-taken: 100.00
Epoch 56 Reward [-1101.46 -1101.46 -1101.46] Time 10.44s
Steps-taken: 100.00
Epoch 57 Reward [-1018.29 -1018.29 -1018.29] Time 10.49s
Steps-taken: 100.00
Epoch 58 Reward [-1070.36 -1070.36 -1070.36] Time 10.39s
Steps-taken: 100.00
Epoch 59 Reward [-1047.47 -1047.47 -1047.47] Time 10.40s
Steps-taken: 100.00
Epoch 60 Reward [-1184.62 -1184.62 -1184.62] Time 10.35s
Steps-taken: 100.00
Epoch 61 Reward [-1188.86 -1188.86 -1188.86] Time 10.39s
Steps-taken: 100.00
Epoch 62 Reward [-1093.89 -1093.89 -1093.89] Time 10.21s
Steps-taken: 100.00
Epoch 63 Reward [-1061.24 -1061.24 -1061.24] Time 10.33s
Steps-taken: 100.00
Epoch 64 Reward [-1129.06 -1129.06 -1129.06] Time 10.46s
Steps-taken: 100.00
Epoch 65 Reward [-1144.77 -1144.77 -1144.77] Time 10.43s
Steps-taken: 100.00
Epoch 66 Reward [-1204.27 -1204.27 -1204.27] Time 10.46s
Steps-taken: 100.00
Epoch 67 Reward [-1073.75 -1073.75 -1073.75] Time 10.40s
Steps-taken: 100.00
Epoch 68 Reward [-1149.63 -1149.63 -1149.63] Time 10.40s
Steps-taken: 100.00
Epoch 69 Reward [-1173.04 -1173.04 -1173.04] Time 10.34s
Steps-taken: 100.00
Epoch 70 Reward [-1090.59 -1090.59 -1090.59] Time 10.40s
Steps-taken: 100.00
Epoch 71 Reward [-990.52 -990.52 -990.52] Time 10.39s
Steps-taken: 100.00
Epoch 72 Reward [-993.88 -993.88 -993.88] Time 10.43s
Steps-taken: 100.00
Epoch 73 Reward [-1062. -1062. -1062.] Time 10.35s
Steps-taken: 100.00
Epoch 74 Reward [-1041.32 -1041.32 -1041.32] Time 10.35s
Steps-taken: 100.00
Epoch 75 Reward [-1111.98 -1111.98 -1111.98] Time 10.38s
Steps-taken: 100.00
Epoch 76 Reward [-1132.98 -1132.98 -1132.98] Time 10.42s
Steps-taken: 100.00
Epoch 77 Reward [-998.1 -998.1 -998.1] Time 10.45s
Steps-taken: 100.00
Epoch 78 Reward [-1095.87 -1095.87 -1095.87] Time 10.47s
Steps-taken: 100.00
Epoch 79 Reward [-1063.49 -1063.49 -1063.49] Time 10.41s
Steps-taken: 100.00
Epoch 80 Reward [-1056.29 -1056.29 -1056.29] Time 10.50s
Steps-taken: 100.00
Epoch 81 Reward [-1124.03 -1124.03 -1124.03] Time 10.45s
Steps-taken: 100.00
Epoch 82 Reward [-1120.97 -1120.97 -1120.97] Time 10.22s
Steps-taken: 100.00
Epoch 83 Reward [-982.07 -982.07 -982.07] Time 10.27s
Steps-taken: 100.00
Epoch 84 Reward [-1031.3 -1031.3 -1031.3] Time 10.24s
Steps-taken: 100.00
Epoch 85 Reward [-1001.12 -1001.12 -1001.12] Time 10.10s
Steps-taken: 100.00
Epoch 86 Reward [-1001.48 -1001.48 -1001.48] Time 10.34s
Steps-taken: 100.00
Epoch 87 Reward [-1000.13 -1000.13 -1000.13] Time 10.15s
Steps-taken: 100.00
Epoch 88 Reward [-1001.71 -1001.71 -1001.71] Time 10.43s
Steps-taken: 100.00
Epoch 89 Reward [-961.57 -961.57 -961.57] Time 10.42s
Steps-taken: 100.00
Epoch 90 Reward [-994.75 -994.75 -994.75] Time 10.25s
Steps-taken: 100.00
Epoch 91 Reward [-940.77 -940.77 -940.77] Time 10.52s
Steps-taken: 100.00
Epoch 92 Reward [-1022.29 -1022.29 -1022.29] Time 10.58s
Steps-taken: 100.00
Epoch 93 Reward [-1048.88 -1048.88 -1048.88] Time 10.30s
Steps-taken: 100.00
Epoch 94 Reward [-983.54 -983.54 -983.54] Time 10.36s
Steps-taken: 100.00
Epoch 95 Reward [-983.65 -983.65 -983.65] Time 10.34s
Steps-taken: 100.00
Epoch 96 Reward [-1053.45 -1053.45 -1053.45] Time 10.50s
Steps-taken: 100.00
Epoch 97 Reward [-1041.17 -1041.17 -1041.17] Time 10.34s
Steps-taken: 100.00
Epoch 98 Reward [-1011.02 -1011.02 -1011.02] Time 10.25s
Steps-taken: 100.00
Epoch 99 Reward [-1063.39 -1063.39 -1063.39] Time 10.36s
Steps-taken: 100.00
Epoch 100 Reward [-954.52 -954.52 -954.52] Time 10.22s
Steps-taken: 100.00
Epoch 101 Reward [-1042.91 -1042.91 -1042.91] Time 10.22s
Steps-taken: 100.00
Epoch 102 Reward [-1162.28 -1162.28 -1162.28] Time 10.36s
Steps-taken: 100.00
Epoch 103 Reward [-1084.97 -1084.97 -1084.97] Time 10.37s
Steps-taken: 100.00
Epoch 104 Reward [-952.02 -952.02 -952.02] Time 10.20s
Steps-taken: 100.00
Epoch 105 Reward [-1002.28 -1002.28 -1002.28] Time 10.27s
Steps-taken: 100.00
Epoch 106 Reward [-938.66 -938.66 -938.66] Time 10.47s
Steps-taken: 100.00
Epoch 107 Reward [-948.71 -948.71 -948.71] Time 10.32s
Steps-taken: 100.00
Epoch 108 Reward [-947.75 -947.75 -947.75] Time 10.36s
Steps-taken: 100.00
Epoch 109 Reward [-978.61 -978.61 -978.61] Time 10.40s
Steps-taken: 100.00
Epoch 110 Reward [-980.95 -980.95 -980.95] Time 10.22s
Steps-taken: 100.00
Epoch 111 Reward [-1039.04 -1039.04 -1039.04] Time 10.13s
Steps-taken: 100.00
Epoch 112 Reward [-1288.38 -1288.38 -1288.38] Time 10.25s
Steps-taken: 100.00
Epoch 113 Reward [-1348.76 -1348.76 -1348.76] Time 10.20s
Steps-taken: 100.00
Epoch 114 Reward [-1030.13 -1030.13 -1030.13] Time 10.30s
Steps-taken: 100.00
Epoch 115 Reward [-1081.73 -1081.73 -1081.73] Time 10.28s
Steps-taken: 100.00
Epoch 116 Reward [-1045.76 -1045.76 -1045.76] Time 10.34s
Steps-taken: 100.00
Epoch 117 Reward [-1023.77 -1023.77 -1023.77] Time 10.32s
Steps-taken: 100.00
Epoch 118 Reward [-1027.91 -1027.91 -1027.91] Time 10.18s
Steps-taken: 100.00
Epoch 119 Reward [-1001.31 -1001.31 -1001.31] Time 10.39s
Steps-taken: 100.00
Epoch 120 Reward [-1198.32 -1198.32 -1198.32] Time 10.25s
Steps-taken: 100.00
Epoch 121 Reward [-1105.15 -1105.15 -1105.15] Time 10.22s
Steps-taken: 100.00
Epoch 122 Reward [-1052.25 -1052.25 -1052.25] Time 10.14s
Steps-taken: 100.00
Epoch 123 Reward [-1035.71 -1035.71 -1035.71] Time 10.26s
Steps-taken: 100.00
Epoch 124 Reward [-1058.65 -1058.65 -1058.65] Time 10.20s
Steps-taken: 100.00
Epoch 125 Reward [-1051.43 -1051.43 -1051.43] Time 10.29s
Steps-taken: 100.00
Epoch 126 Reward [-1001.02 -1001.02 -1001.02] Time 10.50s
Steps-taken: 100.00
Epoch 127 Reward [-1075.91 -1075.91 -1075.91] Time 10.52s
Steps-taken: 100.00
Epoch 128 Reward [-996.04 -996.04 -996.04] Time 10.46s
Steps-taken: 100.00
Epoch 129 Reward [-1077.95 -1077.95 -1077.95] Time 10.19s
Steps-taken: 100.00
Epoch 130 Reward [-991.77 -991.77 -991.77] Time 10.34s
Steps-taken: 100.00
Epoch 131 Reward [-977.73 -977.73 -977.73] Time 10.43s
Steps-taken: 100.00
Epoch 132 Reward [-999.39 -999.39 -999.39] Time 10.28s
Steps-taken: 100.00
Epoch 133 Reward [-1031.78 -1031.78 -1031.78] Time 10.40s
Steps-taken: 100.00
Epoch 134 Reward [-951.36 -951.36 -951.36] Time 10.61s
Steps-taken: 100.00
Epoch 135 Reward [-983.11 -983.11 -983.11] Time 10.55s
Steps-taken: 100.00
Epoch 136 Reward [-956.22 -956.22 -956.22] Time 10.52s
Steps-taken: 100.00
Epoch 137 Reward [-946.17 -946.17 -946.17] Time 10.32s
Steps-taken: 100.00
Epoch 138 Reward [-940.72 -940.72 -940.72] Time 10.78s
Steps-taken: 100.00
Epoch 139 Reward [-869.61 -869.61 -869.61] Time 10.16s
Steps-taken: 100.00
Epoch 140 Reward [-846.09 -846.09 -846.09] Time 10.23s
Steps-taken: 100.00
Epoch 141 Reward [-847.4 -847.4 -847.4] Time 10.26s
Steps-taken: 100.00
Epoch 142 Reward [-883.37 -883.37 -883.37] Time 10.17s
Steps-taken: 100.00
Epoch 143 Reward [-879.54 -879.54 -879.54] Time 10.27s
Steps-taken: 100.00
Epoch 144 Reward [-906.83 -906.83 -906.83] Time 10.23s
Steps-taken: 100.00
Epoch 145 Reward [-847.91 -847.91 -847.91] Time 10.36s
Steps-taken: 100.00
Epoch 146 Reward [-829.77 -829.77 -829.77] Time 10.13s
Steps-taken: 100.00
Epoch 147 Reward [-867.39 -867.39 -867.39] Time 10.20s
Steps-taken: 100.00
Epoch 148 Reward [-904.9 -904.9 -904.9] Time 10.18s
Steps-taken: 100.00
Epoch 149 Reward [-912.71 -912.71 -912.71] Time 10.41s
Steps-taken: 100.00
Epoch 150 Reward [-851.24 -851.24 -851.24] Time 10.26s
Steps-taken: 100.00
Epoch 151 Reward [-892.98 -892.98 -892.98] Time 10.18s
Steps-taken: 100.00
Epoch 152 Reward [-872.94 -872.94 -872.94] Time 10.36s
Steps-taken: 100.00
Epoch 153 Reward [-933.58 -933.58 -933.58] Time 10.53s
Steps-taken: 100.00
Epoch 154 Reward [-842.14 -842.14 -842.14] Time 10.33s
Steps-taken: 100.00
Epoch 155 Reward [-888.7 -888.7 -888.7] Time 10.19s
Steps-taken: 100.00
Epoch 156 Reward [-871.97 -871.97 -871.97] Time 10.20s
Steps-taken: 100.00
Epoch 157 Reward [-821.87 -821.87 -821.87] Time 10.22s
Steps-taken: 100.00
Epoch 158 Reward [-894.76 -894.76 -894.76] Time 10.47s
Steps-taken: 100.00
Epoch 159 Reward [-839.84 -839.84 -839.84] Time 10.18s
Steps-taken: 100.00
Epoch 160 Reward [-883.73 -883.73 -883.73] Time 10.27s
Steps-taken: 100.00
Epoch 161 Reward [-843.86 -843.86 -843.86] Time 10.36s
Steps-taken: 100.00
Epoch 162 Reward [-817.93 -817.93 -817.93] Time 10.27s
Steps-taken: 100.00
Epoch 163 Reward [-831.78 -831.78 -831.78] Time 10.31s
Steps-taken: 100.00
Epoch 164 Reward [-842.27 -842.27 -842.27] Time 10.18s
Steps-taken: 100.00
Epoch 165 Reward [-864.85 -864.85 -864.85] Time 10.19s
Steps-taken: 100.00
Epoch 166 Reward [-830.9 -830.9 -830.9] Time 10.13s
Steps-taken: 100.00
Epoch 167 Reward [-805.06 -805.06 -805.06] Time 10.25s
Steps-taken: 100.00
Epoch 168 Reward [-824.36 -824.36 -824.36] Time 10.14s
Steps-taken: 100.00
Epoch 169 Reward [-874.01 -874.01 -874.01] Time 10.24s
Steps-taken: 100.00
Epoch 170 Reward [-1017.25 -1017.25 -1017.25] Time 10.12s
Steps-taken: 100.00
Epoch 171 Reward [-991.81 -991.81 -991.81] Time 10.20s
Steps-taken: 100.00
Epoch 172 Reward [-854.25 -854.25 -854.25] Time 10.24s
Steps-taken: 100.00
Epoch 173 Reward [-883.1 -883.1 -883.1] Time 10.14s
Steps-taken: 100.00
Epoch 174 Reward [-803.4 -803.4 -803.4] Time 10.28s
Steps-taken: 100.00
Epoch 175 Reward [-847.59 -847.59 -847.59] Time 10.27s
Steps-taken: 100.00
Epoch 176 Reward [-775.3 -775.3 -775.3] Time 10.47s
Steps-taken: 100.00
Epoch 177 Reward [-833. -833. -833.] Time 10.46s
Steps-taken: 100.00
Epoch 178 Reward [-815.39 -815.39 -815.39] Time 10.50s
Steps-taken: 100.00
Epoch 179 Reward [-857.7 -857.7 -857.7] Time 10.49s
Steps-taken: 100.00
Epoch 180 Reward [-854.45 -854.45 -854.45] Time 10.35s
Steps-taken: 100.00
Epoch 181 Reward [-827.52 -827.52 -827.52] Time 10.31s
Steps-taken: 100.00
Epoch 182 Reward [-869.71 -869.71 -869.71] Time 10.42s
Steps-taken: 100.00
Epoch 183 Reward [-861.66 -861.66 -861.66] Time 10.49s
Steps-taken: 100.00
Epoch 184 Reward [-840.99 -840.99 -840.99] Time 11.09s
Steps-taken: 100.00
Epoch 185 Reward [-893.4 -893.4 -893.4] Time 11.36s
Steps-taken: 100.00
Epoch 186 Reward [-892.3 -892.3 -892.3] Time 11.31s
Steps-taken: 100.00
Epoch 187 Reward [-847.26 -847.26 -847.26] Time 11.19s
Steps-taken: 100.00
Epoch 188 Reward [-856.91 -856.91 -856.91] Time 10.53s
Steps-taken: 100.00
Epoch 189 Reward [-910.85 -910.85 -910.85] Time 10.47s
Steps-taken: 100.00
Epoch 190 Reward [-828.06 -828.06 -828.06] Time 10.50s
Steps-taken: 100.00
Epoch 191 Reward [-873.7 -873.7 -873.7] Time 10.63s
Steps-taken: 100.00
Epoch 192 Reward [-885.76 -885.76 -885.76] Time 10.53s
Steps-taken: 100.00
Epoch 193 Reward [-893. -893. -893.] Time 10.39s
Steps-taken: 100.00
Epoch 194 Reward [-835.27 -835.27 -835.27] Time 10.45s
Steps-taken: 100.00
Epoch 195 Reward [-845.39 -845.39 -845.39] Time 10.47s
Steps-taken: 100.00
Epoch 196 Reward [-858.31 -858.31 -858.31] Time 10.56s
Steps-taken: 100.00
Epoch 197 Reward [-840. -840. -840.] Time 10.58s
Steps-taken: 100.00
Epoch 198 Reward [-846. -846. -846.] Time 10.49s
Steps-taken: 100.00
Epoch 199 Reward [-850.42 -850.42 -850.42] Time 10.36s
Steps-taken: 100.00
Epoch 200 Reward [-847.82 -847.82 -847.82] Time 10.55s
Steps-taken: 100.00
Epoch 201 Reward [-885.95 -885.95 -885.95] Time 10.50s
Steps-taken: 100.00
Epoch 202 Reward [-841.78 -841.78 -841.78] Time 10.35s
Steps-taken: 100.00
Epoch 203 Reward [-816.29 -816.29 -816.29] Time 10.55s
Steps-taken: 100.00
Epoch 204 Reward [-872.41 -872.41 -872.41] Time 10.44s
Steps-taken: 100.00
Epoch 205 Reward [-831.9 -831.9 -831.9] Time 10.32s
Steps-taken: 100.00
Epoch 206 Reward [-897.31 -897.31 -897.31] Time 10.38s
Steps-taken: 100.00
Epoch 207 Reward [-939.79 -939.79 -939.79] Time 10.46s
Steps-taken: 100.00
Epoch 208 Reward [-901.65 -901.65 -901.65] Time 10.67s
Steps-taken: 100.00
Epoch 209 Reward [-868.98 -868.98 -868.98] Time 10.68s
Steps-taken: 100.00
Epoch 210 Reward [-829.47 -829.47 -829.47] Time 10.61s
Steps-taken: 100.00
Epoch 211 Reward [-803.12 -803.12 -803.12] Time 10.65s
Steps-taken: 100.00
Epoch 212 Reward [-806.7 -806.7 -806.7] Time 10.45s
Steps-taken: 100.00
Epoch 213 Reward [-761.64 -761.64 -761.64] Time 10.49s
Steps-taken: 100.00
Epoch 214 Reward [-793.35 -793.35 -793.35] Time 10.70s
Steps-taken: 100.00
Epoch 215 Reward [-829.59 -829.59 -829.59] Time 10.60s
Steps-taken: 100.00
Epoch 216 Reward [-831.05 -831.05 -831.05] Time 10.71s
Steps-taken: 100.00
Epoch 217 Reward [-807.39 -807.39 -807.39] Time 10.76s
Steps-taken: 100.00
Epoch 218 Reward [-842.33 -842.33 -842.33] Time 10.69s
Steps-taken: 100.00
Epoch 219 Reward [-815.9 -815.9 -815.9] Time 10.58s
Steps-taken: 100.00
Epoch 220 Reward [-845.64 -845.64 -845.64] Time 10.51s
Steps-taken: 100.00
Epoch 221 Reward [-807.25 -807.25 -807.25] Time 10.38s
Steps-taken: 100.00
Epoch 222 Reward [-796.47 -796.47 -796.47] Time 10.54s
Steps-taken: 100.00
Epoch 223 Reward [-829.94 -829.94 -829.94] Time 10.58s
Steps-taken: 100.00
Epoch 224 Reward [-770.33 -770.33 -770.33] Time 10.37s
Steps-taken: 100.00
Epoch 225 Reward [-811.77 -811.77 -811.77] Time 10.42s
Steps-taken: 100.00
Epoch 226 Reward [-845.73 -845.73 -845.73] Time 10.65s
Steps-taken: 100.00
Epoch 227 Reward [-794.91 -794.91 -794.91] Time 10.59s
Steps-taken: 100.00
Epoch 228 Reward [-845.56 -845.56 -845.56] Time 10.56s
Steps-taken: 100.00
Epoch 229 Reward [-904.09 -904.09 -904.09] Time 10.49s
Steps-taken: 100.00
Epoch 230 Reward [-900.48 -900.48 -900.48] Time 10.43s
Steps-taken: 100.00
Epoch 231 Reward [-841.79 -841.79 -841.79] Time 10.66s
Steps-taken: 100.00
Epoch 232 Reward [-808.48 -808.48 -808.48] Time 10.56s
Steps-taken: 100.00
Epoch 233 Reward [-833.49 -833.49 -833.49] Time 10.61s
Steps-taken: 100.00
Epoch 234 Reward [-777.12 -777.12 -777.12] Time 10.80s
Steps-taken: 100.00
Epoch 235 Reward [-868.05 -868.05 -868.05] Time 10.54s
Steps-taken: 100.00
Epoch 236 Reward [-775.4 -775.4 -775.4] Time 10.40s
Steps-taken: 100.00
Epoch 237 Reward [-825.34 -825.34 -825.34] Time 10.47s
Steps-taken: 100.00
Epoch 238 Reward [-811.51 -811.51 -811.51] Time 10.54s
Steps-taken: 100.00
Epoch 239 Reward [-889.49 -889.49 -889.49] Time 10.38s
Steps-taken: 100.00
Epoch 240 Reward [-781.45 -781.45 -781.45] Time 10.26s
Steps-taken: 100.00
Epoch 241 Reward [-862.75 -862.75 -862.75] Time 10.17s
Steps-taken: 100.00
Epoch 242 Reward [-798.64 -798.64 -798.64] Time 10.26s
Steps-taken: 100.00
Epoch 243 Reward [-837.68 -837.68 -837.68] Time 10.26s
Steps-taken: 100.00
Epoch 244 Reward [-812.29 -812.29 -812.29] Time 10.32s
Steps-taken: 100.00
Epoch 245 Reward [-850.04 -850.04 -850.04] Time 10.33s
Steps-taken: 100.00
Epoch 246 Reward [-876.59 -876.59 -876.59] Time 10.41s
Steps-taken: 100.00
Epoch 247 Reward [-819.65 -819.65 -819.65] Time 10.51s
Steps-taken: 100.00
Epoch 248 Reward [-848.87 -848.87 -848.87] Time 10.63s
Steps-taken: 100.00
Epoch 249 Reward [-855.57 -855.57 -855.57] Time 10.44s
Steps-taken: 100.00
Epoch 250 Reward [-813.7 -813.7 -813.7] Time 10.52s
Steps-taken: 100.00
Epoch 251 Reward [-807.77 -807.77 -807.77] Time 10.56s
Steps-taken: 100.00
Epoch 252 Reward [-814.83 -814.83 -814.83] Time 10.70s
Steps-taken: 100.00
Epoch 253 Reward [-900.6 -900.6 -900.6] Time 10.50s
Steps-taken: 100.00
Epoch 254 Reward [-809.38 -809.38 -809.38] Time 10.48s
Steps-taken: 100.00
Epoch 255 Reward [-780.97 -780.97 -780.97] Time 10.26s
Steps-taken: 100.00
Epoch 256 Reward [-796.96 -796.96 -796.96] Time 10.25s
Steps-taken: 100.00
Epoch 257 Reward [-796.46 -796.46 -796.46] Time 10.34s
Steps-taken: 100.00
Epoch 258 Reward [-829.68 -829.68 -829.68] Time 10.48s
Steps-taken: 100.00
Epoch 259 Reward [-878.11 -878.11 -878.11] Time 10.57s
Steps-taken: 100.00
Epoch 260 Reward [-854.68 -854.68 -854.68] Time 10.53s
Steps-taken: 100.00
Epoch 261 Reward [-858.35 -858.35 -858.35] Time 10.87s
Steps-taken: 100.00
Epoch 262 Reward [-792.16 -792.16 -792.16] Time 10.43s
Steps-taken: 100.00
Epoch 263 Reward [-821.87 -821.87 -821.87] Time 10.36s
Steps-taken: 100.00
Epoch 264 Reward [-825.1 -825.1 -825.1] Time 10.42s
Steps-taken: 100.00
Epoch 265 Reward [-810.05 -810.05 -810.05] Time 10.26s
Steps-taken: 100.00
Epoch 266 Reward [-835.76 -835.76 -835.76] Time 10.34s
Steps-taken: 100.00
Epoch 267 Reward [-745.59 -745.59 -745.59] Time 10.48s
Steps-taken: 100.00
Epoch 268 Reward [-839.36 -839.36 -839.36] Time 10.32s
Steps-taken: 100.00
Epoch 269 Reward [-816.26 -816.26 -816.26] Time 10.61s
Steps-taken: 100.00
Epoch 270 Reward [-899.16 -899.16 -899.16] Time 10.45s
Steps-taken: 100.00
Epoch 271 Reward [-847.2 -847.2 -847.2] Time 10.41s
Steps-taken: 100.00
Epoch 272 Reward [-843.78 -843.78 -843.78] Time 10.39s
Steps-taken: 100.00
Epoch 273 Reward [-781.59 -781.59 -781.59] Time 10.38s
Steps-taken: 100.00
Epoch 274 Reward [-896.97 -896.97 -896.97] Time 10.68s
Steps-taken: 100.00
Epoch 275 Reward [-847.72 -847.72 -847.72] Time 10.53s
Steps-taken: 100.00
Epoch 276 Reward [-864.15 -864.15 -864.15] Time 10.49s
Steps-taken: 100.00
Epoch 277 Reward [-820.55 -820.55 -820.55] Time 10.50s
Steps-taken: 100.00
Epoch 278 Reward [-820.26 -820.26 -820.26] Time 10.46s
Steps-taken: 100.00
Epoch 279 Reward [-845.92 -845.92 -845.92] Time 10.60s
Steps-taken: 100.00
Epoch 280 Reward [-794.45 -794.45 -794.45] Time 10.69s
Steps-taken: 100.00
Epoch 281 Reward [-818.15 -818.15 -818.15] Time 10.61s
Steps-taken: 100.00
Epoch 282 Reward [-869.26 -869.26 -869.26] Time 10.50s
Steps-taken: 100.00
Epoch 283 Reward [-814.26 -814.26 -814.26] Time 10.41s
Steps-taken: 100.00
Epoch 284 Reward [-790.62 -790.62 -790.62] Time 10.52s
Steps-taken: 100.00
Epoch 285 Reward [-861.09 -861.09 -861.09] Time 10.45s
Steps-taken: 100.00
Epoch 286 Reward [-826.99 -826.99 -826.99] Time 10.47s
Steps-taken: 100.00
Epoch 287 Reward [-935.9 -935.9 -935.9] Time 10.41s
Steps-taken: 100.00
Epoch 288 Reward [-937.04 -937.04 -937.04] Time 10.59s
Steps-taken: 100.00
Epoch 289 Reward [-1010.06 -1010.06 -1010.06] Time 10.50s
Steps-taken: 100.00
Epoch 290 Reward [-903.92 -903.92 -903.92] Time 10.36s
Steps-taken: 100.00
Epoch 291 Reward [-899.92 -899.92 -899.92] Time 10.20s
Steps-taken: 100.00
Epoch 292 Reward [-866.18 -866.18 -866.18] Time 10.27s
Steps-taken: 100.00
Epoch 293 Reward [-808.7 -808.7 -808.7] Time 10.56s
Steps-taken: 100.00
Epoch 294 Reward [-911.33 -911.33 -911.33] Time 10.41s
Steps-taken: 100.00
Epoch 295 Reward [-814.09 -814.09 -814.09] Time 10.52s
Steps-taken: 100.00
Epoch 296 Reward [-816.03 -816.03 -816.03] Time 10.50s
Steps-taken: 100.00
Epoch 297 Reward [-880.43 -880.43 -880.43] Time 10.33s
Steps-taken: 100.00
Epoch 298 Reward [-850.47 -850.47 -850.47] Time 10.60s
Steps-taken: 100.00
Epoch 299 Reward [-856.18 -856.18 -856.18] Time 10.25s
Steps-taken: 100.00
Epoch 300 Reward [-852.6 -852.6 -852.6] Time 10.43s
Steps-taken: 100.00
Epoch 301 Reward [-837.48 -837.48 -837.48] Time 10.43s
Steps-taken: 100.00
Epoch 302 Reward [-909.84 -909.84 -909.84] Time 10.34s
Steps-taken: 100.00
Epoch 303 Reward [-767.09 -767.09 -767.09] Time 10.46s
Steps-taken: 100.00
Epoch 304 Reward [-839.42 -839.42 -839.42] Time 10.51s
Steps-taken: 100.00
Epoch 305 Reward [-813.61 -813.61 -813.61] Time 10.41s
Steps-taken: 100.00
Epoch 306 Reward [-857.53 -857.53 -857.53] Time 10.31s
Steps-taken: 100.00
Epoch 307 Reward [-854.49 -854.49 -854.49] Time 10.28s
Steps-taken: 100.00
Epoch 308 Reward [-846.39 -846.39 -846.39] Time 10.26s
Steps-taken: 100.00
Epoch 309 Reward [-831.16 -831.16 -831.16] Time 10.28s
Steps-taken: 100.00
Epoch 310 Reward [-806.9 -806.9 -806.9] Time 10.45s
Steps-taken: 100.00
Epoch 311 Reward [-815.72 -815.72 -815.72] Time 10.25sSetting up a new session...
Setting up a new session...
'args'
{'action_scale': 1.0,
'advantages_per_action': False,
'adversary_accel': 3.0,
'adversary_max_speed': 1.0,
'adversary_size': 0.2,
'agent_size': 0.2,
'arena_size': 1.0,
'batch_size': 500,
'collaborative': True,
'comm_action_one': False,
'comm_init': 'uniform',
'comm_mask_zero': False,
'comm_mode': 'avg',
'comm_passes': 1,
'commnet': False,
'continuous': False,
'detach_gap': 10000,
'dim_actions': 1,
'display': True,
'entr': 0,
'env_name': 'simple_spread',
'epoch_size': 10,
'gamma': 1.0,
'good_accel': 1.0,
'good_max_speed': 0.5,
'good_size': 0.1,
'hard_attn': False,
'hid_size': 64,
'ic3net': False,
'landmark_size': 0.1,
'load': '',
'lrate': 0.001,
'max_steps': 100,
'mean_ratio': 1.0,
'naction_heads': [5],
'nactions': '1',
'nagents': 3,
'nfriendly': 3,
'normalize_rewards': False,
'nprocesses': 1,
'num_actions': [5],
'num_adversaries': 2,
'num_epochs': 1000,
'num_good_agents': 1,
'num_inputs': 18,
'num_landmarks': 3,
'plot': True,
'plot_env': '1pro_1000epoch',
'random': False,
'record_video': False,
'recurrent': False,
'rnn_type': 'MLP',
'save': 'model_1g_1pro',
'save_every': 10,
'seed': 210,
'share_weights': False,
'silent': True,
'tau': 1.0,
'value_coeff': 0.01,
'video_name': ''}
Epoch 1 Reward [-993.72 -993.72 -993.72] Time 11.02s
Steps-taken: 100.00
Epoch 2 Reward [-937.35 -937.35 -937.35] Time 10.58s
Steps-taken: 100.00
Epoch 3 Reward [-937.3 -937.3 -937.3] Time 10.72s
Steps-taken: 100.00
Epoch 4 Reward [-1005.1 -1005.1 -1005.1] Time 10.69s
Steps-taken: 100.00
Epoch 5 Reward [-1136.43 -1136.43 -1136.43] Time 10.65s
Steps-taken: 100.00
Epoch 6 Reward [-1345.63 -1345.63 -1345.63] Time 10.52s
Steps-taken: 100.00
Epoch 7 Reward [-1334.63 -1334.63 -1334.63] Time 10.74s
Steps-taken: 100.00
Epoch 8 Reward [-1431.3 -1431.3 -1431.3] Time 10.70s
Steps-taken: 100.00
Epoch 9 Reward [-1097.8 -1097.8 -1097.8] Time 10.54s
Steps-taken: 100.00
Epoch 10 Reward [-916.53 -916.53 -916.53] Time 10.54s
Steps-taken: 100.00
Epoch 11 Reward [-1001.31 -1001.31 -1001.31] Time 10.56s
Steps-taken: 100.00
Epoch 12 Reward [-895.57 -895.57 -895.57] Time 10.54s
Steps-taken: 100.00
Epoch 13 Reward [-966.27 -966.27 -966.27] Time 10.65s
Steps-taken: 100.00
Epoch 14 Reward [-1028.44 -1028.44 -1028.44] Time 10.62s
Steps-taken: 100.00
Epoch 15 Reward [-1093.66 -1093.66 -1093.66] Time 11.20s
Steps-taken: 100.00
Epoch 16 Reward [-1215.82 -1215.82 -1215.82] Time 10.58s
Steps-taken: 100.00
Epoch 17 Reward [-1047.41 -1047.41 -1047.41] Time 10.51s
Steps-taken: 100.00
Epoch 18 Reward [-1151.34 -1151.34 -1151.34] Time 10.71s
Steps-taken: 100.00
Epoch 19 Reward [-1138.43 -1138.43 -1138.43] Time 10.65s
Steps-taken: 100.00
Epoch 20 Reward [-1119.13 -1119.13 -1119.13] Time 10.67s
Steps-taken: 100.00
Epoch 21 Reward [-1189.5 -1189.5 -1189.5] Time 10.75s
Steps-taken: 100.00
Epoch 22 Reward [-1298.04 -1298.04 -1298.04] Time 10.46s
Steps-taken: 100.00
Epoch 23 Reward [-1310.51 -1310.51 -1310.51] Time 10.40s
Steps-taken: 100.00
Epoch 24 Reward [-1401.55 -1401.55 -1401.55] Time 10.75s
Steps-taken: 100.00
Epoch 25 Reward [-1210.56 -1210.56 -1210.56] Time 10.48s
Steps-taken: 100.00
Epoch 26 Reward [-1204.96 -1204.96 -1204.96] Time 10.56s
Steps-taken: 100.00
Epoch 27 Reward [-1302.23 -1302.23 -1302.23] Time 10.41s
Steps-taken: 100.00
Epoch 28 Reward [-1175.74 -1175.74 -1175.74] Time 10.69s
Steps-taken: 100.00
Epoch 29 Reward [-1061.83 -1061.83 -1061.83] Time 10.88s
Steps-taken: 100.00
Epoch 30 Reward [-1021.16 -1021.16 -1021.16] Time 10.49s
Steps-taken: 100.00
Epoch 31 Reward [-1054.17 -1054.17 -1054.17] Time 10.76s
Steps-taken: 100.00
Epoch 32 Reward [-1053.25 -1053.25 -1053.25] Time 10.71s
Steps-taken: 100.00
Epoch 33 Reward [-977.07 -977.07 -977.07] Time 10.73s
Steps-taken: 100.00
Epoch 34 Reward [-1001.15 -1001.15 -1001.15] Time 10.54s
Steps-taken: 100.00
Epoch 35 Reward [-953.42 -953.42 -953.42] Time 10.64s
Steps-taken: 100.00
Epoch 36 Reward [-953.18 -953.18 -953.18] Time 10.94s
Steps-taken: 100.00
Epoch 37 Reward [-979.02 -979.02 -979.02] Time 10.67s
Steps-taken: 100.00
Epoch 38 Reward [-935.91 -935.91 -935.91] Time 10.68s
Steps-taken: 100.00
Epoch 39 Reward [-1117.48 -1117.48 -1117.48] Time 10.56s
Steps-taken: 100.00
Epoch 40 Reward [-1163.9 -1163.9 -1163.9] Time 10.59s
Steps-taken: 100.00
Epoch 41 Reward [-991.65 -991.65 -991.65] Time 10.66s
Steps-taken: 100.00
Epoch 42 Reward [-1039.67 -1039.67 -1039.67] Time 10.83s
Steps-taken: 100.00
Epoch 43 Reward [-1143.46 -1143.46 -1143.46] Time 10.69s
Steps-taken: 100.00
Epoch 44 Reward [-1009.69 -1009.69 -1009.69] Time 10.65s
Steps-taken: 100.00
Epoch 45 Reward [-1020.24 -1020.24 -1020.24] Time 10.71s
Steps-taken: 100.00
Epoch 46 Reward [-923.97 -923.97 -923.97] Time 10.68s
Steps-taken: 100.00
Epoch 47 Reward [-913.14 -913.14 -913.14] Time 10.71s
Steps-taken: 100.00
Epoch 48 Reward [-886.49 -886.49 -886.49] Time 10.64s
Steps-taken: 100.00
Epoch 49 Reward [-919.46 -919.46 -919.46] Time 10.64s
Steps-taken: 100.00
Epoch 50 Reward [-925.76 -925.76 -925.76] Time 10.87s
Steps-taken: 100.00
Epoch 51 Reward [-952.74 -952.74 -952.74] Time 10.49s
Steps-taken: 100.00
Epoch 52 Reward [-947.26 -947.26 -947.26] Time 10.37s
Steps-taken: 100.00
Epoch 53 Reward [-924.48 -924.48 -924.48] Time 10.37s
Steps-taken: 100.00
Epoch 54 Reward [-913.27 -913.27 -913.27] Time 10.45s
Steps-taken: 100.00
Epoch 55 Reward [-998.99 -998.99 -998.99] Time 10.70s
Steps-taken: 100.00
Epoch 56 Reward [-1004.24 -1004.24 -1004.24] Time 10.63s
Steps-taken: 100.00
Epoch 57 Reward [-974.53 -974.53 -974.53] Time 10.65s
Steps-taken: 100.00
Epoch 58 Reward [-888.62 -888.62 -888.62] Time 10.64s
Steps-taken: 100.00
Epoch 59 Reward [-1009.46 -1009.46 -1009.46] Time 10.65s
Steps-taken: 100.00
Epoch 60 Reward [-986.13 -986.13 -986.13] Time 10.80s
Steps-taken: 100.00
Epoch 61 Reward [-988.81 -988.81 -988.81] Time 10.63s
Steps-taken: 100.00
Epoch 62 Reward [-1058.62 -1058.62 -1058.62] Time 10.36s
Steps-taken: 100.00
Epoch 63 Reward [-1054.79 -1054.79 -1054.79] Time 10.55s
Steps-taken: 100.00
Epoch 64 Reward [-1027.52 -1027.52 -1027.52] Time 10.67s
Steps-taken: 100.00
Epoch 65 Reward [-994.48 -994.48 -994.48] Time 10.66s
Steps-taken: 100.00
Epoch 66 Reward [-1106.74 -1106.74 -1106.74] Time 10.81s
Steps-taken: 100.00
Epoch 67 Reward [-1028.77 -1028.77 -1028.77] Time 10.73s
Steps-taken: 100.00
Epoch 68 Reward [-1041.59 -1041.59 -1041.59] Time 10.43s
Steps-taken: 100.00
Epoch 69 Reward [-1021.14 -1021.14 -1021.14] Time 10.65s
Steps-taken: 100.00
Epoch 70 Reward [-1176.77 -1176.77 -1176.77] Time 10.46s
Steps-taken: 100.00
Epoch 71 Reward [-1090.42 -1090.42 -1090.42] Time 10.65s
Steps-taken: 100.00
Epoch 72 Reward [-1053.52 -1053.52 -1053.52] Time 10.81s
Steps-taken: 100.00
Epoch 73 Reward [-1106.32 -1106.32 -1106.32] Time 10.55s
Steps-taken: 100.00
Epoch 74 Reward [-1092.61 -1092.61 -1092.61] Time 10.94s
Steps-taken: 100.00
Epoch 75 Reward [-1243.58 -1243.58 -1243.58] Time 10.43s
Steps-taken: 100.00
Epoch 76 Reward [-1211.03 -1211.03 -1211.03] Time 10.37s
Steps-taken: 100.00
Epoch 77 Reward [-1029.88 -1029.88 -1029.88] Time 10.63s
Steps-taken: 100.00
Epoch 78 Reward [-1271.87 -1271.87 -1271.87] Time 10.73s
Steps-taken: 100.00
Epoch 79 Reward [-1603.41 -1603.41 -1603.41] Time 10.72s
Steps-taken: 100.00
Epoch 80 Reward [-1096.26 -1096.26 -1096.26] Time 10.67s
Steps-taken: 100.00
Epoch 81 Reward [-1151.83 -1151.83 -1151.83] Time 10.77s
Steps-taken: 100.00
Epoch 82 Reward [-1055.93 -1055.93 -1055.93] Time 10.51s
Steps-taken: 100.00
Epoch 83 Reward [-1340.2 -1340.2 -1340.2] Time 10.69s
Steps-taken: 100.00
Epoch 84 Reward [-1208.33 -1208.33 -1208.33] Time 10.78s
Steps-taken: 100.00
Epoch 85 Reward [-1246.77 -1246.77 -1246.77] Time 10.88s
Steps-taken: 100.00
Epoch 86 Reward [-1174.42 -1174.42 -1174.42] Time 10.58s
Steps-taken: 100.00
Epoch 87 Reward [-1095.49 -1095.49 -1095.49] Time 10.57s
Steps-taken: 100.00
Epoch 88 Reward [-1317.44 -1317.44 -1317.44] Time 10.68s
Steps-taken: 100.00
Epoch 89 Reward [-1253.38 -1253.38 -1253.38] Time 10.53s
Steps-taken: 100.00
Epoch 90 Reward [-1342.61 -1342.61 -1342.61] Time 10.64s
Steps-taken: 100.00
Epoch 91 Reward [-1096.64 -1096.64 -1096.64] Time 10.59s
Steps-taken: 100.00
Epoch 92 Reward [-1103.03 -1103.03 -1103.03] Time 10.66s
Steps-taken: 100.00
Epoch 93 Reward [-1190.91 -1190.91 -1190.91] Time 10.72s
Steps-taken: 100.00
Epoch 94 Reward [-1123.51 -1123.51 -1123.51] Time 10.63s
Steps-taken: 100.00
Epoch 95 Reward [-1250.67 -1250.67 -1250.67] Time 10.83s
Steps-taken: 100.00
Epoch 96 Reward [-1113.49 -1113.49 -1113.49] Time 10.74s
Steps-taken: 100.00
Epoch 97 Reward [-1185.46 -1185.46 -1185.46] Time 10.71s