-
Notifications
You must be signed in to change notification settings - Fork 6
/
log_trainingTF.txt
5049 lines (4991 loc) · 674 KB
/
log_trainingTF.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
1
300000.0
3000
2000
1.0
Could not find old network weights
TORCS Experiment Start.
Client connected on 3101..............
Episode : 0 Replay Buffer 0 Early Stopping: 0 Epsilon: 1.0 RN: 0.772229770844
('Episode', 0, 'Step', 0.0, 'Epsilon', 0.9999966666666666, 'Action', array([-0.5624621 , 0.45097193, 0. ]), 'Reward', -0.34245577310677805)
('Episode', 0, 'Step', 15.0, 'Epsilon', 0.9999466666666663, 'Action', array([ 0.20791999, 0.61931145, 0. ]), 'Reward', 10.749295580669827)
('Episode', 0, 'Step', 30.0, 'Epsilon', 0.999896666666666, 'Action', array([-0.46012578, 0.46310849, 0. ]), 'Reward', 6.2791675916917704)
('Episode', 0, 'Step', 45.0, 'Epsilon', 0.9998466666666657, 'Action', array([-1. , 0.54244449, 0. ]), 'Reward', -0.082728247097042573)
('Episode', 0, 'Step', 60.0, 'Epsilon', 0.9997966666666653, 'Action', array([ 0.26809669, 0.43132394, 0. ]), 'Reward', -0.19302144361034376)
('Episode', 0, 'Step', 75.0, 'Epsilon', 0.999746666666665, 'Action', array([ 0.58787989, 0.44069114, 0. ]), 'Reward', -0.035544429728506174)
('Episode', 0, 'Step', 90.0, 'Epsilon', 0.9996966666666647, 'Action', array([-0.34228575, 0.35931889, 0. ]), 'Reward', -0.54289201117067332)
('Episode', 0, 'Step', 105.0, 'Epsilon', 0.9996466666666644, 'Action', array([-1. , 0.57549499, 0. ]), 'Reward', -0.033755519678698984)
('Episode', 0, 'Step', 120.0, 'Epsilon', 0.999596666666664, 'Action', array([-1. , 0.62288573, 0. ]), 'Reward', -0.17284202390201658)
('Episode', 0, 'Step', 135.0, 'Epsilon', 0.9995466666666637, 'Action', array([-0.04374852, 0.32962293, 0. ]), 'Reward', -0.23240977859757811)
('Episode', 0, 'Step', 150.0, 'Epsilon', 0.9994966666666634, 'Action', array([ 0.32974937, 0.60484057, 0. ]), 'Reward', 0.051766415445819107)
('Episode', 0, 'Step', 165.0, 'Epsilon', 0.999446666666663, 'Action', array([-1. , 0.53907129, 0. ]), 'Reward', 0.03095714953997937)
('Episode', 0, 'Step', 180.0, 'Epsilon', 0.9993966666666627, 'Action', array([-0.76370693, 0.53984672, 0. ]), 'Reward', -0.098771349234036687)
('Episode', 0, 'Step', 195.0, 'Epsilon', 0.9993466666666624, 'Action', array([-0.96256701, 0.30261547, 0. ]), 'Reward', -0.54187257479570339)
('Episode', 0, 'Step', 210.0, 'Epsilon', 0.9992966666666621, 'Action', array([ 0.27444017, 0.48237937, 0. ]), 'Reward', 0.084966314008119007)
('Episode', 0, 'Step', 225.0, 'Epsilon', 0.9992466666666617, 'Action', array([ 0.01716274, 0.59015284, 0. ]), 'Reward', 0.074912205263301293)
('Episode', 0, 'Step', 240.0, 'Epsilon', 0.9991966666666614, 'Action', array([-1. , 0.43251441, 0. ]), 'Reward', 0.03951678204610766)
('Episode', 0, 'Step', 255.0, 'Epsilon', 0.9991466666666611, 'Action', array([-1. , 0.47463879, 0. ]), 'Reward', -0.45852346455142484)
('Episode', 0, 'Step', 270.0, 'Epsilon', 0.9990966666666607, 'Action', array([-0.58538861, 0.5309624 , 0. ]), 'Reward', -0.79275557030011712)
('Episode', 0, 'Step', 285.0, 'Epsilon', 0.9990466666666604, 'Action', array([-0.15312688, 0.43877536, 0. ]), 'Reward', -0.18761894984335381)
('Episode', 0, 'Step', 300.0, 'Epsilon', 0.9989966666666601, 'Action', array([-1. , 0.52153474, 0. ]), 'Reward', 0.032463897523703586)
('Episode', 0, 'Step', 315.0, 'Epsilon', 0.9989466666666598, 'Action', array([-1. , 0.54403512, 0. ]), 'Reward', -0.22330936775625967)
('Episode', 0, 'Step', 330.0, 'Epsilon', 0.9988966666666594, 'Action', array([ 0.1394847 , 0.49839014, 0. ]), 'Reward', 0.10253171139387082)
('Episode', 0, 'Step', 345.0, 'Epsilon', 0.9988466666666591, 'Action', array([ 0.25417762, 0.35094765, 0. ]), 'Reward', -0.17352338730550207)
('Episode', 0, 'Step', 360.0, 'Epsilon', 0.9987966666666588, 'Action', array([ 0.10610524, 0.51608259, 0. ]), 'Reward', -0.0026818867718517254)
('Episode', 0, 'Step', 375.0, 'Epsilon', 0.9987466666666585, 'Action', array([-0.63995569, 0.65167646, 0. ]), 'Reward', -0.16066336291436312)
('Episode', 0, 'Step', 390.0, 'Epsilon', 0.9986966666666581, 'Action', array([ 0.25376746, 0.48936031, 0. ]), 'Reward', 0.052315451252796671)
('Episode', 0, 'Step', 405.0, 'Epsilon', 0.9986466666666578, 'Action', array([-0.83731403, 0.47431633, 0. ]), 'Reward', -0.34488382041994969)
('Episode', 0, 'Step', 420.0, 'Epsilon', 0.9985966666666575, 'Action', array([ 0.88652626, 0.57375119, 0. ]), 'Reward', -0.29861136081432726)
('Episode', 0, 'Step', 435.0, 'Epsilon', 0.9985466666666571, 'Action', array([ 0.43713416, 0.51640796, 0. ]), 'Reward', 0.09592956748572673)
('Episode', 0, 'Step', 450.0, 'Epsilon', 0.9984966666666568, 'Action', array([-0.29186073, 0.34708768, 0. ]), 'Reward', -0.26001478447737492)
('Episode', 0, 'Step', 465.0, 'Epsilon', 0.9984466666666565, 'Action', array([-0.37029844, 0.58680629, 0. ]), 'Reward', -0.38930432717961622)
('Episode', 0, 'Step', 480.0, 'Epsilon', 0.9983966666666562, 'Action', array([-1. , 0.47851168, 0. ]), 'Reward', -0.27616275241873611)
('Episode', 0, 'Step', 495.0, 'Epsilon', 0.9983466666666558, 'Action', array([ 0.50654823, 0.54823121, 0. ]), 'Reward', -0.06803467566478516)
('Episode', 0, 'Step', 510.0, 'Epsilon', 0.9982966666666555, 'Action', array([ 0.73734036, 0.48799521, 0. ]), 'Reward', -0.11222911433304658)
('Episode', 0, 'Step', 525.0, 'Epsilon', 0.9982466666666552, 'Action', array([-0.26488633, 0.64473459, 0. ]), 'Reward', -0.50353633552703037)
('Episode', 0, 'Step', 540.0, 'Epsilon', 0.9981966666666549, 'Action', array([ 0.17044941, 0.45868447, 0. ]), 'Reward', 0.063036710038664484)
('Episode', 0, 'Step', 555.0, 'Epsilon', 0.9981466666666545, 'Action', array([-0.83703567, 0.3925826 , 0. ]), 'Reward', -0.18807028523482899)
('Episode', 0, 'Step', 570.0, 'Epsilon', 0.9980966666666542, 'Action', array([ 0.46105019, 0.51293503, 0. ]), 'Reward', -0.21327089512722108)
('Episode', 0, 'Step', 585.0, 'Epsilon', 0.9980466666666539, 'Action', array([-0.71280883, 0.51870952, 0. ]), 'Reward', -0.34615956774666112)
('Episode', 0, 'Step', 600.0, 'Epsilon', 0.9979966666666535, 'Action', array([-0.76740525, 0.45831946, 0. ]), 'Reward', 0.094491179998156663)
('Episode', 0, 'Step', 615.0, 'Epsilon', 0.9979466666666532, 'Action', array([ 0.99600918, 0.59269864, 0. ]), 'Reward', 0.025913044405273328)
('Episode', 0, 'Step', 630.0, 'Epsilon', 0.9978966666666529, 'Action', array([ 0.13222994, 0.43004592, 0. ]), 'Reward', -0.13257093775481699)
('Episode', 0, 'Step', 645.0, 'Epsilon', 0.9978466666666526, 'Action', array([-1. , 0.59738634, 0. ]), 'Reward', -0.75300295543326756)
('Episode', 0, 'Step', 660.0, 'Epsilon', 0.9977966666666522, 'Action', array([ 0.18187649, 0.5342947 , 0. ]), 'Reward', 0.0012997852889159837)
('Episode', 0, 'Step', 675.0, 'Epsilon', 0.9977466666666519, 'Action', array([-0.69387115, 0.62392103, 0. ]), 'Reward', 0.091928002737458825)
('Episode', 0, 'Step', 690.0, 'Epsilon', 0.9976966666666516, 'Action', array([ 0.026205 , 0.41971032, 0. ]), 'Reward', -0.3869187683982695)
('Episode', 0, 'Step', 705.0, 'Epsilon', 0.9976466666666512, 'Action', array([-1. , 0.43550203, 0. ]), 'Reward', 0.23515341710422663)
('Episode', 0, 'Step', 720.0, 'Epsilon', 0.9975966666666509, 'Action', array([-0.16517503, 0.55796824, 0. ]), 'Reward', 0.14046812236048783)
('Episode', 0, 'Step', 735.0, 'Epsilon', 0.9975466666666506, 'Action', array([ 0.09094228, 0.45769839, 0. ]), 'Reward', 0.041353810636969288)
('Episode', 0, 'Step', 750.0, 'Epsilon', 0.9974966666666503, 'Action', array([-0.21117203, 0.3365381 , 0. ]), 'Reward', -0.54808220605632729)
('Episode', 0, 'Step', 765.0, 'Epsilon', 0.9974466666666499, 'Action', array([-0.3536861 , 0.44413628, 0. ]), 'Reward', 0.0080022720056130391)
('Episode', 0, 'Step', 780.0, 'Epsilon', 0.9973966666666496, 'Action', array([ 0.43877278, 0.54165165, 0. ]), 'Reward', 0.14550624207865459)
('Ep
Fuel consumption disabled!
Laptime limit disabled!
Visual Properties Report
------------------------
Compatibility mode, properties unknown.
Waiting for request on port 3101
Timeout for client answer
Timeout for client answer
Timeout for client answer
Timeout for client answer
Timeout for client answer
******* RESTARTING *****
isode', 0, 'Step', 795.0, 'Epsilon', 0.9973466666666493, 'Action', array([-0.19380755, 0.42615512, 0. ]), 'Reward', 0.18818885819068848)
('Episode', 0, 'Step', 810.0, 'Epsilon', 0.997296666666649, 'Action', array([ 0.38693959, 0.7020155 , 0. ]), 'Reward', -0.024863609068227707)
('Episode', 0, 'Step', 825.0, 'Epsilon', 0.9972466666666486, 'Action', array([-0.94391496, 0.4744486 , 0. ]), 'Reward', 0.035794908146076318)
('Episode', 0, 'Step', 840.0, 'Epsilon', 0.9971966666666483, 'Action', array([ 0.31725887, 0.37058954, 0. ]), 'Reward', -0.14893408591718041)
('Episode', 0, 'Step', 855.0, 'Epsilon', 0.997146666666648, 'Action', array([-0.15352005, 0.57716383, 0. ]), 'Reward', -0.034721585011370404)
('Episode', 0, 'Step', 870.0, 'Epsilon', 0.9970966666666476, 'Action', array([ 1. , 0.6937588, 0. ]), 'Reward', -0.77967537845369472)
('Episode', 0, 'Step', 885.0, 'Epsilon', 0.9970466666666473, 'Action', array([-1. , 0.33555364, 0. ]), 'Reward', -0.14268603314995021)
('Episode', 0, 'Step', 900.0, 'Epsilon', 0.996996666666647, 'Action', array([-0.83729161, 0.63950886, 0.01388012]), 'Reward', -0.45788708194080946)
('Episode', 0, 'Step', 915.0, 'Epsilon', 0.9969466666666467, 'Action', array([-0.81376963, 0.52244441, 0. ]), 'Reward', -0.43094061848897725)
Terminating because Turned Back
Now we save model with reward -193.296652126 previous best reward was -100000
TOTAL REWARD @ 0-th Episode : Reward -193.296652126
Total Step: 920
Client connected on 3101..............
Episode : 1 Replay Buffer 920 Early Stopping: 0 Epsilon: 0.996933333333 RN: 0.288145016735
('Episode', 1, 'Step', 10.0, 'Epsilon', 0.9968966666666463, 'Action', array([-1. , 0.67585902, 0. ]), 'Reward', 8.3380028888340689)
('Episode', 1, 'Step', 25.0, 'Epsilon', 0.996846666666646, 'Action', array([ 0.62769857, 0.41247397, 0. ]), 'Reward', -81.209147038182195)
('Episode', 1, 'Step', 40.0, 'Epsilon', 0.9967966666666457, 'Action', array([-0.63510969, 0.46050319, 0. ]), 'Reward', -61.177980297195248)
('Episode', 1, 'Step', 55.0, 'Epsilon', 0.9967466666666454, 'Action', array([-0.90894125, 0.4595747 , 0. ]), 'Reward', -76.826540355439803)
('Episode', 1, 'Step', 70.0, 'Epsilon', 0.996696666666645, 'Action', array([-1. , 0.65041167, 0. ]), 'Reward', -89.341768541546926)
('Episode', 1, 'Step', 85.0, 'Epsilon', 0.9966466666666447, 'Action', array([ 1. , 0.52629981, 0. ]), 'Reward', -100.90335778218687)
('Episode', 1, 'Step', 100.0, 'Epsilon', 0.9965966666666444, 'Action', array([ 1. , 0.44532857, 0. ]), 'Reward', -93.842068894257395)
('Episode', 1, 'Step', 115.0, 'Epsilon', 0.996546666666644, 'Action', array([-1. , 0.42762726, 0. ]), 'Reward', -65.696094621022525)
('Episode', 1, 'Step', 130.0, 'Epsilon', 0.9964966666666437, 'Action', array([-0.02016197, 0.37399849, 0. ]), 'Reward', 1.1313599180106433)
('Episode', 1, 'Step', 145.0, 'Epsilon', 0.9964466666666434, 'Action', array([-0.91171367, 0.49234582, 0. ]), 'Reward', -0.061065359322348578)
('Episode', 1, 'Step', 160.0, 'Epsilon', 0.9963966666666431, 'Action', array([ 0.09429133, 0.54192143, 0. ]), 'Reward', 0.053954770474746658)
('Episode', 1, 'Step', 175.0, 'Epsilon', 0.9963466666666427, 'Action', array([ 0.00833106, 0.56077807, 0. ]), 'Reward', -0.43964395444202076)
('Episode', 1, 'Step', 190.0, 'Epsilon', 0.9962966666666424, 'Action', array([ 1. , 0.63427107, 0. ]), 'Reward', -0.16281292979745685)
('Episode', 1, 'Step', 205.0, 'Epsilon', 0.9962466666666421, 'Action', array([-1. , 0.6152962 , 0.00579812]), 'Reward', -0.51040209119934865)
('Episode', 1, 'Step', 220.0, 'Epsilon', 0.9961966666666418, 'Action', array([-0.52406261, 0.33248832, 0. ]), 'Reward', -0.12247029242884799)
('Episode', 1, 'Step', 235.0, 'Epsilon', 0.9961466666666414, 'Action', array([-0.34625529, 0.51024634, 0. ]), 'Reward', 0.048241944034979542)
('Episode', 1, 'Step', 250.0, 'Epsilon', 0.9960966666666411, 'Action', array([ 0.48168735, 0.32886615, 0. ]), 'Reward', -0.027872545189291172)
('Episode', 1, 'Step', 265.0, 'Epsilon', 0.9960466666666408, 'Action', array([ 0.92453688, 0.60342756, 0. ]), 'Reward', -0.44659056970010835)
('Episode', 1, 'Step', 280.0, 'Epsilon', 0.9959966666666404, 'Action', array([ 0.21157175, 0.62186715, 0. ]), 'Reward', -0.37071183498785204)
('Episode', 1, 'Step', 295.0, 'Epsilon', 0.9959466666666401, 'Action', array([-0.25126616, 0.40105854, 0. ]), 'Reward', -0.44336925048240439)
('Episode', 1, 'Step', 310.0, 'Epsilon', 0.9958966666666398, 'Action', array([-0.43969177, 0.66557952, 0. ]), 'Reward', -0.55742805850518706)
('Episode', 1, 'Step', 325.0, 'Epsilon', 0.9958466666666395, 'Action', array([-0.66042504, 0.46346241, 0. ]), 'Reward', -0.39266946176007855)
('Episode', 1, 'Step', 340.0, 'Epsilon', 0.9957966666666391, 'Action', array([-1. , 0.48232092, 0. ]), 'Reward', -0.49383008125878314)
('Episode', 1, 'Step', 355.0, 'Epsilon', 0.9957466666666388, 'Action', array([-0.87334682, 0.52300338, 0. ]), 'Reward', -0.51884482517069741)
('Episode', 1, 'Step', 370.0, 'Epsilon', 0.9956966666666385, 'Action', array([-1. , 0.45644473, 0. ]), 'Reward', -0.75098898242763756)
('Episode', 1, 'Step', 385.0, 'Epsilon', 0.9956466666666381, 'Action', array([-1. , 0.43819013, 0. ]), 'Reward', -0.61544150867472946)
('Episode', 1, 'Step', 400.0, 'Epsilon', 0.9955966666666378, 'Action', array([-0.51530599, 0.48533823, 0. ]), 'Reward', -0.29345932150076925)
('Episode', 1, 'Step', 415.0, 'Epsilon', 0.9955466666666375, 'Action', array([-0.93870246, 0.45431285, 0. ]), 'Reward', -0.81007334522880392)
('Episode', 1, 'Step', 430.0, 'Epsilon', 0.9954966666666372, 'Action', array([ 1. , 0.59999672, 0. ]), 'Reward', -0.4596095566767251)
('Episode', 1, 'Step', 445.0, 'Epsilon', 0.9954466666666368, 'Action', array([ 0.03226654, 0.47731807, 0. ]), 'Reward', -0.40011704422362582)
('Episode', 1, 'Step', 460.0, 'Epsilon', 0.9953966666666365, 'Action', array([-1. , 0.54775869, 0. ]), 'Reward', -4.0054143093431902)
('Episode', 1, 'Step', 475.0, 'Epsilon', 0.9953466666666362, 'Action', array([-1. , 0.49564838, 0. ]), 'Reward', -10.148354371307803)
('Episode', 1, 'Step', 490.0, 'Epsilon', 0.9952966666666359, 'Action', array([-1. , 0.48707158, 0. ]), 'Reward', -14.29340717199752)
('Episode', 1, 'Step', 505.0, 'Epsilon', 0.9952466666666355, 'Action', array([ 0.18258608, 0.55052116, 0. ]), 'Reward', -0.45947230393822786)
('Episode', 1, 'Step', 520.0, 'Epsilon', 0.9951966666666352, 'Action', array([-1. , 0.59874093, 0. ]), 'Reward', -0.31942218054763327)
('Episode', 1, 'Step', 535.0, 'Epsilon', 0.9951466666666349, 'Action', array([-0.62841091, 0.54366499, 0. ]), 'Reward', -0.31669552575181026)
('Episode', 1, 'Step', 550.0, 'Epsilon', 0.9950966666666345, 'Action', array([ 0.76229406, 0.55880244, 0. ]), 'Reward', -1.0211595618650469)
('Episode', 1, 'Step', 565.0, 'Epsilon', 0.9950466666666342, 'Action', array([ 0.96722142, 0.42408044, 0. ]), 'Reward', -1.0227118848244499)
('Episode', 1, 'Step', 580.0, 'Epsilon', 0.9949966666666339, 'Action', array([ 0.63626665, 0.58110782, 0. ]), 'Reward', -0.97451637668228042)
('Episode', 1, 'Step', 595.0, 'Epsilon', 0.9949466666666336, 'Action', array([-0.03844239, 0.55598486, 0. ]), 'Reward', -1.2573786850302122)
('Episode', 1, 'Step', 610.0, 'Epsilon', 0.9948966666666332, 'Action', array([-1. , 0.52476924, 0. ]), 'Reward', -0.81909613845991047)
('Episode', 1, 'Step', 625.0, 'Epsilon', 0.9948466666666329, 'Action', array([ 0.09372935, 0.65556869, 0. ]), 'Reward', -1.4814409924894845)
('Episode', 1, 'Step', 640.0, 'Epsilon', 0.9947966666666326, 'Action', array([-1. , 0.52732727, 0. ]), 'Reward', -0.92978418282027642)
('Episode', 1, 'Step', 655.0, 'Epsilon', 0.9947466666666323, 'Action', array([ 0.23817317, 0.51756203, 0. ]), 'Reward', -2.1347762804128072)
('Episode', 1, 'Step', 670.0, 'Epsilon', 0.9946966666666319, 'Action', array([-1. , 0.56111234, 0. ]), 'Reward', -1.5063800768062041)
('Episode', 1, 'Step', 685.0, 'Epsilon', 0.9946466666666316, 'Action', array([ 0.02990889, 0.44471322, 0. ]), 'Reward', -1.3855686356093848)
('Episode', 1, 'Step', 700.0, 'Epsilon', 0.9945966666666313, 'Action', array([-0.83494083, 0.41722177, 0. ]), 'Reward', -1.4104354507903096)
('Episode', 1, 'Step', 715.0, 'Epsilon', 0.9945466666666309, 'Action', array([-0.15266388, 0.6367864 , 0. ]), 'Reward', -4.7722672394423)
('Episode', 1, 'Step', 730.0, 'Epsilon', 0.9944966666666306, 'Action', array([-0.13687453, 0.41158722, 0. ]), 'Reward', -7.1759761661207087)
('Episode', 1, 'Step', 745.0, 'Epsilon', 0.9944466666666303, 'Action', array([-1. , 0.64631115, 0. ]), 'Reward', -14.130617953852557)
('Episode', 1, 'Step', 760.0, 'Epsilon', 0.99439666666663, 'Action', array([-0.08372943, 0.46610775, 0. ]), 'Reward', -12.457472871054833)
('Episode', 1, 'Step', 775.0, 'Epsilon', 0.9943466666666296, 'Action', array([-0.8603427 , 0.56456882, 0. ]), 'Reward', -1.6347366874879672)
('Episode', 1, 'Step', 790.0, 'Epsilon', 0.9942966666666293, 'Action', array([-0.12453984, 0.48381874, 0. ]), 'Reward', -0.40284229325018506)
('Episode', 1, 'Step', 805.0, 'Epsilon', 0.994246666666629, 'Action', array([-0.30698496, 0.72439677, 0. ]), 'Reward', -0.62681970097233886)
('Episode', 1, 'Step', 820.0, 'Epsilon', 0.9941966666666286, 'Action', array([ 0.40519484, 0.40512914, 0. ]), 'Reward', -1.4395679180978993)
('Episode', 1, 'Step', 835.0, 'Epsilon', 0.9941466666666283, 'Action', array([ 0.25866467, 0.31194429, 0. ]), 'Reward', -0.32333262776724042)
('Episode', 1, 'Step', 850.0, 'Epsilon', 0.994096666666628, 'Action', array([-0.39146909, 0.58043441, 0. ]), 'Reward', -0.44836400402185744)
('Episode', 1, 'Step', 865.0, 'Epsilon', 0.9940466666666277, 'Action', array([ 0.53735947, 0.40135706, 0. ]), 'Reward', -0.50290747032932803)
('Episode', 1, 'Step', 880.0, 'Epsilon', 0.9939966666666273, 'Action', array([-0.40340888, 0.37391448, 0. ]), 'Reward', -0.33405342092655493)
('Episode', 1, 'Step', 895.0, 'Epsilon', 0.993946666666627, 'Action', array([-1. , 0.43217911, 0. ]), 'Reward', -0.16049349810251629)
('Episode', 1, 'Step', 910.0, 'Epsilon', 0.9938966666666267, 'Action', array([-0.36341601, 0.2773313 , 0. ]), 'Reward', -0.47243779244626694)
('Episode', 1, 'Step', 925.0, 'Epsilon', 0.9938466666666264, 'Action', array([ 0.87539223, 0.36535275, 0. ]), 'Reward', -1.1734771734744318)
('Episode', 1, 'Step', 940.0, 'Epsilon', 0.993796666666626, 'Action', array([ 1. , 0.45494798, 0. ]), 'Reward', -0.72376774932502497)
('Episode', 1, 'Step', 955.0, 'Epsilon', 0.9937466666666257, 'Action', array([ 0.36839828, 0.51143321, 0. ]), 'Reward', -1.4381248566299378)
('Episode', 1, 'Step', 970.0, 'Epsilon', 0.9936966666666254, 'Action', array([-1. , 0.48938303, 0. ]), 'Reward', -0.59542682622020759)
('Episode', 1, 'Step', 985.0, 'Epsilon', 0.993646666666625, 'Action', array([ 0.94768191, 0.46362714, 0. ]), 'Reward', -1.256287080919035)
('Episode', 1, 'Step', 1000.0, 'Epsilon', 0.9935966666666247, 'Action', array([-1. , 0.4996442, 0. ]), 'Reward', -1.0579070509442658)
('Episode', 1, 'Step', 1015.0, 'Epsilon', 0.9935466666666244, 'Action', array([-0.21420125, 0.55575007, 0. ]), 'Reward', -2.7219496139467818)
('Episode', 1, 'Step', 1030.0, 'Epsilon', 0.9934966666666241, 'Action', array([ 0.0458459 , 0.51971346, 0. ]), 'Reward', -1.7801694021581325)
('Episode', 1, 'Step', 1045.0, 'Epsilon', 0.9934466666666237, 'Action', array([-0.73392032, 0.63427147, 0. ]), 'Reward', -2.7078399620775429)
('Episode', 1, 'Step', 1060.0, 'Epsilon', 0.9933966666666234, 'Action', array([ 0.22944728, 0.50883796, 0. ]), 'Reward', -9.0757429555449924)
('Episode', 1, 'Step', 1075.0, 'Epsilon', 0.9933466666666231, 'Action', array([-0.23115093, 0.48877052, 0. ]), 'Reward', -45.324713930954061)
('Episode', 1, 'Step', 1090.0, 'Epsilon', 0.9932966666666228, 'Action', array([-1. , 0.50861392, 0. ]), 'Reward', -0.3110299195348521)
('Episode', 1, 'Step', 1105.0, 'Epsilon', 0.9932466666666224, 'Action', array([-1. , 0.47232117, 0. ]), 'Reward', -0.18730478930193484)
('Episode', 1, 'Step', 1120.0, 'Epsilon', 0.9931966666666221, 'Action', array([ 0.62519486, 0.50211983, 0. ]), 'Reward', -0.24267045112107941)
('Episode', 1, 'Step', 1135.0, 'Epsilon', 0.9931466666666218, 'Action', array([-0.63409038, 0.51310379, 0. ]), 'Reward', -0.48473277543677562)
('Episode', 1, 'Step', 1150.0, 'Epsilon', 0.9930966666666214, 'Action', array([-1. , 0.40270664, 0. ]), 'Reward', -0.2590696764281788)
('Episode', 1, 'Step', 1165.0, 'Epsilon', 0.9930466666666211, 'Action', array([-0.63835643, 0.44728375, 0. ]), 'Reward', -0.39550223913711025)
('Episode', 1, 'Step', 1180.0, 'Epsilon', 0.9929966666666208, 'Action', array([ 1. , 0.42407587, 0. ]), 'Reward', -0.31443540108991352)
('Episode', 1, 'Step', 1195.0, 'Epsilon', 0.9929466666666205, 'Action', array([-0.69902666, 0.45118228, 0. ]), 'Reward', -0.27553278766886768)
('Episode', 1, 'Step', 1210.0, 'Epsilon', 0.9928966666666201, 'Action', array([-0.76086971, 0.6056412 , 0. ]), 'Reward', -0.59249250313645108)
('Episode', 1, 'Step', 1225.0, 'Epsilon', 0.9928466666666198, 'Action', array([-0.50501095, 0.42562676, 0. ]), 'Reward', -0.37234908573119119)
('Episode', 1, 'Step', 1240.0, 'Epsilon', 0.9927966666666195, 'Action', array([-0.33502362, 0.38665853, 0. ]), 'Reward', -0.46749031913560379)
('Episode', 1, 'Step', 1255.0, 'Epsilon', 0.9927466666666191, 'Action', array([-1. , 0.5119424, 0. ]), 'Reward', -0.46859707871263079)
('Episode', 1, 'Step', 1270.0, 'Epsilon', 0.9926966666666188, 'Action', array([ 0.65236215, 0.47142644, 0. ]), 'Reward', -0.26752113780140646)
('Episode', 1, 'Step', 1285.0, 'Epsilon', 0.9926466666666185, 'Action', array([-0.28958635, 0.52451681, 0. ]), 'Reward', -0.3682231588881314)
('Episode', 1, 'Step', 1300.0, 'Epsilon', 0.9925966666666182, 'Action', array([-1. , 0.41446919, 0. ]), 'Reward', -0.70737876632421959)
('Episode', 1, 'Step', 1315.0, 'Epsilon', 0.9925466666666178, 'Action', array([-0.28786125, 0.52911752, 0. ]), 'Reward', -0.47510682011318733)
('Episode', 1, 'Step', 1330.0, 'Epsilon', 0.9924966666666175, 'Action', array([-1. , 0.3741889, 0. ]), 'Reward', -0.76654295862779509)
('Episode', 1, 'Step', 1345.0, 'Epsilon', 0.9924466666666172, 'Action', array([-0.71878627, 0.73020089, 0. ]), 'Reward', -1.2524054325119094)
('Episode', 1, 'Step', 1360.0, 'Epsilon', 0.9923966666666169, 'Action', array([-0.45343495, 0.53471124, 0. ]), 'Reward', -1.9051167640705833)
('Episode', 1, 'Step', 1375.0, 'Epsilon', 0.9923466666666165, 'Action', array([-1. , 0.54585514, 0. ]), 'Reward', -2.3766647935589917)
('Episode', 1, 'Step', 1390.0, 'Epsilon', 0.9922966666666162, 'Action', array([-0.52988897, 0.7372214 , 0. ]), 'Reward', -2.3153772800350927)
('Episode', 1, 'Step', 1405.0, 'Epsilon', 0.9922466666666159, 'Action', array([-0.68497892, 0.59770123, 0. ]), 'Reward', -0.38768334496388102)
('Episode', 1, 'Step', 1420.0, 'Epsilon', 0.9921966666666155, 'Action', array([-1. , 0.51131977, 0. ]), 'Reward', -0.24049953146809119)
('Episode', 1, 'Step', 1435.0, 'Epsilon', 0.9921466666666152, 'Action', array([-0.10271778, 0.44987474, 0. ]), 'Reward', -0.48813057397713833)
('Episode', 1, 'Step', 1450.0, 'Epsilon', 0.9920966666666149, 'Action', array([-0.02971459, 0.47457656, 0. ]), 'Reward', -0.78862777095113545)
('Episode', 1, 'Step', 1465.0, 'Epsilon', 0.9920466666666146, 'Action', array([ 0.08683622, 0.60557085, 0. ]), 'Reward', -0.71484222531113928)
('Episode', 1, 'Step', 1480.0, 'Epsilon', 0.9919966666666142, 'Action', array([-1. , 0.43031083, 0. ]), 'Reward', -0.41074319844675578)
('Episode', 1, 'Step', 1495.0, 'Epsilon', 0.9919466666666139, 'Action', array([-0.2810796 , 0.65164453, 0. ]), 'Reward', -2.6836480239149747)
('Episode', 1, 'Step', 1510.0, 'Epsilon', 0.9918966666666136, 'Action', array([-0.51803081, 0.58276996, 0. ]), 'Reward', -5.176114805624227)
('Episode', 1, 'Step', 1525.0, 'Epsilon', 0.9918466666666133, 'Action', array([-0.12082993, 0.45628093, 0. ]), 'Reward', -0.0027045645038798593)
('Episode', 1, 'Step', 1540.0, 'Epsilon', 0.9917966666666129, 'Action', array([ 0.28465753, 0.62663247, 0. ]), 'Reward', -0.21756511428588082)
('Episode', 1, 'Step', 1555.0, 'Epsilon', 0.9917466666666126, 'Action', array([-1. , 0.55523546, 0. ]), 'Reward', -0.08189791546614375)
('Episode', 1, 'Step', 1570.0, 'Epsilon', 0.9916966666666123, 'Action', array([ 1. , 0.51003783, 0. ]), 'Reward', -0.21788985929316401)
('Episode', 1, 'Step', 1585.0, 'Epsilon', 0.9916466666666119, 'Action', array([-0.98891765, 0.51967475, 0. ]), 'Reward', -0.24435165139971116)
('Episode', 1, 'Step', 1600.0, 'Epsilon', 0.9915966666666116, 'Action', array([-1. , 0.45035453, 0. ]), 'Reward', -0.25009594810055008)
('Episode', 1, 'Step', 1615.0, 'Epsilon', 0.9915466666666113, 'Action', array([ 0.08026813, 0.45115506, 0. ]), 'Reward', -0.17855743303234425)
('Episode', 1, 'Step', 1630.0, 'Epsilon', 0.991496666666611, 'Action', array([-0.31550348, 0.49349873, 0. ]), 'Reward', -0.28026602093331576)
('Episode', 1, 'Step', 1645.0, 'Epsilon', 0.9914466666666106, 'Action', array([-0.72863349, 0.43258132, 0. ]), 'Reward', -0.22689861193849675)
('Episode', 1, 'Step', 1660.0, 'Epsilon', 0.9913966666666103, 'Action', array([ 1. , 0.58828713, 0. ]), 'Reward', -0.20488184718611774)
('Episode', 1, 'Step', 1675.0, 'Epsilon', 0.99134666666661, 'Action', array([-0.34370383, 0.4268948 , 0. ]), 'Reward', -0.2306720298055302)
('Episode', 1, 'Step', 1690.0, 'Epsilon', 0.9912966666666096, 'Action', array([-0.72324314, 0.41118787, 0. ]), 'Reward', -0.44960732510466334)
('Episode', 1, 'Step', 1705.0, 'Epsilon', 0.9912466666666093, 'Action', array([ 0.3232234 , 0.58592377, 0. ]), 'Reward', -0.44495689482555023)
('Episode', 1, 'Step', 1720.0, 'Epsilon', 0.991196666666609, 'Action', array([ 1. , 0.45706636, 0. ]), 'Reward', -0.3298918490724263)
('Episode', 1, 'Step', 1735.0, 'Epsilon', 0.9911466666666087, 'Action', array([-0.51230156, 0.60620778, 0. ]), 'Reward', -0.43027664178018837)
('Episode', 1, 'Step', 1750.0, 'Epsilon', 0.9910966666666083, 'Action', array([ 0.52819397, 0.51514697, 0. ]), 'Reward', -0.19588437648548154)
('Episode', 1, 'Step', 1765.0, 'Epsilon', 0.991046666666608, 'Action', array([ 0.96104107, 0.4614162 , 0. ]), 'Reward', -0.24948753601668103)
('Episode', 1, 'Step', 1780.0, 'Epsilon', 0.9909966666666077, 'Action', array([ 0.53716429, 0.47914533, 0. ]), 'Reward', -0.22522489143579608)
('Episode', 1, 'Step', 1795.0, 'Epsilon', 0.9909466666666074, 'Action', array([ 0.71185894, 0.57568351, 0. ]), 'Reward', -0.42357928694221286)
('Episode', 1, 'Step', 1810.0, 'Epsilon', 0.990896666666607, 'Action', array([ 1. , 0.2780566, 0. ]), 'Reward', -0.14004226575431861)
('Episode', 1, 'Step', 1825.0, 'Epsilon', 0.9908466666666067, 'Action', array([ 0.65642911, 0.45760956, 0. ]), 'Reward', -0.4004541771961132)
('Episode', 1, 'Step', 1840.0, 'Epsilon', 0.9907966666666064, 'Action', array([-0.24487451, 0.51097721, 0. ]), 'Reward', -0.75895083922723106)
('Episode', 1, 'Step', 1855.0, 'Epsilon', 0.990746666666606, 'Action', array([ 1. , 0.55862588, 0. ]), 'Reward', -0.45741118830410471)
('Episode', 1, 'Step', 1870.0, 'Epsilon', 0.9906966666666057, 'Action', array([-0.92519773, 0.33327451, 0. ]), 'RewaWaiting for request on port 3101
******* RESTARTING *****
rd', -0.98449690978087534)
('Episode', 1, 'Step', 1885.0, 'Epsilon', 0.9906466666666054, 'Action', array([ 0.67561267, 0.5514747 , 0. ]), 'Reward', -0.77537626083258049)
('Episode', 1, 'Step', 1900.0, 'Epsilon', 0.9905966666666051, 'Action', array([-0.99714058, 0.47504247, 0. ]), 'Reward', -1.1277430368418628)
('Episode', 1, 'Step', 1915.0, 'Epsilon', 0.9905466666666047, 'Action', array([ 0.71887166, 0.44632217, 0. ]), 'Reward', -3.3274018567268886)
('Episode', 1, 'Step', 1930.0, 'Epsilon', 0.9904966666666044, 'Action', array([ 1. , 0.56074521, 0. ]), 'Reward', -1)
('Episode', 1, 'Step', 1945.0, 'Epsilon', 0.9904466666666041, 'Action', array([ 0.54578241, 0.48130723, 0. ]), 'Reward', -0.31492777706661845)
('Episode', 1, 'Step', 1960.0, 'Epsilon', 0.9903966666666038, 'Action', array([-1. , 0.53714286, 0. ]), 'Reward', -0.26990358391220992)
('Episode', 1, 'Step', 1975.0, 'Epsilon', 0.9903466666666034, 'Action', array([ 0.63359445, 0.68176915, 0. ]), 'Reward', -0.4586501892373463)
('Episode', 1, 'Step', 1990.0, 'Epsilon', 0.9902966666666031, 'Action', array([-0.83655266, 0.37955104, 0. ]), 'Reward', -0.25121313035428172)
TOTAL REWARD @ 1-th Episode : Reward -10945.7488717
Total Step: 2920
Waiting for server on 3101............
Count Down : 5
Client connected on 3101..............
Episode : 2 Replay Buffer 2920 Early Stopping: 0 Epsilon: 0.990266666667 RN: 0.880820084325
('Episode', 2, 'Step', 5.0, 'Epsilon', 0.9902466666666028, 'Action', array([ 0.45272604, 0.46864928, 0. ]), 'Reward', 6.3199014113315943)
('Episode', 2, 'Step', 20.0, 'Epsilon', 0.9901966666666024, 'Action', array([-0.58669389, 0.50201288, 0. ]), 'Reward', -2.6101233043038139)
('Episode', 2, 'Step', 35.0, 'Epsilon', 0.9901466666666021, 'Action', array([ 0.76434924, 0.47713053, 0. ]), 'Reward', -0.10340700768693711)
('Episode', 2, 'Step', 50.0, 'Epsilon', 0.9900966666666018, 'Action', array([-1. , 0.61698899, 0. ]), 'Reward', -0.45033014184082443)
('Episode', 2, 'Step', 65.0, 'Epsilon', 0.9900466666666015, 'Action', array([-0.00198914, 0.27606085, 0. ]), 'Reward', -0.010726083092688774)
('Episode', 2, 'Step', 80.0, 'Epsilon', 0.9899966666666011, 'Action', array([ 0.40239466, 0.57439616, 0. ]), 'Reward', -0.38948637853022988)
('Episode', 2, 'Step', 95.0, 'Epsilon', 0.9899466666666008, 'Action', array([ 0.36652379, 0.3841714 , 0. ]), 'Reward', -0.088933251868835633)
('Episode', 2, 'Step', 110.0, 'Epsilon', 0.9898966666666005, 'Action', array([ 0.69853795, 0.44936668, 0. ]), 'Reward', -0.084805547072514365)
('Episode', 2, 'Step', 125.0, 'Epsilon', 0.9898466666666002, 'Action', array([ 1. , 0.70039094, 0. ]), 'Reward', -0.42253709559465191)
('Episode', 2, 'Step', 140.0, 'Epsilon', 0.9897966666665998, 'Action', array([ 0.81315824, 0.43767115, 0. ]), 'Reward', -0.17255125109664049)
('Episode', 2, 'Step', 155.0, 'Epsilon', 0.9897466666665995, 'Action', array([ 0.70534085, 0.47318363, 0. ]), 'Reward', -0.080230076658673585)
('Episode', 2, 'Step', 170.0, 'Epsilon', 0.9896966666665992, 'Action', array([ 0.40286872, 0.53800652, 0. ]), 'Reward', -0.34721590160476723)
('Episode', 2, 'Step', 185.0, 'Epsilon', 0.9896466666665988, 'Action', array([ 1. , 0.41246263, 0. ]), 'Reward', -0.17783834950541116)
('Episode', 2, 'Step', 200.0, 'Epsilon', 0.9895966666665985, 'Action', array([-0.40389667, 0.57908396, 0. ]), 'Reward', -0.48644428019333857)
('Episode', 2, 'Step', 215.0, 'Epsilon', 0.9895466666665982, 'Action', array([-0.17819201, 0.44798728, 0. ]), 'Reward', -0.17893300415602381)
('Episode', 2, 'Step', 230.0, 'Epsilon', 0.9894966666665979, 'Action', array([ 0.80019168, 0.51444285, 0. ]), 'Reward', -0.17786219137907625)
('Episode', 2, 'Step', 245.0, 'Epsilon', 0.9894466666665975, 'Action', array([ 0.40048147, 0.42563922, 0. ]), 'Reward', -0.22813050577666238)
('Episode', 2, 'Step', 260.0, 'Epsilon', 0.9893966666665972, 'Action', array([ 0.67603467, 0.61054217, 0. ]), 'Reward', -0.28906362958087961)
('Episode', 2, 'Step', 275.0, 'Epsilon', 0.9893466666665969, 'Action', array([ 1. , 0.54595649, 0. ]), 'Reward', -0.31633358634102693)
('Episode', 2, 'Step', 290.0, 'Epsilon', 0.9892966666665965, 'Action', array([ 1. , 0.49165773, 0. ]), 'Reward', -0.18664372010164462)
('Episode', 2, 'Step', 305.0, 'Epsilon', 0.9892466666665962, 'Action', array([-0.40005008, 0.43933866, 0. ]), 'Reward', -0.51337898862081555)
('Episode', 2, 'Step', 320.0, 'Epsilon', 0.9891966666665959, 'Action', array([ 0.43827966, 0.33896538, 0. ]), 'Reward', -0.13258794761827114)
('Episode', 2, 'Step', 335.0, 'Epsilon', 0.9891466666665956, 'Action', array([-0.46651907, 0.45220036, 0. ]), 'Reward', -0.56221745265210477)
('Episode', 2, 'Step', 350.0, 'Epsilon', 0.9890966666665952, 'Action', array([ 0.68568827, 0.50928354, 0. ]), 'Reward', -0.26729486188912355)
('Episode', 2, 'Step', 365.0, 'Epsilon', 0.9890466666665949, 'Action', array([ 0.49547907, 0.64778294, 0. ]), 'Reward', -0.41310493080913291)
('Episode', 2, 'Step', 380.0, 'Epsilon', 0.9889966666665946, 'Action', array([ 0.08058957, 0.46522594, 0. ]), 'Reward', -0.51790396245954029)
('Episode', 2, 'Step', 395.0, 'Epsilon', 0.9889466666665943, 'Action', array([ 0.26383312, 0.53588314, 0. ]), 'Reward', -0.40516190776946676)
('Episode', 2, 'Step', 410.0, 'Epsilon', 0.9888966666665939, 'Action', array([ 0.21087338, 0.32807054, 0. ]), 'Reward', -0.19745147444179556)
('Episode', 2, 'Step', 425.0, 'Epsilon', 0.9888466666665936, 'Action', array([ 1. , 0.4751352, 0. ]), 'Reward', -0.12541396217452722)
('Episode', 2, 'Step', 440.0, 'Epsilon', 0.9887966666665933, 'Action', array([ 0.01856511, 0.57787763, 0. ]), 'Reward', -0.67005580619921168)
('Episode', 2, 'Step', 455.0, 'Epsilon', 0.9887466666665929, 'Action', array([ 0.58094314, 0.7209174 , 0. ]), 'Reward', -0.85893997403248812)
('Episode', 2, 'Step', 470.0, 'Epsilon', 0.9886966666665926, 'Action', array([ 1. , 0.44575845, 0. ]), 'Reward', -0.18877024574991058)
('Episode', 2, 'Step', 485.0, 'Epsilon', 0.9886466666665923, 'Action', array([-0.03755302, 0.71473465, 0. ]), 'Reward', -1.0586196556290506)
('Episode', 2, 'Step', 500.0, 'Epsilon', 0.988596666666592, 'Action', array([ 0.46723824, 0.35607 , 0. ]), 'Reward', -0.22217518426427318)
('Episode', 2, 'Step', 515.0, 'Epsilon', 0.9885466666665916, 'Action', array([-0.20441749, 0.48441062, 0. ]), 'Reward', -0.55355139267791809)
('Episode', 2, 'Step', 530.0, 'Epsilon', 0.9884966666665913, 'Action', array([ 0.52812996, 0.46730003, 0. ]), 'Reward', -0.24208965991872566)
('Episode', 2, 'Step', 545.0, 'Epsilon', 0.988446666666591, 'Action', array([-1. , 0.45278775, 0. ]), 'Reward', -0.97258871213857612)
('Episode', 2, 'Step', 560.0, 'Epsilon', 0.9883966666665907, 'Action', array([ 0.48635804, 0.43642385, 0. ]), 'Reward', -0.35028492900358121)
('Episode', 2, 'Step', 575.0, 'Epsilon', 0.9883466666665903, 'Action', array([ 0.89859608, 0.31673875, 0. ]), 'Reward', -0.13126081830387171)
('Episode', 2, 'Step', 590.0, 'Epsilon', 0.98829666666659, 'Action', array([ 0.77621736, 0.54338108, 0. ]), 'Reward', -0.37956566181940243)
('Episode', 2, 'Step', 605.0, 'Epsilon', 0.9882466666665897, 'Action', array([ 0.49388287, 0.3804371 , 0. ]), 'Reward', -0.34912543050690881)
('Episode', 2, 'Step', 620.0, 'Epsilon', 0.9881966666665893, 'Action', array([ 0.64617361, 0.51333092, 0. ]), 'Reward', -0.30695545602697882)
('Episode', 2, 'Step', 635.0, 'Epsilon', 0.988146666666589, 'Action', array([-0.18000785, 0.55269329, 0. ]), 'Reward', -1.1062525582706657)
('Episode', 2, 'Step', 650.0, 'Epsilon', 0.9880966666665887, 'Action', array([ 0.90671701, 0.49791099, 0. ]), 'Reward', -0.20272236115693437)
('Episode', 2, 'Step', 665.0, 'Epsilon', 0.9880466666665884, 'Action', array([-0.20104415, 0.65473061, 0. ]), 'Reward', -1.3302464482994263)
('Episode', 2, 'Step', 680.0, 'Epsilon', 0.987996666666588, 'Action', array([-0.41517426, 0.54055194, 0. ]), 'Reward', -1.1683877932912594)
('Episode', 2, 'Step', 695.0, 'Epsilon', 0.9879466666665877, 'Action', array([ 0.1872271 , 0.54972926, 0. ]), 'Reward', -0.55569952347400342)
('Episode', 2, 'Step', 710.0, 'Epsilon', 0.9878966666665874, 'Action', array([ 0.38269217, 0.61885989, 0. ]), 'Reward', -1.2746141344093269)
('Episode', 2, 'Step', 725.0, 'Epsilon', 0.987846666666587, 'Action', array([ 0.41788333, 0.24436476, 0. ]), 'Reward', -1.1625682932078547)
('Episode', 2, 'Step', 740.0, 'Epsilon', 0.9877966666665867, 'Action', array([ 0.900866 , 0.62236753, 0. ]), 'Reward', -0.66607607745727115)
('Episode', 2, 'Step', 755.0, 'Epsilon', 0.9877466666665864, 'Action', array([-0.24939121, 0.63890104, 0. ]), 'Reward', -1.1267478133265461)
('Episode', 2, 'Step', 770.0, 'Epsilon', 0.9876966666665861, 'Action', array([-0.32277862, 0.40823723, 0. ]), 'Reward', -0.64798097574514468)
('Episode', 2, 'Step', 785.0, 'Epsilon', 0.9876466666665857, 'Action', array([ 1. , 0.26894635, 0. ]), 'Reward', -0.11227833505147455)
('Episode', 2, 'Step', 800.0, 'Epsilon', 0.9875966666665854, 'Action', array([ 0.57991965, 0.47285981, 0.01164939]), 'Reward', -0.59173662004067107)
('Episode', 2, 'Step', 815.0, 'Epsilon', 0.9875466666665851, 'Action', array([ 0.34148985, 0.66837289, 0. ]), 'Reward', -1.0881793778188218)
('Episode', 2, 'Step', 830.0, 'Epsilon', 0.9874966666665848, 'Action', array([ 1.00000000e+00, 4.41323916e-01, 9.79888892e-04]), 'Reward', -0.24390535635807864)
('Episode', 2, 'Step', 845.0, 'Epsilon', 0.9874466666665844, 'Action', array([ 0.34800112, 0.58256306, 0. ]), 'Reward', -1.1300444283518034)
('Episode', 2, 'Step', 860.0, 'Epsilon', 0.9873966666665841, 'Action', array([-0.50666735, 0.38975678, 0. ]), 'Reward', -0.79733214414456643)
('Episode', 2, 'Step', 875.0, 'Epsilon', 0.9873466666665838, 'Action', array([ 0.56835777, 0.56243665, 0. ]), 'Reward', -0.65936696868004741)
('Episode', 2, 'Step', 890.0, 'Epsilon', 0.9872966666665834, 'Action', array([ 0.4610323 , 0.59411969, 0. ]), 'Reward', -0.57116235615798505)
('Episode', 2, 'Step', 905.0, 'Epsilon', 0.9872466666665831, 'Action', array([-1. , 0.56617814, 0. ]), 'Reward', -1.8090446279174861)
('Episode', 2, 'Step', 920.0, 'Epsilon', 0.9871966666665828, 'Action', array([ 1. , 0.26346781, 0.02418782]), 'Reward', -0.2692023998660798)
('Episode', 2, 'Step', 935.0, 'Epsilon', 0.9871466666665825, 'Action', array([ 0.36792533, 0.51646739, 0. ]), 'Reward', -0.60995271590715461)
('Episode', 2, 'Step', 950.0, 'Epsilon', 0.9870966666665821, 'Action', array([ 1. , 0.18052944, 0. ]), 'Reward', -0.9027397356414042)
('Episode', 2, 'Step', 965.0, 'Epsilon', 0.9870466666665818, 'Action', array([ 0.52998064, 0.46994128, 0. ]), 'Reward', -0.86534568473706575)
('Episode', 2, 'Step', 980.0, 'Epsilon', 0.9869966666665815, 'Action', array([ 1. , 0.74243729, 0.00175937]), 'Reward', -0.61912514017261344)
('Episode', 2, 'Step', 995.0, 'Epsilon', 0.9869466666665812, 'Action', array([ 0.11513682, 0.56275851, 0. ]), 'Reward', -1.0852881366735052)
('Episode', 2, 'Step', 1010.0, 'Epsilon', 0.9868966666665808, 'Action', array([-0.1855699 , 0.49176691, 0. ]), 'Reward', -2.7773887095700189)
('Episode', 2, 'Step', 1025.0, 'Epsilon', 0.9868466666665805, 'Action', array([ 0.8527479, 0.4810884, 0. ]), 'Reward', -0.97214073060076078)
('Episode', 2, 'Step', 1040.0, 'Epsilon', 0.9867966666665802, 'Action', array([ 0.13211562, 0.61146693, 0. ]), 'Reward', -1.2127758411213443)
('Episode', 2, 'Step', 1055.0, 'Epsilon', 0.9867466666665798, 'Action', array([ 0.21748626, 0.55738113, 0. ]), 'Reward', -1.7516562089564065)
('Episode', 2, 'Step', 1070.0, 'Epsilon', 0.9866966666665795, 'Action', array([ 0.47234488, 0.34431383, 0. ]), 'Reward', -1.6497768005836155)
('Episode', 2, 'Step', 1085.0, 'Epsilon', 0.9866466666665792, 'Action', array([ 0.52593222, 0.59565136, 0. ]), 'Reward', -2.8795828396642049)
('Episode', 2, 'Step', 1100.0, 'Epsilon', 0.9865966666665789, 'Action', array([ 1. , 0.47496231, 0. ]), 'Reward', -1.2076623236994148)
('Episode', 2, 'Step', 1115.0, 'Epsilon', 0.9865466666665785, 'Action', array([ 0.06146156, 0.4194814 , 0. ]), 'Reward', -0.90315176001333564)
('Episode', 2, 'Step', 1130.0, 'Epsilon', 0.9864966666665782, 'Action', array([-0.22506514, 0.43976699, 0. ]), 'Reward', -0.8987135292377979)
('Episode', 2, 'Step', 1145.0, 'Epsilon', 0.9864466666665779, 'Action', array([ 1. , 0.56482333, 0. ]), 'Reward', -0.77844076598053147)
('Episode', 2, 'Step', 1160.0, 'Epsilon', 0.9863966666665775, 'Action', array([-0.24858828, 0.37370769, 0. ]), 'Reward', -4.9241250742975566)
('Episode', 2, 'Step', 1175.0, 'Epsilon', 0.9863466666665772, 'Action', array([ 0.25612862, 0.56711967, 0. ]), 'Reward', -3.7271197250226988)
('Episode', 2, 'Step', 1190.0, 'Epsilon', 0.9862966666665769, 'Action', array([-0.05122922, 0.50844702, 0. ]), 'Reward', -3.0847003877676666)
('Episode', 2, 'Step', 1205.0, 'Epsilon', 0.9862466666665766, 'Action', array([-0.94636008, 0.5627674 , 0. ]), 'Reward', -3.073251963819553)
('Episode', 2, 'Step', 1220.0, 'Epsilon', 0.9861966666665762, 'Action', array([ 0.18487978, 0.5359168 , 0. ]), 'Reward', -3.1168622593354254)
('Episode', 2, 'Step', 1235.0, 'Epsilon', 0.9861466666665759, 'Action', array([ 1. , 0.6560754, 0. ]), 'Reward', -3.3078332111024658)
('Episode', 2, 'Step', 1250.0, 'Epsilon', 0.9860966666665756, 'Action', array([ 0.03769147, 0.45686203, 0. ]), 'Reward', -3.4769487787562259)
('Episode', 2, 'Step', 1265.0, 'Epsilon', 0.9860466666665753, 'Action', array([ 1. , 0.55911239, 0. ]), 'Reward', -7.5868710059300568)
('Episode', 2, 'Step', 1280.0, 'Epsilon', 0.9859966666665749, 'Action', array([-0.70423718, 0.51603599, 0. ]), 'Reward', -14.463240455524037)
('Episode', 2, 'Step', 1295.0, 'Epsilon', 0.9859466666665746, 'Action', array([ 0.85043197, 0.50495414, 0. ]), 'Reward', 16.963627389353483)
('Episode', 2, 'Step', 1310.0, 'Epsilon', 0.9858966666665743, 'Action', array([-1. , 0.5873796, 0. ]), 'Reward', -0.46909899759251572)
('Episode', 2, 'Step', 1325.0, 'Epsilon', 0.985846666666574, 'Action', array([-0.75211087, 0.67317488, 0. ]), 'Reward', -0.35793505769928669)
('Episode', 2, 'Step', 1340.0, 'Epsilon', 0.9857966666665736, 'Action', array([-0.88837421, 0.51987371, 0. ]), 'Reward', -0.42923037589998392)
('Episode', 2, 'Step', 1355.0, 'Epsilon', 0.9857466666665733, 'Action', array([-0.82995181, 0.49213293, 0. ]), 'Reward', -0.19344172218382838)
('Episode', 2, 'Step', 1370.0, 'Epsilon', 0.985696666666573, 'Action', array([-1. , 0.54217822, 0. ]), 'Reward', -0.45940555784016912)
('Episode', 2, 'Step', 1385.0, 'Epsilon', 0.9856466666665726, 'Action', array([-1. , 0.5147585, 0. ]), 'Reward', -0.37363159915707472)
('Episode', 2, 'Step', 1400.0, 'Epsilon', 0.9855966666665723, 'Action', array([-0.57287729, 0.65148113, 0. ]), 'Reward', -0.48238429845363739)
('Episode', 2, 'Step', 1415.0, 'Epsilon', 0.985546666666572, 'Action', array([ 0.61223698, 0.44016366, 0. ]), 'Reward', -0.45136941851658779)
('Episode', 2, 'Step', 1430.0, 'Epsilon', 0.9854966666665717, 'Action', array([-0.84986036, 0.34461764, 0.04079204]), 'Reward', -0.0060826848446048163)
('Episode', 2, 'Step', 1445.0, 'Epsilon', 0.9854466666665713, 'Action', array([ 0.65388081, 0.45993332, 0. ]), 'Reward', -0.52806601674945997)
('Episode', 2, 'Step', 1460.0, 'Epsilon', 0.985396666666571, 'Action', array([-0.02680964, 0.47737651, 0. ]), 'Reward', -0.30009450960464229)
('Episode', 2, 'Step', 1475.0, 'Epsilon', 0.9853466666665707, 'Action', array([ 0.17143186, 0.43513585, 0. ]), 'Reward', -0.29721525868584864)
('Episode', 2, 'Step', 1490.0, 'Epsilon', 0.9852966666665703, 'Action', array([-0.09709966, 0.60803898, 0. ]), 'Reward', -0.48014370119828537)
('Episode', 2, 'Step', 1505.0, 'Epsilon', 0.98524666666657, 'Action', array([-1. , 0.52423914, 0. ]), 'Reward', -0.20756740895047668)
('Episode', 2, 'Step', 1520.0, 'Epsilon', 0.9851966666665697, 'Action', array([ 0.80893873, 0.42781064, 0. ]), 'Reward', -0.70496694091588996)
('Episode', 2, 'Step', 1535.0, 'Epsilon', 0.9851466666665694, 'Action', array([-0.28703727, 0.55320089, 0. ]), 'Reward', -4.2527928144355958)
('Episode', 2, 'Step', 1550.0, 'Epsilon', 0.985096666666569, 'Action', array([ 1. , 0.53445279, 0. ]), 'Reward', 23.18100265370115)
('Episode', 2, 'Step', 1565.0, 'Epsilon', 0.9850466666665687, 'Action', array([-1. , 0.54402032, 0. ]), 'Reward', 6.6098693982739647)
('Episode', 2, 'Step', 1580.0, 'Epsilon', 0.9849966666665684, 'Action', array([-0.10417523, 0.43434308, 0. ]), 'Reward', -21.704949428797597)
('Episode', 2, 'Step', 1595.0, 'Epsilon', 0.984946666666568, 'Action', array([-0.65038707, 0.40750745, 0. ]), 'Reward', -12.438653228303195)
('Episode', 2, 'Step', 1610.0, 'Epsilon', 0.9848966666665677, 'Action', array([-0.04846539, 0.5242638 , 0. ]), 'Reward', -2.1071891848737376)
('Episode', 2, 'Step', 1625.0, 'Epsilon', 0.9848466666665674, 'Action', array([-0.69925587, 0.57732664, 0. ]), 'Reward', -0.25580729332211738)
('Episode', 2, 'Step', 1640.0, 'Epsilon', 0.9847966666665671, 'Action', array([ 0.85001417, 0.39740325, 0. ]), 'Reward', -0.62053717514408113)
('Episode', 2, 'Step', 1655.0, 'Epsilon', 0.9847466666665667, 'Action', array([-1. , 0.62580172, 0. ]), 'Reward', -0.28413720050989122)
('Episode', 2, 'Step', 1670.0, 'Epsilon', 0.9846966666665664, 'Action', array([ 1. , 0.55091785, 0. ]), 'Reward', -0.59241966065482021)
('Episode', 2, 'Step', 1685.0, 'Epsilon', 0.9846466666665661, 'Action', array([-0.31215099, 0.5870226 , 0. ]), 'Reward', -0.2400391569924166)
('Episode', 2, 'Step', 1700.0, 'Epsilon', 0.9845966666665658, 'Action', array([-1. , 0.37844948, 0. ]), 'Reward', -0.23177333413446852)
('Episode', 2, 'Step', 1715.0, 'Epsilon', 0.9845466666665654, 'Action', array([-0.48694893, 0.58985133, 0. ]), 'Reward', -0.22709193740875272)
('Episode', 2, 'Step', 1730.0, 'Epsilon', 0.9844966666665651, 'Action', array([-0.88429758, 0.34604398, 0. ]), 'Reward', -0.20678938375770747)
('Episode', 2, 'Step', 1745.0, 'Epsilon', 0.9844466666665648, 'Action', array([-0.255548 , 0.48416749, 0. ]), 'Reward', -0.32602420498539469)
('Episode', 2, 'Step', 1760.0, 'Epsilon', 0.9843966666665644, 'Action', array([-0.85196282, 0.53421856, 0. ]), 'Reward', -0.39535123375516068)
('Episode', 2, 'Step', 1775.0, 'Epsilon', 0.9843466666665641, 'Action', array([ 0.22984243, 0.64289773, 0. ]), 'Reward', -0.60215456761490938)
('Episode', 2, 'Step', 1790.0, 'Epsilon', 0.9842966666665638, 'Action', array([ 0.27233294, 0.49430655, 0. ]), 'Reward', -0.55807149158494762)
('Episode', 2, 'Step', 1805.0, 'Epsilon', 0.9842466666665635, 'Action', array([-1. , 0.5820964, 0. ]), 'Reward', -0.32430783671200319)
('Episode', 2, 'Step', 1820.0, 'Epsilon', 0.9841966666665631, 'Action', array([-0.50754637, 0.51243127, 0. ]), 'Reward', -0.2154876854511143)
('Episode', 2, 'Step', 1835.0, 'Epsilon', 0.9841466666665628, 'Action', array([-0.76496711, 0.64529423, 0. ]), 'Reward', -0.25548156224635965)
('Episode', 2, 'Step', 1850.0, 'Epsilon', 0.9840966666665625, 'Action', array([-1. , 0.4087014, 0. ]), 'Reward', -0.079185250006722385)
('Episode', 2, 'Step', 1865.0, 'Epsilon', 0.9840466666665622, 'Action', array([-1. , 0.46774941, 0. ]), 'Reward', -0.22527724700693549)
('Episode', 2, 'Step', 1880.0, 'Epsilon', 0.9839966666665618, 'Action', array([ 0.90761395, 0.48025558, 0. ]), 'Reward', -0.8338Waiting for request on port 3101
******* RESTARTING *****
4752383913707)
('Episode', 2, 'Step', 1895.0, 'Epsilon', 0.9839466666665615, 'Action', array([-0.02144435, 0.44598368, 0. ]), 'Reward', -0.28013243503065599)
('Episode', 2, 'Step', 1910.0, 'Epsilon', 0.9838966666665612, 'Action', array([ 0.16616002, 0.50134067, 0. ]), 'Reward', -0.50103101566289854)
('Episode', 2, 'Step', 1925.0, 'Epsilon', 0.9838466666665608, 'Action', array([-0.49128994, 0.49395466, 0. ]), 'Reward', -0.33311254603530949)
('Episode', 2, 'Step', 1940.0, 'Epsilon', 0.9837966666665605, 'Action', array([ 0.92056198, 0.53715188, 0. ]), 'Reward', -0.46733531589318733)
('Episode', 2, 'Step', 1955.0, 'Epsilon', 0.9837466666665602, 'Action', array([-0.8934868, 0.5132811, 0. ]), 'Reward', -0.21834105703880707)
('Episode', 2, 'Step', 1970.0, 'Epsilon', 0.9836966666665599, 'Action', array([ 0.02354248, 0.45561807, 0. ]), 'Reward', -0.26447763116963857)
('Episode', 2, 'Step', 1985.0, 'Epsilon', 0.9836466666665595, 'Action', array([-1. , 0.50411206, 0. ]), 'Reward', -0.19626376204997723)
TOTAL REWARD @ 2-th Episode : Reward -1142.43940635
Total Step: 4920
### TORCS is RELAUNCHED ###
Client connected on 3101..............
Episode : 3 Replay Buffer 4920 Early Stopping: 0 Epsilon: 0.9836 RN: 0.981380822998
('Episode', 3, 'Step', 0.0, 'Epsilon', 0.9835966666665592, 'Action', array([ 1. , 0.54956346, 0. ]), 'Reward', -0.17312116951548964)
('Episode', 3, 'Step', 15.0, 'Epsilon', 0.9835466666665589, 'Action', array([ 0.09009489, 0.4539019 , 0. ]), 'Reward', 13.140864647802481)
('Episode', 3, 'Step', 30.0, 'Epsilon', 0.9834966666665585, 'Action', array([ 1. , 0.48278559, 0. ]), 'Reward', 3.3494604556243779)
('Episode', 3, 'Step', 45.0, 'Epsilon', 0.9834466666665582, 'Action', array([-0.54832819, 0.39027201, 0. ]), 'Reward', -20.371886066206663)
('Episode', 3, 'Step', 60.0, 'Epsilon', 0.9833966666665579, 'Action', array([-0.19762464, 0.59168516, 0. ]), 'Reward', -25.903937504448571)
('Episode', 3, 'Step', 75.0, 'Epsilon', 0.9833466666665576, 'Action', array([ 0.66634547, 0.42169236, 0. ]), 'Reward', 24.033200464167443)
('Episode', 3, 'Step', 90.0, 'Epsilon', 0.9832966666665572, 'Action', array([-0.56473595, 0.34209659, 0.03211617]), 'Reward', 27.681384763169625)
('Episode', 3, 'Step', 105.0, 'Epsilon', 0.9832466666665569, 'Action', array([ 0.32126256, 0.3428289 , 0. ]), 'Reward', -103.10878116223412)
('Episode', 3, 'Step', 120.0, 'Epsilon', 0.9831966666665566, 'Action', array([ 1. , 0.44328625, 0. ]), 'Reward', -0.29469474035070964)
('Episode', 3, 'Step', 135.0, 'Epsilon', 0.9831466666665563, 'Action', array([ 0.16148715, 0.57533318, 0. ]), 'Reward', -0.22143349708893875)
('Episode', 3, 'Step', 150.0, 'Epsilon', 0.9830966666665559, 'Action', array([-0.12912166, 0.50798294, 0. ]), 'Reward', -0.1360947895979229)
('Episode', 3, 'Step', 165.0, 'Epsilon', 0.9830466666665556, 'Action', array([ 1. , 0.47174098, 0. ]), 'Reward', -0.62802071332002629)
('Episode', 3, 'Step', 180.0, 'Epsilon', 0.9829966666665553, 'Action', array([ 0.02921438, 0.65146379, 0. ]), 'Reward', -0.090051197392334525)
('Episode', 3, 'Step', 195.0, 'Epsilon', 0.982946666666555, 'Action', array([-0.22574656, 0.5012917 , 0. ]), 'Reward', 0.043419510672268312)
('Episode', 3, 'Step', 210.0, 'Epsilon', 0.9828966666665546, 'Action', array([ 1. , 0.4946997, 0. ]), 'Reward', 0.31933836642462121)
('Episode', 3, 'Step', 225.0, 'Epsilon', 0.9828466666665543, 'Action', array([ 1. , 0.43223843, 0. ]), 'Reward', 0.0080505903379223809)
('Episode', 3, 'Step', 240.0, 'Epsilon', 0.982796666666554, 'Action', array([ 0.96901082, 0.49249712, 0. ]), 'Reward', -0.40032168678199009)
('Episode', 3, 'Step', 255.0, 'Epsilon', 0.9827466666665536, 'Action', array([ 1. , 0.66763547, 0. ]), 'Reward', -0.19913455560842147)
('Episode', 3, 'Step', 270.0, 'Epsilon', 0.9826966666665533, 'Action', array([ 0.50517964, 0.40501366,
Fuel consumption disabled!
Laptime limit disabled!
Visual Properties Report
------------------------
Compatibility mode, properties unknown.
Waiting for request on port 3101
******* RESTARTING *****
0. ]), 'Reward', -0.63442121909677063)
('Episode', 3, 'Step', 285.0, 'Epsilon', 0.982646666666553, 'Action', array([ 1. , 0.5976473, 0. ]), 'Reward', 0.1059519791456893)
('Episode', 3, 'Step', 300.0, 'Epsilon', 0.9825966666665527, 'Action', array([ 1. , 0.49877776, 0. ]), 'Reward', -0.080760747534275701)
('Episode', 3, 'Step', 315.0, 'Epsilon', 0.9825466666665523, 'Action', array([-1. , 0.50210861, 0. ]), 'Reward', 0.13442696995235459)
('Episode', 3, 'Step', 330.0, 'Epsilon', 0.982496666666552, 'Action', array([-0.55315285, 0.40793026, 0. ]), 'Reward', -0.56073276568670138)
('Episode', 3, 'Step', 345.0, 'Epsilon', 0.9824466666665517, 'Action', array([ 0.40380695, 0.59548998, 0. ]), 'Reward', 0.15747990279313612)
('Episode', 3, 'Step', 360.0, 'Epsilon', 0.9823966666665513, 'Action', array([ 1. , 0.45468452, 0. ]), 'Reward', 0.24097211456325268)
('Episode', 3, 'Step', 375.0, 'Epsilon', 0.982346666666551, 'Action', array([-0.07903306, 0.48454435, 0. ]), 'Reward', -0.8087382883322638)
('Episode', 3, 'Step', 390.0, 'Epsilon', 0.9822966666665507, 'Action', array([ 0.22575579, 0.53038381, 0. ]), 'Reward', 0.1978125970487794)
('Episode', 3, 'Step', 405.0, 'Epsilon', 0.9822466666665504, 'Action', array([ 1. , 0.42931751, 0.01712526]), 'Reward', -0.63216379585908689)
('Episode', 3, 'Step', 420.0, 'Epsilon', 0.98219666666655, 'Action', array([ 0.68944025, 0.58506962, 0. ]), 'Reward', -0.66638125902083556)
('Episode', 3, 'Step', 435.0, 'Epsilon', 0.9821466666665497, 'Action', array([ 1. , 0.43336588, 0. ]), 'Reward', -0.44451484224292731)
('Episode', 3, 'Step', 450.0, 'Epsilon', 0.9820966666665494, 'Action', array([ 0.83334874, 0.50793458, 0. ]), 'Reward', -0.13391611995556307)
('Episode', 3, 'Step', 465.0, 'Epsilon', 0.982046666666549, 'Action', array([ 1. , 0.4134703, 0. ]), 'Reward', 0.090469329140268229)
('Episode', 3, 'Step', 480.0, 'Epsilon', 0.9819966666665487, 'Action', array([ 1. , 0.51059685, 0. ]), 'Reward', -0.70237041725607274)
('Episode', 3, 'Step', 495.0, 'Epsilon', 0.9819466666665484, 'Action', array([-0.36597914, 0.47551735, 0. ]), 'Reward', 0.0083072073403859144)
('Episode', 3, 'Step', 510.0, 'Epsilon', 0.9818966666665481, 'Action', array([-0.16052383, 0.47954686, 0. ]), 'Reward', -0.36697981440966077)
('Episode', 3, 'Step', 525.0, 'Epsilon', 0.9818466666665477, 'Action', array([ 1. , 0.44870638, 0. ]), 'Reward', -0.10879273127409453)
('Episode', 3, 'Step', 540.0, 'Epsilon', 0.9817966666665474, 'Action', array([-0.03634571, 0.45888541, 0. ]), 'Reward', -0.58297451749146667)
('Episode', 3, 'Step', 555.0, 'Epsilon', 0.9817466666665471, 'Action', array([-0.31179622, 0.60376152, 0. ]), 'Reward', -0.33316360201050038)
('Episode', 3, 'Step', 570.0, 'Epsilon', 0.9816966666665468, 'Action', array([-0.92571204, 0.61583892, 0. ]), 'Reward', -1.4286635385773812)
('Episode', 3, 'Step', 585.0, 'Epsilon', 0.9816466666665464, 'Action', array([ 0.26006028, 0.51531583, 0.04389267]), 'Reward', -1.4239050065356702)
('Episode', 3, 'Step', 600.0, 'Epsilon', 0.9815966666665461, 'Action', array([-0.54979587, 0.51220709, 0. ]), 'Reward', -0.63092701335696044)
Terminating because Turned Back
TOTAL REWARD @ 3-th Episode : Reward -673.909722024
Total Step: 5526
Waiting for server on 3101............
Count Down : 5
Client connected on 3101..............
Episode : 4 Replay Buffer 5526 Early Stopping: 0 Epsilon: 0.98158 RN: 0.158244683739
('Episode', 4, 'Step', 9.0, 'Epsilon', 0.9815466666665458, 'Action', array([-1. , 0.41466682, 0. ]), 'Reward', 9.9819926773297833)
('Episode', 4, 'Step', 24.0, 'Epsilon', 0.9814966666665454, 'Action', array([-0.06199954, 0.51899887, 0. ]), 'Reward', -9.9164703141886807)
('Episode', 4, 'Step', 39.0, 'Epsilon', 0.9814466666665451, 'Action', array([ 1. , 0.36209543, 0. ]), 'Reward', 27.613496451365105)
('Episode', 4, 'Step', 54.0, 'Epsilon', 0.9813966666665448, 'Action', array([-1. , 0.47091977, 0. ]), 'Reward', -111.3610142776048)
('Episode', 4, 'Step', 69.0, 'Epsilon', 0.9813466666665445, 'Action', array([-1. , 0.52490289, 0. ]), 'Reward', -0.1077079225812734)
('Episode', 4, 'Step', 84.0, 'Epsilon', 0.9812966666665441, 'Action', array([-0.31360197, 0.50085284, 0. ]), 'Reward', 0.027373249199458011)
('Episode', 4, 'Step', 99.0, 'Epsilon', 0.9812466666665438, 'Action', array([ 0.78644066, 0.66691339, 0. ]), 'Reward', -0.5836201111552779)
('Episode', 4, 'Step', 114.0, 'Epsilon', 0.9811966666665435, 'Action', array([-1. , 0.4347904, 0. ]), 'Reward', -0.68588936735273631)
('Episode', 4, 'Step', 129.0, 'Epsilon', 0.9811466666665432, 'Action', array([ 1. , 0.42121026, 0. ]), 'Reward', 0.066095854494839013)
('Episode', 4, 'Step', 144.0, 'Epsilon', 0.9810966666665428, 'Action', array([-1. , 0.41412474, 0. ]), 'Reward', 0.0066946703059877445)
('Episode', 4, 'Step', 159.0, 'Epsilon', 0.9810466666665425, 'Action', array([-0.59487547, 0.47796122, 0. ]), 'Reward', -0.20957781329114997)
('Episode', 4, 'Step', 174.0, 'Epsilon', 0.9809966666665422, 'Action', array([-1. , 0.46142494, 0. ]), 'Reward', -0.82757176981260694)
('Episode', 4, 'Step', 189.0, 'Epsilon', 0.9809466666665418, 'Action', array([ 0.31172567, 0.23346568, 0. ]), 'Reward', 0.11674748577802901)
('Episode', 4, 'Step', 204.0, 'Epsilon', 0.9808966666665415, 'Action', array([-0.07830573, 0.4068186 , 0. ]), 'Reward', -0.5000705656149983)
('Episode', 4, 'Step', 219.0, 'Epsilon', 0.9808466666665412, 'Action', array([-0.51621367, 0.53577975, 0. ]), 'Reward', -0.21743370052066152)
('Episode', 4, 'Step', 234.0, 'Epsilon', 0.9807966666665409, 'Action', array([ 0.94670993, 0.64080529, 0. ]), 'Reward', -0.45840651929494874)
('Episode', 4, 'Step', 249.0, 'Epsilon', 0.9807466666665405, 'Action', array([ 0.79650715, 0.520876 , 0. ]), 'Reward', -0.60281353453119813)
('Episode', 4, 'Step', 264.0, 'Epsilon', 0.9806966666665402, 'Action', array([-0.87578026, 0.50839947, 0. ]), 'Reward', -0.34502144606834056)
('Episode', 4, 'Step', 279.0, 'Epsilon', 0.9806466666665399, 'Action', array([-0.88356567, 0.61211342, 0.02388654]), 'Reward', -0.4058462861815828)
('Episode', 4, 'Step', 294.0, 'Epsilon', 0.9805966666665396, 'Action', array([-0.47816543, 0.43287186, 0. ]), 'Reward', -0.11516623047317043)
('Episode', 4, 'Step', 309.0, 'Epsilon', 0.9805466666665392, 'Action', array([-0.51902565, 0.4556304 , 0. ]), 'Reward', -0.62161082869651008)
('Episode', 4, 'Step', 324.0, 'Epsilon', 0.9804966666665389, 'Action', array([-0.13081399, 0.36171745, 0. ]), 'Reward', -0.82353787782860521)
('Episode', 4, 'Step', 339.0, 'Epsilon', 0.9804466666665386, 'Action', array([ 0.08199057, 0.51773916, 0. ]), 'Reward', -0.93353830428631512)
('Episode', 4, 'Step', 354.0, 'Epsilon', 0.9803966666665382, 'Action', array([-0.58417564, 0.31946672, 0. ]), 'Reward', -0.063891936478118028)
('Episode', 4, 'Step', 369.0, 'Epsilon', 0.9803466666665379, 'Action', array([-0.46698364, 0.53850999, 0. ]), 'Reward', -0.76036206809405238)
('Episode', 4, 'Step', 384.0, 'Epsilon', 0.9802966666665376, 'Action', array([-0.02766777, 0.58329633, 0. ]), 'Reward', -0.29921637207950963)
('Episode', 4, 'Step', 399.0, 'Epsilon', 0.9802466666665373, 'Action', array([ 0.86084223, 0.49243629, 0. ]), 'Reward', -0.70813614635669464)
('Episode', 4, 'Step', 414.0, 'Epsilon', 0.9801966666665369, 'Action', array([ 0.35386072, 0.47728848, 0. ]), 'Reward', -0.7492530293220061)
('Episode', 4, 'Step', 429.0, 'Epsilon', 0.9801466666665366, 'Action', array([-0.14394912, 0.46595736, 0. ]), 'Reward', -0.61265035223677611)
('Episode', 4, 'Step', 444.0, 'Epsilon', 0.9800966666665363, 'Action', array([-0.65926592, 0.40360366, 0. ]), 'Reward', -0.45580824173155238)
('Episode', 4, 'Step', 459.0, 'Epsilon', 0.980046666666536, 'Action', array([-0.55401011, 0.41618939, 0. ]), 'Reward', -0.20780680029780818)
('Episode', 4, 'Step', 474.0, 'Epsilon', 0.9799966666665356, 'Action', array([ 0.37025717, 0.59878315, 0. ]), 'Reward', -1.0782022217772556)
('Episode', 4, 'Step', 489.0, 'Epsilon', 0.9799466666665353, 'Action', array([-0.59904075, 0.43950679, 0. ]), 'Reward', -0.72368678076925608)
('Episode', 4, 'Step', 504.0, 'Epsilon', 0.979896666666535, 'Action', array([-0.58688552, 0.58733538, 0. ]), 'Reward', -0.77562154055186172)
('Episode', 4, 'Step', 519.0, 'Epsilon', 0.9798466666665346, 'Action', array([ 0.08663786, 0.52872828, 0. ]), 'Reward', -1.2351468182868055)
('Episode', 4, 'Step', 534.0, 'Epsilon', 0.9797966666665343, 'Action', array([ 0.31092438, 0.44731409, 0. ]), 'Reward', -1.0574270982923522)
('Episode', 4, 'Step', 549.0, 'Epsilon', 0.979746666666534, 'Action', array([-0.2207914 , 0.51019746, 0. ]), 'Reward', -0.9650067217942464)
('Episode', 4, 'Step', 564.0, 'Epsilon', 0.9796966666665337, 'Action', array([-0.58394202, 0.55590213, 0. ]), 'Reward', -1.1109219182145071)
('Episode', 4, 'Step', 579.0, 'Epsilon', 0.9796466666665333, 'Action', array([-1. , 0.44499125, 0. ]), 'Reward', -0.50499770701361302)
('Episode', 4, 'Step', 594.0, 'Epsilon', 0.979596666666533, 'Action', array([-0.78787341, 0.48321963, 0. ]), 'Reward', -0.53215364710571911)
('Episode', 4, 'Step', 609.0, 'Epsilon', 0.9795466666665327, 'Action', array([-0.20850708, 0.45309357, 0.03586109]), 'Reward', -0.75136358145674154)
('Episode', 4, 'Step', 624.0, 'Epsilon', 0.9794966666665323, 'Action', array([-0.40478379, 0.33198835, 0. ]), 'Reward', -0.65944396621826606)
('Episode', 4, 'Step', 639.0, 'Epsilon', 0.979446666666532, 'Action', array([-1. , 0.51407867, 0. ]), 'Reward', -1.112679835759621)
('Episode', 4, 'Step', 654.0, 'Epsilon', 0.9793966666665317, 'Action', array([-0.20539301, 0.54455113, 0. ]), 'Reward', -2.4177058024592606)
('Episode', 4, 'Step', 669.0, 'Epsilon', 0.9793466666665314, 'Action', array([ 0.45121031, 0.35023506, 0. ]), 'Reward', -2.6535749443942835)
('Episode', 4, 'Step', 684.0, 'Epsilon', 0.979296666666531, 'Action', array([-0.26907347, 0.54709808, 0. ]), 'Reward', -2.0135948526326639)
('Episode', 4, 'Step', 699.0, 'Epsilon', 0.9792466666665307, 'Action', array([-1. , 0.41640384, 0. ]), 'Reward', -0.88794376829119848)
('Episode', 4, 'Step', 714.0, 'Epsilon', 0.9791966666665304, 'Action', array([-1. , 0.46811307, 0. ]), 'Reward', -1.3028637203843647)
('Episode', 4, 'Step', 729.0, 'Epsilon', 0.97914666666653, 'Action', array([-1. , 0.50543274, 0. ]), 'Reward', -1.5942071620973863)
('Episode', 4, 'Step', 744.0, 'Epsilon', 0.9790966666665297, 'Action', array([-0.64029333, 0.35503565, 0. ]), 'Reward', -1.2354505681069368)
('Episode', 4, 'Step', 759.0, 'Epsilon', 0.9790466666665294, 'Action', array([-1. , 0.5543577, 0. ]), 'Reward', -2.6695382948063529)
('Episode', 4, 'Step', 774.0, 'Epsilon', 0.9789966666665291, 'Action', array([-0.35320731, 0.48026711, 0. ]), 'Reward', -3.4208067610042523)
('Episode', 4, 'Step', 789.0, 'Epsilon', 0.9789466666665287, 'Action', array([-1. , 0.4393465, 0. ]), 'Reward', -2.610455265339747)
('Episode', 4, 'Step', 804.0, 'Epsilon', 0.9788966666665284, 'Action', array([ 0.1093769 , 0.60327388, 0. ]), 'Reward', -3.6877003715436594)
('Episode', 4, 'Step', 819.0, 'Epsilon', 0.9788466666665281, 'Action', array([-0.42904625, 0.45777719, 0. ]), 'Reward', -2.8735362924909378)
('Episode', 4, 'Step', 834.0, 'Epsilon', 0.9787966666665278, 'Action', array([-0.5547464 , 0.60118569, 0. ]), 'Reward', -5.2756310579133183)
('Episode', 4, 'Step', 849.0, 'Epsilon', 0.9787466666665274, 'Action', array([-1. , 0.39057962, 0. ]), 'Reward', -7.6742419885569735)
('Episode', 4, 'Step', 864.0, 'Epsilon', 0.9786966666665271, 'Action', array([-0.4316263 , 0.46892668, 0. ]), 'Reward', -8.9342120101118674)
('Episode', 4, 'Step', 879.0, 'Epsilon', 0.9786466666665268, 'Action', array([ 0.05797573, 0.38900849, 0. ]), 'Reward', -7.848548072657767)
('Episode', 4, 'Step', 894.0, 'Epsilon', 0.9785966666665264, 'Action', array([-0.64434069, 0.59429503, 0. ]), 'Reward', -7.3269521777662625)
('Episode', 4, 'Step', 909.0, 'Epsilon', 0.9785466666665261, 'Action', array([-1. , 0.55019886, 0. ]), 'Reward', -9.8991021025734316)
('Episode', 4, 'Step', 924.0, 'Epsilon', 0.9784966666665258, 'Action', array([-0.42068109, 0.45681841, 0. ]), 'Reward', -18.782437712784471)
('Episode', 4, 'Step', 939.0, 'Epsilon', 0.9784466666665255, 'Action', array([-0.20678446, 0.53079371, 0. ]), 'Reward', -32.295341276663152)
('Episode', 4, 'Step', 954.0, 'Epsilon', 0.9783966666665251, 'Action', array([-0.76215546, 0.38023984, 0. ]), 'Reward', -70.779612843689748)
('Episode', 4, 'Step', 969.0, 'Epsilon', 0.9783466666665248, 'Action', array([-0.36699103, 0.31001791, 0. ]), 'Reward', -69.883372079675226)
('Episode', 4, 'Step', 984.0, 'Epsilon', 0.9782966666665245, 'Action', array([-0.38433214, 0.41042349, 0. ]), 'Reward', -46.402635361983045)
('Episode', 4, 'Step', 999.0, 'Epsilon', 0.9782466666665242, 'Action', array([ 0.57877788, 0.49956984, 0. ]), 'Reward', -115.79165098485689)
('Episode', 4, 'Step', 1014.0, 'Epsilon', 0.9781966666665238, 'Action', array([ 0.41678633, 0.42910908, 0. ]), 'Reward', -0.062949138949759634)
('Episode', 4, 'Step', 1029.0, 'Epsilon', 0.9781466666665235, 'Action', array([-0.48113435, 0.46472486, 0. ]), 'Reward', -0.32036243352506999)
('Episode', 4, 'Step', 1044.0, 'Epsilon', 0.9780966666665232, 'Action', array([-1. , 0.47163834, 0. ]), 'Reward', -0.28340172048664675)
('Episode', 4, 'Step', 1059.0, 'Epsilon', 0.9780466666665228, 'Action', array([ 0.05947766, 0.57121824, 0. ]), 'Reward', -0.26207677625106868)
('Episode', 4, 'Step', 1074.0, 'Epsilon', 0.9779966666665225, 'Action', array([ 0.95847132, 0.43052631, 0. ]), 'Reward', -0.12967024064797161)
('Episode', 4, 'Step', 1089.0, 'Epsilon', 0.9779466666665222, 'Action', array([ 0.86674746, 0.63824956, 0. ]), 'Reward', -0.15397725944642812)
('Episode', 4, 'Step', 1104.0, 'Epsilon', 0.9778966666665219, 'Action', array([ 0.35997161, 0.30008712, 0. ]), 'Reward', -0.068135024446678807)
('Episode', 4, 'Step', 1119.0, 'Epsilon', 0.9778466666665215, 'Action', array([ 0.6257248 , 0.52771542, 0.01406848]), 'Reward', -0.40936590747415136)
('Episode', 4, 'Step', 1134.0, 'Epsilon', 0.9777966666665212, 'Action', array([-1. , 0.42675751, 0.01165007]), 'Reward', -0.2114534054864956)
('Episode', 4, 'Step', 1149.0, 'Epsilon', 0.9777466666665209, 'Action', array([-1. , 0.52790333, 0. ]), 'Reward', -0.19120791034800974)
('Episode', 4, 'Step', 1164.0, 'Epsilon', 0.9776966666665206, 'Action', array([-0.15099529, 0.3978564 , 0. ]), 'Reward', -0.25596952870119194)
('Episode', 4, 'Step', 1179.0, 'Epsilon', 0.9776466666665202, 'Action', array([ 0.59550116, 0.40151631, 0. ]), 'Reward', -0.17252795293270221)
('Episode', 4, 'Step', 1194.0, 'Epsilon', 0.9775966666665199, 'Action', array([-0.54270798, 0.59344107, 0. ]), 'Reward', -0.19815300624401666)
('Episode', 4, 'Step', 1209.0, 'Epsilon', 0.9775466666665196, 'Action', array([-0.47084156, 0.40546321, 0. ]), 'Reward', -0.33940771022847072)
('Episode', 4, 'Step', 1224.0, 'Epsilon', 0.9774966666665192, 'Action', array([ 0.86212941, 0.37000348, 0. ]), 'Reward', -0.12897285345698978)
('Episode', 4, 'Step', 1239.0, 'Epsilon', 0.9774466666665189, 'Action', array([ 0.92540443, 0.47426653, 0. ]), 'Reward', -0.25431803319222002)
('Episode', 4, 'Step', 1254.0, 'Epsilon', 0.9773966666665186, 'Action', array([ 1. , 0.57421506, 0. ]), 'Reward', -0.30569807345986599)
('Episode', 4, 'Step', 1269.0, 'Epsilon', 0.9773466666665183, 'Action', array([ 1. , 0.57345605, 0. ]), 'Reward', -0.45036884999701821)
('Episode', 4, 'Step', 1284.0, 'Epsilon', 0.9772966666665179, 'Action', array([ 0.92919718, 0.56775355, 0. ]), 'Reward', -0.14047308749995963)
('Episode', 4, 'Step', 1299.0, 'Epsilon', 0.9772466666665176, 'Action', array([-0.24040216, 0.49660977, 0. ]), 'Reward', -0.2858283757355467)
('Episode', 4, 'Step', 1314.0, 'Epsilon', 0.9771966666665173, 'Action', array([ 1. , 0.409398, 0. ]), 'Reward', -0.13164675322653913)
('Episode', 4, 'Step', 1329.0, 'Epsilon', 0.977146666666517, 'Action', array([-1. , 0.38568995, 0. ]), 'Reward', -0.2955664809679075)
('Episode', 4, 'Step', 1344.0, 'Epsilon', 0.9770966666665166, 'Action', array([ 0.56683292, 0.54738411, 0. ]), 'Reward', -0.11219496403395512)
('Episode', 4, 'Step', 1359.0, 'Epsilon', 0.9770466666665163, 'Action', array([-0.97645936, 0.46385555, 0. ]), 'Reward', -0.26418226259733246)
('Episode', 4, 'Step', 1374.0, 'Epsilon', 0.976996666666516, 'Action', array([-0.06340879, 0.39847622, 0. ]), 'Reward', -0.12771968679387713)
('Episode', 4, 'Step', 1389.0, 'Epsilon', 0.9769466666665156, 'Action', array([ 1. , 0.28128107, 0. ]), 'Reward', -1.7430545094554253)
('Episode', 4, 'Step', 1404.0, 'Epsilon', 0.9768966666665153, 'Action', array([-1. , 0.37285505, 0. ]), 'Reward', -2.55039407964275)
('Episode', 4, 'Step', 1419.0, 'Epsilon', 0.976846666666515, 'Action', array([-1. , 0.51737203, 0. ]), 'Reward', 0.39623160443596817)
('Episode', 4, 'Step', 1434.0, 'Epsilon', 0.9767966666665147, 'Action', array([-0.58882561, 0.3008818 , 0. ]), 'Reward', -0.050133415684117194)
('Episode', 4, 'Step', 1449.0, 'Epsilon', 0.9767466666665143, 'Action', array([-1. , 0.46803449, 0. ]), 'Reward', -0.33557605510524369)
('Episode', 4, 'Step', 1464.0, 'Epsilon', 0.976696666666514, 'Action', array([-0.0974848 , 0.50700396, 0. ]), 'Reward', -0.21707764191542095)
('Episode', 4, 'Step', 1479.0, 'Epsilon', 0.9766466666665137, 'Action', array([-0.03863792, 0.70016003, 0. ]), 'Reward', -0.36693110350666419)
('Episode', 4, 'Step', 1494.0, 'Epsilon', 0.9765966666665133, 'Action', array([-0.12596531, 0.62482804, 0. ]), 'Reward', -0.37066364845279681)
('Episode', 4, 'Step', 1509.0, 'Epsilon', 0.976546666666513, 'Action', array([-1. , 0.50975382, 0. ]), 'Reward', -0.39803888476318794)
('Episode', 4, 'Step', 1524.0, 'Epsilon', 0.9764966666665127, 'Action', array([-0.43547382, 0.37645756, 0. ]), 'Reward', -0.2591538576179877)
('Episode', 4, 'Step', 1539.0, 'Epsilon', 0.9764466666665124, 'Action', array([-0.33151481, 0.36312057, 0. ]), 'Reward', -0.286628669136753)
('Episode', 4, 'Step', 1554.0, 'Epsilon', 0.976396666666512, 'Action', array([-0.73505275, 0.54529415, 0. ]), 'Reward', -0.33117504328741498)
('Episode', 4, 'Step', 1569.0, 'Epsilon', 0.9763466666665117, 'Action', array([-0.74258541, 0.52591139, 0. ]), 'Reward', -0.37261949730215366)
('Episode', 4, 'Step', 1584.0, 'Epsilon', 0.9762966666665114, 'Action', array([ 0.06577104, 0.39651385, 0.01900151]), 'Reward', -0.30028410151169793)
('Episode', 4, 'Step', 1599.0, 'Epsilon', 0.976246666666511, 'Action', array([ 0.55585417, 0.46677357, 0.00834084]), 'Reward', -0.39950764470745936)
('Episode', 4, 'Step', 1614.0, 'Epsilon', 0.9761966666665107, 'Action', array([ 0.28547063, 0.49431582, 0. ]), 'Reward', -0.37478577818849895)
('Episode', 4, 'Step', 1629.0, 'Epsilon', 0.9761466666665104, 'Action', array([-0.48513116, 0.53567708, 0. ]), 'Reward', -0.37124862980923928)
('Episode', 4, 'Step', 1644.0, 'Epsilon', 0.9760966666665101, 'Action', array([-0.14223149, 0.58111285, 0. ]), 'Reward', -0.34345106122834801)
('Episode', 4, 'Step', 1659.0, 'Epsilon', 0.9760466666665097, 'Action', array([-1. , 0.60846404, 0. ]), 'Reward', -0.33459155416546876)
('Episode', 4, 'Step', 1674.0, 'Epsilon', 0.9759966666665094, 'Action', array([ 0.04749604, 0.49666624, 0. ]), 'Reward', -0.4Waiting for request on port 3101
******* RESTARTING *****
1013557593665489)
('Episode', 4, 'Step', 1689.0, 'Epsilon', 0.9759466666665091, 'Action', array([ 0.51419299, 0.72851485, 0. ]), 'Reward', -1.2814654464219069)
('Episode', 4, 'Step', 1704.0, 'Epsilon', 0.9758966666665088, 'Action', array([-0.46815438, 0.65578222, 0. ]), 'Reward', -0.39149560550815016)
('Episode', 4, 'Step', 1719.0, 'Epsilon', 0.9758466666665084, 'Action', array([ 0.41457411, 0.44416173, 0.01526275]), 'Reward', -0.52551925023310209)
('Episode', 4, 'Step', 1734.0, 'Epsilon', 0.9757966666665081, 'Action', array([ 0.66917001, 0.53415878, 0. ]), 'Reward', -0.7953693280256493)
('Episode', 4, 'Step', 1749.0, 'Epsilon', 0.9757466666665078, 'Action', array([ 0.49957174, 0.28839894, 0. ]), 'Reward', -0.43210223727288632)
('Episode', 4, 'Step', 1764.0, 'Epsilon', 0.9756966666665075, 'Action', array([-0.70514413, 0.44215817, 0. ]), 'Reward', -0.237444874140118)
('Episode', 4, 'Step', 1779.0, 'Epsilon', 0.9756466666665071, 'Action', array([ 0.70886998, 0.37162786, 0.00395482]), 'Reward', -0.66895133586982936)
('Episode', 4, 'Step', 1794.0, 'Epsilon', 0.9755966666665068, 'Action', array([-0.18230993, 0.55655731, 0. ]), 'Reward', -0.60611989909682951)
('Episode', 4, 'Step', 1809.0, 'Epsilon', 0.9755466666665065, 'Action', array([-0.16061396, 0.66604536, 0. ]), 'Reward', -0.63873502248222191)
('Episode', 4, 'Step', 1824.0, 'Epsilon', 0.9754966666665061, 'Action', array([-0.96038168, 0.42203155, 0. ]), 'Reward', -0.54995835009800209)
('Episode', 4, 'Step', 1839.0, 'Epsilon', 0.9754466666665058, 'Action', array([ 0.67508844, 0.62823516, 0. ]), 'Reward', -0.99642105033927431)
('Episode', 4, 'Step', 1854.0, 'Epsilon', 0.9753966666665055, 'Action', array([-0.75072616, 0.38359486, 0. ]), 'Reward', -0.30842109752031233)
('Episode', 4, 'Step', 1869.0, 'Epsilon', 0.9753466666665052, 'Action', array([ 0.38352181, 0.51821043, 0.02079597]), 'Reward', -1.040842438671687)
('Episode', 4, 'Step', 1884.0, 'Epsilon', 0.9752966666665048, 'Action', array([-0.63926996, 0.48944226, 0. ]), 'Reward', -0.44395463993999318)
('Episode', 4, 'Step', 1899.0, 'Epsilon', 0.9752466666665045, 'Action', array([-0.82148813, 0.29297358, 0. ]), 'Reward', -0.2076330679595943)
('Episode', 4, 'Step', 1914.0, 'Epsilon', 0.9751966666665042, 'Action', array([-0.4397864 , 0.50319373, 0. ]), 'Reward', -0.3789414601739205)
('Episode', 4, 'Step', 1929.0, 'Epsilon', 0.9751466666665038, 'Action', array([ 0.31943101, 0.49121185, 0. ]), 'Reward', -1.0514138425744204)
('Episode', 4, 'Step', 1944.0, 'Epsilon', 0.9750966666665035, 'Action', array([-1. , 0.68980696, 0. ]), 'Reward', -1.108065019767182)
('Episode', 4, 'Step', 1959.0, 'Epsilon', 0.9750466666665032, 'Action', array([ 0.46892455, 0.45492565, 0. ]), 'Reward', -1.6418711567034476)
('Episode', 4, 'Step', 1974.0, 'Epsilon', 0.9749966666665029, 'Action', array([ 0.04245005, 0.4034898 , 0. ]), 'Reward', -2.1282370525554972)
('Episode', 4, 'Step', 1989.0, 'Epsilon', 0.9749466666665025, 'Action', array([-1. , 0.43022428, 0.01439218]), 'Reward', -0.87734413325926619)
TOTAL REWARD @ 4-th Episode : Reward -5871.96649828
Total Step: 7526
Waiting for server on 3101............
Count Down : 5
Client connected on 3101..............
Episode : 5 Replay Buffer 7526 Early Stopping: 0 Epsilon: 0.974913333333 RN: 0.587303164698
('Episode', 5, 'Step', 4.0, 'Epsilon', 0.9748966666665022, 'Action', array([-0.96467978, 0.54364478, 0. ]), 'Reward', 5.1491179752151224)
('Episode', 5, 'Step', 19.0, 'Epsilon', 0.9748466666665019, 'Action', array([-0.25536381, 0.4406988 , 0. ]), 'Reward', -1.7485701170422736)
('Episode', 5, 'Step', 34.0, 'Epsilon', 0.9747966666665016, 'Action', array([-0.50879842, 0.48832055, 0. ]), 'Reward', -40.064242948424734)
('Episode', 5, 'Step', 49.0, 'Epsilon', 0.9747466666665012, 'Action', array([-0.74866795, 0.6068589 , 0. ]), 'Reward', -4.6680319744402858)
('Episode', 5, 'Step', 64.0, 'Epsilon', 0.9746966666665009, 'Action', array([-1. , 0.61984164, 0. ]), 'Reward', -11.678199087507805)
('Episode', 5, 'Step', 79.0, 'Epsilon', 0.9746466666665006, 'Action', array([-0.42963964, 0.41655725, 0. ]), 'Reward', -10.00197842311167)
('Episode', 5, 'Step', 94.0, 'Epsilon', 0.9745966666665002, 'Action', array([-0.87640849, 0.32061921, 0. ]), 'Reward', -14.362305985937951)
('Episode', 5, 'Step', 109.0, 'Epsilon', 0.9745466666664999, 'Action', array([ 0.48667756, 0.37765952, 0. ]), 'Reward', -7.7749514576574494)
('Episode', 5, 'Step', 124.0, 'Epsilon', 0.9744966666664996, 'Action', array([-1. , 0.32913482, 0. ]), 'Reward', -3.1840994831587013)
('Episode', 5, 'Step', 139.0, 'Epsilon', 0.9744466666664993, 'Action', array([-0.23014576, 0.4823125 , 0. ]), 'Reward', -4.7850912154632912)
('Episode', 5, 'Step', 154.0, 'Epsilon', 0.9743966666664989, 'Action', array([-0.84829149, 0.50914758, 0. ]), 'Reward', -3.3234276596374093)
('Episode', 5, 'Step', 169.0, 'Epsilon', 0.9743466666664986, 'Action', array([-0.58439793, 0.55534532, 0. ]), 'Reward', -4.2645465455112426)
('Episode', 5, 'Step', 184.0, 'Epsilon', 0.9742966666664983, 'Action', array([ 0.00087654, 0.50671486, 0. ]), 'Reward', -3.1181441747785739)
('Episode', 5, 'Step', 199.0, 'Epsilon', 0.974246666666498, 'Action', array([-0.50097945, 0.37256953, 0. ]), 'Reward', -1.5477610134473578)
('Episode', 5, 'Step', 214.0, 'Epsilon', 0.9741966666664976, 'Action', array([ 0.44899646, 0.61223953, 0. ]), 'Reward', -4.8965337107425579)
('Episode', 5, 'Step', 229.0, 'Epsilon', 0.9741466666664973, 'Action', array([ 0.22196971, 0.43474381, 0. ]), 'Reward', -3.5278617157126115)
('Episode', 5, 'Step', 244.0, 'Epsilon', 0.974096666666497, 'Action', array([-0.77870464, 0.38632014, 0. ]), 'Reward', -2.2168960263841475)
('Episode', 5, 'Step', 259.0, 'Epsilon', 0.9740466666664966, 'Action', array([-0.16417254, 0.62515249, 0. ]), 'Reward', -5.4276802242289914)
('Episode', 5, 'Step', 274.0, 'Epsilon', 0.9739966666664963, 'Action', array([ 0.56964009, 0.70677657, 0. ]), 'Reward', -13.628396297042556)
('Episode', 5, 'Step', 289.0, 'Epsilon', 0.973946666666496, 'Action', array([-0.14149692, 0.18509324, 0. ]), 'Reward', -41.071938067416596)
('Episode', 5, 'Step', 304.0, 'Epsilon', 0.9738966666664957, 'Action', array([-0.54738189, 0.46397704, 0. ]), 'Reward', -42.794114630661454)
('Episode', 5, 'Step', 319.0, 'Epsilon', 0.9738466666664953, 'Action', array([-1. , 0.49580227, 0. ]), 'Reward', -28.641465804110492)
('Episode', 5, 'Step', 334.0, 'Epsilon', 0.973796666666495, 'Action', array([-0.07976349, 0.43530082, 0. ]), 'Reward', -15.214987525188921)
('Episode', 5, 'Step', 349.0, 'Epsilon', 0.9737466666664947, 'Action', array([-0.12557296, 0.2984005 , 0. ]), 'Reward', -8.4175753545572682)
('Episode', 5, 'Step', 364.0, 'Epsilon', 0.9736966666664943, 'Action', array([-1. , 0.41887175, 0. ]), 'Reward', -7.2346277037347075)
('Episode', 5, 'Step', 379.0, 'Epsilon', 0.973646666666494, 'Action', array([-1. , 0.43504912, 0. ]), 'Reward', -15.142664448483886)
('Episode', 5, 'Step', 394.0, 'Epsilon', 0.9735966666664937, 'Action', array([-1. , 0.43834705, 0. ]), 'Reward', -10.666921277270999)
('Episode', 5, 'Step', 409.0, 'Epsilon', 0.9735466666664934, 'Action', array([ 0.1965397 , 0.42188085, 0. ]), 'Reward', -16.828641748370142)
('Episode', 5, 'Step', 424.0, 'Epsilon', 0.973496666666493, 'Action', array([-0.79034357, 0.45497087, 0. ]), 'Reward', -22.88077235471259)
('Episode', 5, 'Step', 439.0, 'Epsilon', 0.9734466666664927, 'Action', array([-0.86736529, 0.47403144, 0. ]), 'Reward', -20.884718082532078)
('Episode', 5, 'Step', 454.0, 'Epsilon', 0.9733966666664924, 'Action', array([-1. , 0.41565061, 0. ]), 'Reward', -42.073325368226392)
('Episode', 5, 'Step', 469.0, 'Epsilon', 0.973346666666492, 'Action', array([-0.6271833 , 0.46950489, 0. ]), 'Reward', -65.300381478650095)
('Episode', 5, 'Step', 484.0, 'Epsilon', 0.9732966666664917, 'Action', array([-1. , 0.53636153, 0. ]), 'Reward', -40.657043130067443)
('Episode', 5, 'Step', 499.0, 'Epsilon', 0.9732466666664914, 'Action', array([-1. , 0.48921308, 0. ]), 'Reward', -103.44167785359875)
('Episode', 5, 'Step', 514.0, 'Epsilon', 0.9731966666664911, 'Action', array([ 0.03325307, 0.50686972, 0. ]), 'Reward', -1.0236085516352729)
('Episode', 5, 'Step', 529.0, 'Epsilon', 0.9731466666664907, 'Action', array([ 0.62403497, 0.51799943, 0.0193695 ]), 'Reward', -0.45720639300866667)
('Episode', 5, 'Step', 544.0, 'Epsilon', 0.9730966666664904, 'Action', array([ 0.49687651, 0.59922317, 0. ]), 'Reward', -0.83620689655085112)
('Episode', 5, 'Step', 559.0, 'Epsilon', 0.9730466666664901, 'Action', array([ 1. , 0.37587716, 0. ]), 'Reward', -0.83867342747946194)
('Episode', 5, 'Step', 574.0, 'Epsilon', 0.9729966666664898, 'Action', array([ 0.3854111 , 0.58583477, 0. ]), 'Reward', -1.5285163310288499)
('Episode', 5, 'Step', 589.0, 'Epsilon', 0.9729466666664894, 'Action', array([ 0.82693256, 0.31751008, 0. ]), 'Reward', -0.75682600136308409)
('Episode', 5, 'Step', 604.0, 'Epsilon', 0.9728966666664891, 'Action', array([ 0.70124447, 0.36426185, 0.01981027]), 'Reward', -0.36531444100070054)
('Episode', 5, 'Step', 619.0, 'Epsilon', 0.9728466666664888, 'Action', array([ 1. , 0.55776404, 0. ]), 'Reward', -1.7689229666395301)
('Episode', 5, 'Step', 634.0, 'Epsilon', 0.9727966666664885, 'Action', array([ 0.19833181, 0.45649835, 0. ]), 'Reward', -2.0508495952679153)
('Episode', 5, 'Step', 649.0, 'Epsilon', 0.9727466666664881, 'Action', array([-0.79166244, 0.40120033, 0. ]), 'Reward', -1.3699152172457285)
('Episode', 5, 'Step', 664.0, 'Epsilon', 0.9726966666664878, 'Action', array([ 0.26012158, 0.48278466, 0. ]), 'Reward', -1.8289055743803897)
('Episode', 5, 'Step', 679.0, 'Epsilon', 0.9726466666664875, 'Action', array([ 0.30762589, 0.50124435, 0. ]), 'Reward', -1.5742945576006484)
('Episode', 5, 'Step', 694.0, 'Epsilon', 0.9725966666664871, 'Action', array([-1. , 0.51641516, 0. ]), 'Reward', -4.3889447530642327)
('Episode', 5, 'Step', 709.0, 'Epsilon', 0.9725466666664868, 'Action', array([ 1. , 0.45612511, 0. ]), 'Reward', -1.9999282627017732)
('Episode', 5, 'Step', 724.0, 'Epsilon', 0.9724966666664865, 'Action', array([ 0.88457624, 0.63214866, 0. ]), 'Reward', -1.8356432029436076)
('Episode', 5, 'Step', 739.0, 'Epsilon', 0.9724466666664862, 'Action', array([ 0.21641477, 0.4518931 , 0. ]), 'Reward', -0.72446781207129129)
('Episode', 5, 'Step', 754.0, 'Epsilon', 0.9723966666664858, 'Action', array([-0.14672155, 0.39699864, 0. ]), 'Reward', -0.64219143937493683)
('Episode', 5, 'Step', 769.0, 'Epsilon', 0.9723466666664855, 'Action', array([ 1. , 0.49628791, 0. ]), 'Reward', -0.18630272194813882)
('Episode', 5, 'Step', 784.0, 'Epsilon', 0.9722966666664852, 'Action', array([ 0.08174302, 0.61920829, 0. ]), 'Reward', -0.64217794676265416)
('Episode', 5, 'Step', 799.0, 'Epsilon', 0.9722466666664848, 'Action', array([-0.48940658, 0.51595547, 0. ]), 'Reward', -0.10579832110207713)
('Episode', 5, 'Step', 814.0, 'Epsilon', 0.9721966666664845, 'Action', array([ 1. , 0.40804627, 0. ]), 'Reward', -0.58945929607485392)
('Episode', 5, 'Step', 829.0, 'Epsilon', 0.9721466666664842, 'Action', array([ 0.86273564, 0.33259649, 0. ]), 'Reward', -0.10929013848626726)
('Episode', 5, 'Step', 844.0, 'Epsilon', 0.9720966666664839, 'Action', array([ 0.41335423, 0.45342767, 0. ]), 'Reward', -0.79822393688401561)
('Episode', 5, 'Step', 859.0, 'Epsilon', 0.9720466666664835, 'Action', array([-0.07739368, 0.49448803, 0. ]), 'Reward', -0.092397445203755563)
('Episode', 5, 'Step', 874.0, 'Epsilon', 0.9719966666664832, 'Action', array([ 0.05326231, 0.43674468, 0. ]), 'Reward', -0.95607552182044475)
('Episode', 5, 'Step', 889.0, 'Epsilon', 0.9719466666664829, 'Action', array([ 0.01756711, 0.42521155, 0. ]), 'Reward', -0.72398855147950203)
('Episode', 5, 'Step', 904.0, 'Epsilon', 0.9718966666664826, 'Action', array([ 0.60526062, 0.5967067 , 0. ]), 'Reward', -0.91175501404122627)
('Episode', 5, 'Step', 919.0, 'Epsilon', 0.9718466666664822, 'Action', array([ 0.01197471, 0.41372556, 0. ]), 'Reward', -0.93975726786476566)
('Episode', 5, 'Step', 934.0, 'Epsilon', 0.9717966666664819, 'Action', array([ 0.40089678, 0.58620752, 0. ]), 'Reward', -1.4146338658623323)
('Episode', 5, 'Step', 949.0, 'Epsilon', 0.9717466666664816, 'Action', array([ 1. , 0.54889817, 0. ]), 'Reward', -0.93185901164344154)
('Episode', 5, 'Step', 964.0, 'Epsilon', 0.9716966666664812, 'Action', array([ 0.70944774, 0.60153976, 0. ]), 'Reward', -1.1395191573596026)
('Episode', 5, 'Step', 979.0, 'Epsilon', 0.9716466666664809, 'Action', array([-0.33881893, 0.36766304, 0. ]), 'Reward', -1.0927756922260401)
('Episode', 5, 'Step', 994.0, 'Epsilon', 0.9715966666664806, 'Action', array([-0.19308828, 0.52705687, 0. ]), 'Reward', -1.3156772952438902)
('Episode', 5, 'Step', 1009.0, 'Epsilon', 0.9715466666664803, 'Action', array([ 0.31818009, 0.54488802, 0. ]), 'Reward', -1.2879103004188341)
('Episode', 5, 'Step', 1024.0, 'Epsilon', 0.9714966666664799, 'Action', array([-1. , 0.50536963, 0. ]), 'Reward', -3.491086706230274)
('Episode', 5, 'Step', 1039.0, 'Epsilon', 0.9714466666664796, 'Action', array([ 0.54991217, 0.47536412, 0. ]), 'Reward', -1.1803078801146705)
('Episode', 5, 'Step', 1054.0, 'Epsilon', 0.9713966666664793, 'Action', array([-0.11096922, 0.52415206, 0. ]), 'Reward', -2.9103972401801421)
('Episode', 5, 'Step', 1069.0, 'Epsilon', 0.971346666666479, 'Action', array([ 0.36543824, 0.53860045, 0. ]), 'Reward', -1.6990100651580127)
('Episode', 5, 'Step', 1084.0, 'Epsilon', 0.9712966666664786, 'Action', array([ 0.41914628, 0.53104398, 0. ]), 'Reward', -3.4268706667672393)
('Episode', 5, 'Step', 1099.0, 'Epsilon', 0.9712466666664783, 'Action', array([ 0.31798583, 0.35483789, 0. ]), 'Reward', -1.5671454890046883)
('Episode', 5, 'Step', 1114.0, 'Epsilon', 0.971196666666478, 'Action', array([ 0.30205444, 0.35322234, 0. ]), 'Reward', -1.6497663391044357)
('Episode', 5, 'Step', 1129.0, 'Epsilon', 0.9711466666664776, 'Action', array([ 1. , 0.47049111, 0. ]), 'Reward', -1.3182020218581167)
('Episode', 5, 'Step', 1144.0, 'Epsilon', 0.9710966666664773, 'Action', array([ 0.03253665, 0.41913645, 0.07461839]), 'Reward', -1.6323833072601901)
('Episode', 5, 'Step', 1159.0, 'Epsilon', 0.971046666666477, 'Action', array([ 0.57624471, 0.66234136, 0. ]), 'Reward', -2.8732318877196867)
('Episode', 5, 'Step', 1174.0, 'Epsilon', 0.9709966666664767, 'Action', array([ 1. , 0.26561766, 0.00555467]), 'Reward', -0.7719302771984593)
('Episode', 5, 'Step', 1189.0, 'Epsilon', 0.9709466666664763, 'Action', array([-0.66046534, 0.47173273, 0. ]), 'Reward', -1.9291468147176984)
('Episode', 5, 'Step', 1204.0, 'Epsilon', 0.970896666666476, 'Action', array([-0.46900336, 0.2409656 , 0. ]), 'Reward', -5.0262754914377386)
('Episode', 5, 'Step', 1219.0, 'Epsilon', 0.9708466666664757, 'Action', array([ 0.30486844, 0.50393026, 0. ]), 'Reward', -0.38306159975639675)
('Episode', 5, 'Step', 1234.0, 'Epsilon', 0.9707966666664753, 'Action', array([-0.22301726, 0.34048265, 0. ]), 'Reward', -0.14411479199516339)
('Episode', 5, 'Step', 1249.0, 'Epsilon', 0.970746666666475, 'Action', array([-1. , 0.48316149, 0. ]), 'Reward', -0.42413606546189614)
('Episode', 5, 'Step', 1264.0, 'Epsilon', 0.9706966666664747, 'Action', array([-0.31920881, 0.32718674, 0. ]), 'Reward', -0.29856372422577526)
('Episode', 5, 'Step', 1279.0, 'Epsilon', 0.9706466666664744, 'Action', array([-0.01631069, 0.43725201, 0. ]), 'Reward', -0.34666114046574181)
('Episode', 5, 'Step', 1294.0, 'Epsilon', 0.970596666666474, 'Action', array([-0.92755448, 0.38677906, 0. ]), 'Reward', -0.1803229572387538)
('Episode', 5, 'Step', 1309.0, 'Epsilon', 0.9705466666664737, 'Action', array([-1. , 0.43297693, 0. ]), 'Reward', -0.13160196406459607)
('Episode', 5, 'Step', 1324.0, 'Epsilon', 0.9704966666664734, 'Action', array([ 0.86170961, 0.47669969, 0. ]), 'Reward', -0.63299701325827185)
('Episode', 5, 'Step', 1339.0, 'Epsilon', 0.9704466666664731, 'Action', array([-0.78345359, 0.53659749, 0. ]), 'Reward', -0.23390147943786196)
('Episode', 5, 'Step', 1354.0, 'Epsilon', 0.9703966666664727, 'Action', array([-1. , 0.52127521, 0. ]), 'Reward', -0.23426336944108556)
('Episode', 5, 'Step', 1369.0, 'Epsilon', 0.9703466666664724, 'Action', array([ 0.196183 , 0.38335122, 0. ]), 'Reward', -0.27675709966121365)
('Episode', 5, 'Step', 1384.0, 'Epsilon', 0.9702966666664721, 'Action', array([-1. , 0.51938387, 0.00387955]), 'Reward', -0.22712567489046331)
('Episode', 5, 'Step', 1399.0, 'Epsilon', 0.9702466666664717, 'Action', array([-1. , 0.36709996, 0. ]), 'Reward', -0.30429571039712022)
('Episode', 5, 'Step', 1414.0, 'Epsilon', 0.9701966666664714, 'Action', array([-0.08377641, 0.47007125, 0. ]), 'Reward', -0.66569973957252171)
('Episode', 5, 'Step', 1429.0, 'Epsilon', 0.9701466666664711, 'Action', array([-0.09257858, 0.4745668 , 0. ]), 'Reward', -0.44783860408438936)
('Episode', 5, 'Step', 1444.0, 'Epsilon', 0.9700966666664708, 'Action', array([-0.27715451, 0.44309225, 0.01719579]), 'Reward', -0.34260243262443246)
('Episode', 5, 'Step', 1459.0, 'Epsilon', 0.9700466666664704, 'Action', array([-1. , 0.50595108, 0. ]), 'Reward', -0.32689071352054877)
('Episode', 5, 'Step', 1474.0, 'Epsilon', 0.9699966666664701, 'Action', array([ 0.02966928, 0.64938885, 0. ]), 'Reward', -1.0547843108278754)
('Episode', 5, 'Step', 1489.0, 'Epsilon', 0.9699466666664698, 'Action', array([ 0.22856284, 0.6003991 , 0. ]), 'Reward', -1.0387045207194578)
('Episode', 5, 'Step', 1504.0, 'Epsilon', 0.9698966666664695, 'Action', array([-1. , 0.39377476, 0. ]), 'Reward', -0.49143536155460588)
('Episode', 5, 'Step', 1519.0, 'Epsilon', 0.9698466666664691, 'Action', array([-1. , 0.43145824, 0. ]), 'Reward', -0.34150181893207443)
('Episode', 5, 'Step', 1534.0, 'Epsilon', 0.9697966666664688, 'Action', array([-1. , 0.44553892, 0. ]), 'Reward', -0.36275303509145002)
('Episode', 5, 'Step', 1549.0, 'Epsilon', 0.9697466666664685, 'Action', array([-0.73179166, 0.20101934, 0. ]), 'Reward', -0.13812469213325948)
('Episode', 5, 'Step', 1564.0, 'Epsilon', 0.9696966666664681, 'Action', array([-0.40163716, 0.47940506, 0. ]), 'Reward', -0.39197005473531654)
('Episode', 5, 'Step', 1579.0, 'Epsilon', 0.9696466666664678, 'Action', array([-1. , 0.42460123, 0. ]), 'Reward', -0.26966764468814725)
('Episode', 5, 'Step', 1594.0, 'Epsilon', 0.9695966666664675, 'Action', array([-0.09863815, 0.5779727 , 0. ]), 'Reward', -0.73582426438968485)
('Episode', 5, 'Step', 1609.0, 'Epsilon', 0.9695466666664672, 'Action', array([-0.31342228, 0.43471324, 0. ]), 'Reward', -0.33003556213111623)
('Episode', 5, 'Step', 1624.0, 'Epsilon', 0.9694966666664668, 'Action', array([-1. , 0.58358689, 0. ]), 'Reward', -0.54421014856293204)
('Episode', 5, 'Step', 1639.0, 'Epsilon', 0.9694466666664665, 'Action', array([ 0.28719676, 0.41456827, 0. ]), 'Reward', -0.60180485917713034)
('Episode', 5, 'Step', 1654.0, 'Epsilon', 0.9693966666664662, 'Action', array([ 0.16220117, 0.4044741 , 0. ]), 'Reward', -1.836511806939547)
('Episode', 5, 'Step', 1669.0, 'Epsilon', 0.9693466666664659, 'Action', array([-0.64349927, 0.43629611, 0. ]), 'Reward', -0.86770060063630794)
('Episode', 5, 'Step', 1684.0, 'Epsilon', 0.9692966666664655, 'Action', array([-0.48181309, 0.64065058, 0.0110835 ]), 'Reward', -4.3374228055856126)
('Episode'Waiting for request on port 3101
******* RESTARTING *****
, 5, 'Step', 1699.0, 'Epsilon', 0.9692466666664652, 'Action', array([-1. , 0.46783983, 0. ]), 'Reward', -2.8985601080377563)
('Episode', 5, 'Step', 1714.0, 'Epsilon', 0.9691966666664649, 'Action', array([-1. , 0.72114107, 0. ]), 'Reward', -5.6901256051031481)
('Episode', 5, 'Step', 1729.0, 'Epsilon', 0.9691466666664645, 'Action', array([ 0.05993269, 0.6009537 , 0. ]), 'Reward', -1)
('Episode', 5, 'Step', 1744.0, 'Epsilon', 0.9690966666664642, 'Action', array([ 0.65710536, 0.52279632, 0. ]), 'Reward', -0.94041178370920719)
('Episode', 5, 'Step', 1759.0, 'Epsilon', 0.9690466666664639, 'Action', array([-0.14240071, 0.53860314, 0. ]), 'Reward', -0.43216716386548604)
('Episode', 5, 'Step', 1774.0, 'Epsilon', 0.9689966666664636, 'Action', array([ 0.07237955, 0.50393743, 0. ]), 'Reward', -0.27438837199374627)
('Episode', 5, 'Step', 1789.0, 'Epsilon', 0.9689466666664632, 'Action', array([ 0.28397237, 0.41151277, 0.01054853]), 'Reward', -0.2851774314525829)
('Episode', 5, 'Step', 1804.0, 'Epsilon', 0.9688966666664629, 'Action', array([ 0.48852715, 0.43759496, 0. ]), 'Reward', -0.38846068079784041)
('Episode', 5, 'Step', 1819.0, 'Epsilon', 0.9688466666664626, 'Action', array([-1. , 0.3541882, 0. ]), 'Reward', -0.19430400532708689)
('Episode', 5, 'Step', 1834.0, 'Epsilon', 0.9687966666664622, 'Action', array([ 0.02008634, 0.58985617, 0. ]), 'Reward', -0.38723973341438733)
('Episode', 5, 'Step', 1849.0, 'Epsilon', 0.9687466666664619, 'Action', array([ 0.0651333 , 0.62501177, 0. ]), 'Reward', -0.54811737716942899)
('Episode', 5, 'Step', 1864.0, 'Epsilon', 0.9686966666664616, 'Action', array([ 0.38423414, 0.41776543, 0. ]), 'Reward', -0.4987708507229065)
('Episode', 5, 'Step', 1879.0, 'Epsilon', 0.9686466666664613, 'Action', array([ 0.16808162, 0.44408579, 0. ]), 'Reward', -0.37093233683243299)
('Episode', 5, 'Step', 1894.0, 'Epsilon', 0.9685966666664609, 'Action', array([-1. , 0.52758461, 0. ]), 'Reward', -0.30550952319208824)
('Episode', 5, 'Step', 1909.0, 'Epsilon', 0.9685466666664606, 'Action', array([ 0.15691841, 0.59203375, 0. ]), 'Reward', -0.38970013863188846)
('Episode', 5, 'Step', 1924.0, 'Epsilon', 0.9684966666664603, 'Action', array([-0.42652431, 0.47653803, 0. ]), 'Reward', -0.29552970559992775)
('Episode', 5, 'Step', 1939.0, 'Epsilon', 0.96844666666646, 'Action', array([-1. , 0.41505223, 0.02216953]), 'Reward', -0.09130685785044633)
('Episode', 5, 'Step', 1954.0, 'Epsilon', 0.9683966666664596, 'Action', array([-0.84735165, 0.39039483, 0. ]), 'Reward', -0.1491095240114596)
('Episode', 5, 'Step', 1969.0, 'Epsilon', 0.9683466666664593, 'Action', array([ 0.49301051, 0.42518305, 0. ]), 'Reward', -0.38064999602604077)
('Episode', 5, 'Step', 1984.0, 'Epsilon', 0.968296666666459, 'Action', array([ 0.3983997 , 0.48417584, 0. ]), 'Reward', -0.51197288429640331)
('Episode', 5, 'Step', 1999.0, 'Epsilon', 0.9682466666664586, 'Action', array([-0.05153783, 0.40412834, 0. ]), 'Reward', -0.35447706602071799)
TOTAL REWARD @ 5-th Episode : Reward -10532.7389575
Total Step: 9526
### TORCS is RELAUNCHED ###
Client connected on 3101..............
Episode : 6 Replay Buffer 9526 Early Stopping: 0 Epsilon: 0.968246666666 RN: 0.337942408009
('Episode', 6, 'Step', 14.0, 'Epsilon', 0.9681966666664583, 'Action', array([ 0.56695546, 0.53707546, 0. ]), 'Reward', 7.229529076207915)
('Episode', 6, 'Step', 29.0, 'Epsilon', 0.968146666666458, 'Action', array([ 0.1566624 , 0.43671694, 0. ]), 'Reward', -72.007395843852308)
('Episode', 6, 'Step', 44.0, 'Epsilon', 0.9680966666664577, 'Action', array([-0.18358633, 0.58836417, 0. ]), 'Reward', -96.740772196165352)
('Episode', 6, 'Step', 59.0, 'Epsilon', 0.9680466666664573, 'Action', array([-0.40259632, 0.50175894, 0. ]), 'Reward', -90.507618102885971)
('Episode', 6, 'Step', 74.0, 'Epsilon', 0.967996666666457, 'Action', array([-1. , 0.51725817, 0. ]), 'Reward', -95.552797086126731)
('Episode', 6, 'Step', 89.0, 'Epsilon', 0.9679466666664567, 'Action', array([-0.3805397 , 0.61343807, 0. ]), 'Reward', -96.591459040415771)
('Episode', 6, 'Step', 104.0, 'Epsilon', 0.9678966666664564, 'Action', array([-1. , 0.51016492, 0.02234666]), 'Reward', -67.690275097090336)
('Episode', 6, 'Step', 119.0, 'Epsilon', 0.967846666666456, 'Action', array([ 0.19503368, 0.56680462, 0. ]), 'Reward', -19.964715439986826)
('Episode', 6, 'Step', 134.0, 'Epsilon', 0.9677966666664557, 'Action', array([ 0.49300363, 0.49437201, 0. ]), 'Reward', -1)
('Episode', 6, 'Step', 149.0, 'Epsilon', 0.9677466666664554, 'Action', array([-0.76824034, 0.46781558, 0. ]), 'Reward', -4.1806817228484654)
('Episode', 6, 'Step', 164.0, 'Epsilon', 0.967696666666455, 'Action', array([ 0.07481461, 0.46082133, 0. ]), 'Reward', -2.4417363640084693)
('Episode', 6, 'Step', 179.0, 'Epsilon', 0.9676466666664547, 'Action', array([-0.32021001, 0.66241168, 0. ]), 'Reward', -5.8709897984283153)
('Episode', 6, 'Step', 194.0, 'Epsilon', 0.9675966666664544, 'Action', array([-0.33948714, 0.6059091 , 0. ]), 'Reward', -5.4242925915017661)
('Episode', 6, 'Step', 209.0, 'Epsilon', 0.9675466666664541, 'Action', array([ 1. , 0.43296697, 0.00500557]), 'Reward', -1.4064075829703064)
('Episode', 6, 'Step', 224.0, 'Epsilon', 0.9674966666664537, 'Action', array([-0.59202438, 0.54764078, 0. ]), 'Reward', -6.9288207240626756)
('Episode', 6, 'Step', 239.0, 'Epsilon', 0.9674466666664534, 'Action', array([ 0.95654888, 0.50894858, 0. ]), 'Reward', -1.7269176862585822)
('Episode', 6, 'Step', 254.0, 'Epsilon', 0.9673966666664531, 'Action', array([-0.59319356, 0.48393428, 0. ]), 'Reward', -0.35136518056729737)
('Episode', 6, 'Step', 269.0, 'Epsilon', 0.9673466666664527, 'Action', array([-1. , 0.51639969, 0.01397991]), 'Reward', -0.76357434660147505)
('Episode', 6, 'Step', 284.0, 'Epsilon', 0.9672966666664524, 'Action', array([ 0.06894456, 0.54995559, 0. ]), 'Reward', -0.47052609720969907)
('Episode', 6, 'Step', 299.0, 'Epsilon', 0.9672466666664521, 'Action', array([ 0.90979203, 0.49174482, 0. ]), 'Reward', -0.64979774556457337)
('Episode', 6, 'Step', 314.0, 'Epsilon', 0.9671966666664518, 'Action', array([-0.48287663, 0.3460518 , 0. ]), 'Reward', -0.34580212329700866)
('Episode', 6, 'Step', 329.0, 'Epsilon', 0.9671466666664514, 'Action', array([ 0.66096661, 0.4739966 , 0. ]), 'Reward', -0.87924594782163534)
('Episode', 6, 'Step', 344.0, 'Epsilon', 0.9670966666664511, 'Action', array([ 1. , 0.47194962, 0. ]), 'Reward', -0.61204422392206514)
('Episode', 6, 'Step', 359.0, 'Epsilon', 0.9670466666664508, 'Action', array([-0.62174796, 0.6310072 , 0.00458957]), 'Reward', -1.3343055641302266)
('Episode', 6, 'Step', 374.0, 'Epsilon', 0.9669966666664505, 'Action', array([ 1. , 0.70374349, 0. ]), 'Reward', -1.0541837942413288)
('Episode', 6, 'Step', 389.0, 'Epsilon', 0.9669466666664501, 'Action', array([ 0.10044916, 0.27034353, 0. ]), 'Reward', -0.73794371654009849)
('Episode', 6, 'Step', 404.0, 'Epsilon', 0.9668966666664498, 'Action', array([ 1. , 0.55786089, 0. ]), 'Reward', -0.87996093895692051)
('Episode', 6, 'Step', 419.0, 'Epsilon', 0.9668466666664495, 'Action', array([ 1. , 0.43070582, 0.02038361]), 'Reward', -0.75533322314782714)
('Episode', 6, 'Step', 434.0, 'Epsilon', 0.9667966666664491, 'Action', array([ 0.04629152, 0.4234644 , 0. ]), 'Reward', -0.67170673224130018)
('Episode', 6, 'Step', 449.0, 'Epsilon', 0.9667466666664488, 'Action', array([ 1. , 0.57642585, 0. ]), 'Reward', -1.0614264203675452)
('Episode', 6, 'Step', 464.0, 'Epsilon', 0.9666966666664485, 'Action', array([-0.1157202 , 0.38468101, 0. ]), 'Reward', -0.77851606286736619)
('Episode', 6, 'Step', 479.0, 'Epsilon', 0.9666466666664482, 'Action', array([-0.69375265, 0.58394089, 0. ]), 'Reward', -2.4160424726863416)
('Episode', 6, 'Step', 494.0, 'Epsilon', 0.9665966666664478, 'Action', array([-0.37089375, 0.55131777, 0. ]), 'Reward', -1.7021800135657754)
('Episode', 6, 'Step', 509.0, 'Epsilon', 0.9665466666664475, 'Action', array([-1. , 0.47120476, 0. ]), 'Reward', -3.0075964558855612)
('Episode', 6, 'Step', 524.0, 'Epsilon', 0.9664966666664472, 'Action', array([-0.52195412, 0.5576066 , 0. ]), 'Reward', -2.5532318486137657)
('Episode', 6, 'Step', 539.0, 'Epsilon', 0.9664466666664469, 'Action', array([-0.39014917, 0.32555939, 0.03135493]), 'Reward', -2.3203721915872899)
('Episode', 6, 'Step', 554.0, 'Epsilon', 0.9663966666664465, 'Action', array([ 1. , 0.44361933, 0. ]), 'Reward', -1.0715082430558247)
('Episode', 6, 'Step', 569.0, 'Epsilon', 0.9663466666664462, 'Action', array([ 0.86718254, 0.19772527, 0. ]), 'Reward', -0.48325335444343831)
('Episode', 6, 'Step', 584.0, 'Epsilon', 0.9662966666664459, 'Action', array([ 0.53736823, 0.64876699, 0. ]), 'Reward', -2.2195526118333637)
('Episode', 6, 'Step', 599.0, 'Epsilon', 0.9662466666664455, 'Action', array([ 1. , 0.53433691, 0. ]), 'Reward', -1.5167270630141261)
('Episode', 6, 'Step', 614.0, 'Epsilon', 0.9661966666664452, 'Action', array([ 1. , 0.2592347, 0. ]), 'Reward', -0.33648663673213342)
('Episode', 6, 'Step', 629.0, 'Epsilon', 0.9661466666664449, 'Action', array([ 0.73766562, 0.46031162, 0. ]), 'Reward', -0.83908367826229013)
('Episode', 6, 'Step', 644.0, 'Epsilon', 0.9660966666664446, 'Action', array([ 1. , 0.57434126, 0. ]), 'Reward', -1.2020268345521075)
('Episode', 6, 'Step', 659.0, 'Epsilon', 0.9660466666664442, 'Action', array([ 0.38869103, 0.44906787, 0. ]), 'Reward', -1.9274528735915331)
('Episode', 6, 'Step', 674.0, 'Epsilon', 0.9659966666664439, 'Action', array([ 1. , 0.6291666, 0. ]), 'Reward', -0.93359577581307773)
('Episode', 6, 'Step', 689.0, 'Epsilon', 0.9659466666664436, 'Action', array([-0.26670131, 0.42345296, 0. ]), 'Reward', -1.5332097091701455)
('Episode', 6, 'Step', 704.0, 'Epsilon', 0.9658966666664432, 'Action', array([ 0.54472468, 0.56514547, 0. ]), 'Reward', -0.99648766051569804)
('Episode', 6, 'Step', 719.0, 'Epsilon', 0.9658466666664429, 'Action', array([-1. , 0.54599636, 0. ]), 'Reward', -4.2145798634948015)
('Episode', 6, 'Step', 734.0, 'Epsilon', 0.9657966666664426, 'Action', array([ 1. , 0.46900585, 0. ]), 'Reward', -0.70760465440311826)
('Episode', 6, 'Step', 749.0, 'Epsilon', 0.9657466666664423, 'Action', array([ 1. , 0.57126357, 0. ]), 'Reward', -2.4222194899365341)
('Episode', 6, 'Step', 764.0, 'Epsilon', 0.9656966666664419, 'Action', array([ 0.96315905, 0.51245405, 0. ]), 'Reward', -2.19836787628455)
('Episode', 6, 'Step', 779.0, 'Epsilon', 0.9656466666664416, 'Action', array([-0.52821968, 0.59129508, 0. ]), 'Reward', -13.171424637873729)
('Episode', 6, 'Step', 794.0, 'Epsilon', 0.9655966666664413, 'Action', array([-0.26106975, 0.50024251, 0. ]), 'Reward', -0.33411732002271283)
('Episode', 6, 'Step', 809.0, 'Epsilon', 0.965546666666441, 'Action', array([-0.44417581, 0.44886186, 0. ]), 'Reward', -0.32055765064357028)
('Episode', 6, 'Step', 824.0, 'Epsilon', 0.9654966666664406, 'Action', array([-0.7236589 , 0.38034423, 0.01749302]), 'Reward', -0.19146639218278183)
('Episode', 6, 'Step', 839.0, 'Epsilon', 0.9654466666664403, 'Action', array([-1. , 0.51561252, 0. ]), 'Reward', -0.15322341978640996)
('Episode', 6, 'Step', 854.0, 'Epsilon', 0.96539666666644, 'Action', array([-1. , 0.65140721, 0. ]), 'Reward', -0.30792956516259107)
('Episode', 6, 'Step', 869.0, 'Epsilon', 0.9653466666664396, 'Action', array([-0.76173451, 0.31628179, 0. ]), 'Reward', -0.27224079223520342)
('Episode', 6, 'Step', 884.0, 'Epsilon', 0.9652966666664393, 'Action', array([ 0.87536082, 0.42811936, 0. ]), 'Reward', -0.80266997714075972)
('Episode', 6, 'Step', 899.0, 'Epsilon', 0.965246666666439, 'Action', array([-0.077291 , 0.45199643, 0. ]), 'Reward', -0.49727817060274937)
('Episode', 6, 'Step', 914.0, 'Epsilon', 0.9651966666664387, 'Action', array([-0.11013275, 0.63990731, 0. ]), 'Reward', -0.81058506400171682)
('Episode', 6, 'Step', 929.0, 'Epsilon', 0.9651466666664383, 'Action', array([-0.3931495 , 0.63320352, 0. ]), 'Reward', -0.67838941111175732)
('Episode', 6, 'Step', 944.0, 'Epsilon', 0.965096666666438, 'Action', array([-1. , 0.37986793, 0. ]), 'Reward', -0.19686098334540256)
('Episode', 6, 'Step', 959.0, 'Epsilon', 0.9650466666664377, 'Action', array([-0.05930888, 0.52054809, 0. ]), 'Reward', -1.3840908175525488)
('Episode', 6, 'Step', 974.0, 'Epsilon', 0.9649966666664374, 'Action', array([-0.04737171, 0.56124266, 0. ]), 'Reward', -0.77291862902618469)
('Episode', 6, 'Step', 989.0, 'Epsilon', 0.964946666666437, 'Action', array([-0.73043066, 0.6258066 , 0. ]), 'Reward', -0.84298003270609012)
('Episode', 6, 'Step', 1004.0, 'Epsilon', 0.9648966666664367, 'Action', array([ 0.22325382, 0.47545091, 0. ]), 'Reward', -1.8077448255539528)
('Episode', 6, 'Step', 1019.0, 'Epsilon', 0.9648466666664364, 'Action', array([ 0.52261772, 0.36805715, 0. ]), 'Reward', -1.7430839328982444)
('Episode', 6, 'Step', 1034.0, 'Epsilon', 0.964796666666436, 'Action', array([-1. , 0.59357971, 0. ]), 'Reward', -1.6027187133253484)
('Episode', 6, 'Step', 1049.0, 'Epsilon', 0.9647466666664357, 'Action', array([-0.5863584 , 0.61303843, 0. ]), 'Reward', -0.99008574775184632)
('Episode', 6, 'Step', 1064.0, 'Epsilon', 0.9646966666664354, 'Action', array([-1. , 0.34483528, 0. ]), 'Reward', -3.1702259573069238)
('Episode', 6, 'Step', 1079.0, 'Epsilon', 0.9646466666664351, 'Action', array([-0.86357241, 0.57678683, 0. ]), 'Reward', -3.447457152171328)
('Episode', 6, 'Step', 1094.0, 'Epsilon', 0.9645966666664347, 'Action', array([-0.34873704, 0.32778128, 0. ]), 'Reward', -7.0065065514230795)
('Episode', 6, 'Step', 1109.0, 'Epsilon', 0.9645466666664344, 'Action', array([ 0.23692111, 0.50634233, 0. ]), 'Reward', -10.596332947056361)
('Episode', 6, 'Step', 1124.0, 'Epsilon', 0.9644966666664341, 'Action', array([ 0.76459397, 0.27861854, 0. ]), 'Reward', -2.2999284135331175)
('Episode', 6, 'Step', 1139.0, 'Epsilon', 0.9644466666664337, 'Action', array([-0.3069764 , 0.51373127, 0. ]), 'Reward', -0.33613580099191998)
('Episode', 6, 'Step', 1154.0, 'Epsilon', 0.9643966666664334, 'Action', array([-0.94564533, 0.41353091, 0. ]), 'Reward', -0.24419320192882718)
('Episode', 6, 'Step', 1169.0, 'Epsilon', 0.9643466666664331, 'Action', array([-0.08335282, 0.54052858, 0. ]), 'Reward', -0.5169735565049105)
('Episode', 6, 'Step', 1184.0, 'Epsilon', 0.9642966666664328, 'Action', array([-0.42969579, 0.2328426 , 0. ]), 'Reward', -0.19232855250719411)
('Episode', 6, 'Step', 1199.0, 'Epsilon', 0.9642466666664324, 'Action', array([-1. , 0.5466598, 0. ]), 'Reward', -0.41244511445901028)
('Episode', 6, 'Step', 1214.0, 'Epsilon', 0.9641966666664321, 'Action', array([ 0.63826694, 0.50488469, 0. ]), 'Reward', -0.36334416550929477)
('Episode', 6, 'Step', 1229.0, 'Epsilon', 0.9641466666664318, 'Action', array([ 0.52969827, 0.29084981, 0.0223636 ]), 'Reward', -0.2589561514480393)
('Episode', 6, 'Step', 1244.0, 'Epsilon', 0.9640966666664315, 'Action', array([-1. , 0.30449746, 0. ]), 'Reward', -0.27180322237016785)
('Episode', 6, 'Step', 1259.0, 'Epsilon', 0.9640466666664311, 'Action', array([-0.94202242, 0.45595305, 0. ]), 'Reward', -0.28689607474014778)
('Episode', 6, 'Step', 1274.0, 'Epsilon', 0.9639966666664308, 'Action', array([-1. , 0.65081929, 0. ]), 'Reward', -0.34227353368024793)
('Episode', 6, 'Step', 1289.0, 'Epsilon', 0.9639466666664305, 'Action', array([ 0.40929725, 0.51321353, 0. ]), 'Reward', -0.4397361397754655)
('Episode', 6, 'Step', 1304.0, 'Epsilon', 0.9638966666664301, 'Action', array([ 0.27819432, 0.44375128, 0. ]), 'Reward', -0.28354123048358604)
('Episode', 6, 'Step', 1319.0, 'Epsilon', 0.9638466666664298, 'Action', array([-0.42377413, 0.45789518, 0.0295305 ]), 'Reward', -0.28835222394744964)
('Episode', 6, 'Step', 1334.0, 'Epsilon', 0.9637966666664295, 'Action', array([ 1. , 0.32531878, 0. ]), 'Reward', -0.66775041540130198)
('Episode', 6, 'Step', 1349.0, 'Epsilon', 0.9637466666664292, 'Action', array([-0.20622023, 0.35869985, 0. ]), 'Reward', -0.19175830537462116)
('Episode', 6, 'Step', 1364.0, 'Epsilon', 0.9636966666664288, 'Action', array([-1. , 0.57044133, 0. ]), 'Reward', -0.15589258227521585)
('Episode', 6, 'Step', 1379.0, 'Epsilon', 0.9636466666664285, 'Action', array([-0.38016481, 0.31161241, 0.05998814]), 'Reward', -0.18000148500946656)
('Episode', 6, 'Step', 1394.0, 'Epsilon', 0.9635966666664282, 'Action', array([-0.57069454, 0.4913347 , 0. ]), 'Reward', -0.29569895343080654)
('Episode', 6, 'Step', 1409.0, 'Epsilon', 0.9635466666664279, 'Action', array([-1. , 0.48386349, 0. ]), 'Reward', -0.15423610611157312)
('Episode', 6, 'Step', 1424.0, 'Epsilon', 0.9634966666664275, 'Action', array([-0.90633829, 0.44779907, 0. ]), 'Reward', -0.30877369343822852)
('Episode', 6, 'Step', 1439.0, 'Epsilon', 0.9634466666664272, 'Action', array([-0.86875903, 0.36222848, 0. ]), 'Reward', -0.14411410123789442)
('Episode', 6, 'Step', 1454.0, 'Epsilon', 0.9633966666664269, 'Action', array([-1. , 0.6523388, 0. ]), 'Reward', -0.31671693022236125)
('Episode', 6, 'Step', 1469.0, 'Epsilon', 0.9633466666664265, 'Action', array([-1. , 0.56043624, 0. ]), 'Reward', -0.22777134708319474)
('Episode', 6, 'Step', 1484.0, 'Epsilon', 0.9632966666664262, 'Action', array([-1. , 0.51916462, 0. ]), 'Reward', -0.314006588843325)
('Episode', 6, 'Step', 1499.0, 'Epsilon', 0.9632466666664259, 'Action', array([-0.45246706, 0.57668935, 0. ]), 'Reward', -0.28203976648679729)
('Episode', 6, 'Step', 1514.0, 'Epsilon', 0.9631966666664256, 'Action', array([-0.79691943, 0.43840267, 0. ]), 'Reward', -0.21186576128442475)
('Episode', 6, 'Step', 1529.0, 'Epsilon', 0.9631466666664252, 'Action', array([ 0.71819827, 0.54396456, 0. ]), 'Reward', -0.50250623300660791)
('Episode', 6, 'Step', 1544.0, 'Epsilon', 0.9630966666664249, 'Action', array([ 0.0091736 , 0.43967298, 0. ]), 'Reward', -0.17472217926357136)
('Episode', 6, 'Step', 1559.0, 'Epsilon', 0.9630466666664246, 'Action', array([-0.89949736, 0.44929234, 0. ]), 'Reward', -0.26503486202199333)
('Episode', 6, 'Step', 1574.0, 'Epsilon', 0.9629966666664243, 'Action', array([ 1. , 0.55525277, 0. ]), 'Reward', -0.72367583517828449)
('Episode', 6, 'Step', 1589.0, 'Epsilon', 0.9629466666664239, 'Action', array([-0.00261784, 0.53624304, 0.01363069]), 'Reward', -0.50715893186961947)
('Episode', 6, 'Step', 1604.0, 'Epsilon', 0.9628966666664236, 'Action', array([-0.29150888, 0.44400469, 0. ]), 'Reward', -0.45221767039628613)
('Episode', 6, 'Step', 1619.0, 'Epsilon', 0.9628466666664233, 'Action', array([-0.22481156, 0.42528468, 0. ]), 'Reward', -0.31915201376266128)
('Episode', 6, 'Step', 1634.0, 'Epsilon', 0.9627966666664229, 'Action', array([-0.07305498, 0.26994642, 0. ]), 'Reward', -0.19086071760724568)
('Episode', 6, 'Step', 1649.0, 'Epsilon', 0.9627466666664226, 'Action', array([-0.25483195, 0.49269107, 0. ]), 'Reward', -0.21927614905064469)
('Episode', 6, 'Step', 1664.0, 'Epsilon', 0.9626966666664223, 'Action', array([-0.92104195, 0.44774736, 0. ]), 'Reward', -0.25318774847253778)
('Episode', 6, 'Step', 1679.0, 'Epsilon', 0.962646666666422, 'Action', array([-0.71487277, 0.59320405, 0. ]), 'Reward', -0.36802819134169124)
('Episode', 6, 'Step', 1694.0, 'Epsilon', 0.9625966666664216, 'Action', array([-1. , 0.51110434, 0. ]), 'Reward', -0.3061213601457497)
('Episode', 6, 'Step', 1709.0, 'Epsilon', 0.9625466666664213, 'Action', array([-0.875019
Fuel consumption disabled!
Laptime limit disabled!
Visual Properties Report
------------------------
Compatibility mode, properties unknown.
Waiting for request on port 3101
******* RESTARTING *****
64, 0.54164219, 0. ]), 'Reward', -0.19261727666335637)
('Episode', 6, 'Step', 1724.0, 'Epsilon', 0.962496666666421, 'Action', array([ 0.19869585, 0.48916946, 0.00288554]), 'Reward', -0.27247378952808449)
('Episode', 6, 'Step', 1739.0, 'Epsilon', 0.9624466666664206, 'Action', array([ 0.64397715, 0.51191994, 0. ]), 'Reward', -0.64297252250313064)
('Episode', 6, 'Step', 1754.0, 'Epsilon', 0.9623966666664203, 'Action', array([ 0.11093755, 0.74076498, 0. ]), 'Reward', -0.65200829907728874)
('Episode', 6, 'Step', 1769.0, 'Epsilon', 0.96234666666642, 'Action', array([-0.58088503, 0.39807565, 0. ]), 'Reward', -0.25875274764829548)
('Episode', 6, 'Step', 1784.0, 'Epsilon', 0.9622966666664197, 'Action', array([ 1. , 0.59004667, 0. ]), 'Reward', -0.62124035414339263)
('Episode', 6, 'Step', 1799.0, 'Epsilon', 0.9622466666664193, 'Action', array([-0.83086896, 0.50597699, 0. ]), 'Reward', -0.13010320273649428)
('Episode', 6, 'Step', 1814.0, 'Epsilon', 0.962196666666419, 'Action', array([ 0.19750357, 0.56009745, 0. ]), 'Reward', -0.4134923058952043)
('Episode', 6, 'Step', 1829.0, 'Epsilon', 0.9621466666664187, 'Action', array([-1. , 0.33036452, 0. ]), 'Reward', -0.10016366869763853)
('Episode', 6, 'Step', 1844.0, 'Epsilon', 0.9620966666664184, 'Action', array([-0.89600434, 0.32236058, 0. ]), 'Reward', -0.023405890393458122)
('Episode', 6, 'Step', 1859.0, 'Epsilon', 0.962046666666418, 'Action', array([-1. , 0.32828205, 0. ]), 'Reward', -0.036727521769834459)
('Episode', 6, 'Step', 1874.0, 'Epsilon', 0.9619966666664177, 'Action', array([-0.82757666, 0.54222551, 0. ]), 'Reward', -0.4207849225246767)
('Episode', 6, 'Step', 1889.0, 'Epsilon', 0.9619466666664174, 'Action', array([ 0.76436241, 0.47215792, 0. ]), 'Reward', -0.54848296102747762)
('Episode', 6, 'Step', 1904.0, 'Epsilon', 0.961896666666417, 'Action', array([ 0.30952555, 0.4568929 , 0.02492074]), 'Reward', -0.44712954979280378)
('Episode', 6, 'Step', 1919.0, 'Epsilon', 0.9618466666664167, 'Action', array([-1. , 0.53356133, 0. ]), 'Reward', -0.28330669814561238)
('Episode', 6, 'Step', 1934.0, 'Epsilon', 0.9617966666664164, 'Action', array([ 0.07321457, 0.47670248, 0. ]), 'Reward', -0.26516881765729694)
('Episode', 6, 'Step', 1949.0, 'Epsilon', 0.9617466666664161, 'Action', array([-1. , 0.4166946, 0. ]), 'Reward', -0.34738805772599357)
('Episode', 6, 'Step', 1964.0, 'Epsilon', 0.9616966666664157, 'Action', array([ 0.02984318, 0.44417095, 0. ]), 'Reward', -0.35487868657238647)
('Episode', 6, 'Step', 1979.0, 'Epsilon', 0.9616466666664154, 'Action', array([ 0.17293496, 0.36503443, 0. ]), 'Reward', -0.15837560627904479)
('Episode', 6, 'Step', 1994.0, 'Epsilon', 0.9615966666664151, 'Action', array([-0.78573759, 0.46457112, 0. ]), 'Reward', -0.35858621579024291)
TOTAL REWARD @ 6-th Episode : Reward -9752.90057957
Total Step: 11526
Waiting for server on 3101............
Count Down : 5
Client connected on 3101..............
Episode : 7 Replay Buffer 11526 Early Stopping: 0 Epsilon: 0.96158 RN: 0.512499988681
('Episode', 7, 'Step', 9.0, 'Epsilon', 0.9615466666664148, 'Action', array([-0.78833877, 0.51587888, 0. ]), 'Reward', 8.8290772132283397)
('Episode', 7, 'Step', 24.0, 'Epsilon', 0.9614966666664144, 'Action', array([ 1. , 0.34094359, 0.03375663]), 'Reward', -32.941122293879687)
('Episode', 7, 'Step', 39.0, 'Epsilon', 0.9614466666664141, 'Action', array([ 0.03541434, 0.42832621, 0. ]), 'Reward', -0.043967851966594057)
('Episode', 7, 'Step', 54.0, 'Epsilon', 0.9613966666664138, 'Action', array([-0.31075317, 0.33305923, 0. ]), 'Reward', 0.049294720952766935)
('Episode', 7, 'Step', 69.0, 'Epsilon', 0.9613466666664134, 'Action', array([-1. , 0.48675958, 0. ]), 'Reward', -0.34147106209520972)
('Episode', 7, 'Step', 84.0, 'Epsilon', 0.9612966666664131, 'Action', array([-0.12326815, 0.44502403, 0.08504427]), 'Reward', 0.048998320437405457)
('Episode', 7, 'Step', 99.0, 'Epsilon', 0.9612466666664128, 'Action', array([-1. , 0.53199435, 0. ]), 'Reward', -0.31834879676333028)
('Episode', 7, 'Step', 114.0, 'Epsilon', 0.9611966666664125, 'Action', array([-0.92742687, 0.4655893 , 0. ]), 'Reward', 0.015992761351096473)
('Episode', 7, 'Step', 129.0, 'Epsilon', 0.9611466666664121, 'Action', array([-0.6602806 , 0.59267756, 0. ]), 'Reward', -0.78920694114337431)
('Episode', 7, 'Step', 144.0, 'Epsilon', 0.9610966666664118, 'Action', array([-1. , 0.59701185, 0. ]), 'Reward', -0.46402886940415949)
('Episode', 7, 'Step', 159.0, 'Epsilon', 0.9610466666664115, 'Action', array([ 1. , 0.31764345, 0. ]), 'Reward', -0.46785835284061345)
('Episode', 7, 'Step', 174.0, 'Epsilon', 0.9609966666664111, 'Action', array([-0.58710622, 0.67600733, 0. ]), 'Reward', -0.708281685500179)
('Episode', 7, 'Step', 189.0, 'Epsilon', 0.9609466666664108, 'Action', array([-0.61857344, 0.38776958, 0. ]), 'Reward', -0.16744515824339781)
('Episode', 7, 'Step', 204.0, 'Epsilon', 0.9608966666664105, 'Action', array([-0.74731905, 0.37628554, 0. ]), 'Reward', -0.15865541985040099)
('Episode', 7, 'Step', 219.0, 'Epsilon', 0.9608466666664102, 'Action', array([-1. , 0.41417997, 0. ]), 'Reward', -0.76452441491080037)
('Episode', 7, 'Step', 234.0, 'Epsilon', 0.9607966666664098, 'Action', array([-0.31619555, 0.45047305, 0. ]), 'Reward', -0.45761879084905782)
('Episode', 7, 'Step', 249.0, 'Epsilon', 0.9607466666664095, 'Action', array([ 0.62055199, 0.43782367, 0. ]), 'Reward', -0.96688134529349012)
('Episode', 7, 'Step', 264.0, 'Epsilon', 0.9606966666664092, 'Action', array([ 0.45609561, 0.50648884, 0. ]), 'Reward', -1.2635299764315784)
('Episode', 7, 'Step', 279.0, 'Epsilon', 0.9606466666664089, 'Action', array([ 0.71456296, 0.48845338, 0. ]), 'Reward', -1.4506248440542955)
('Episode', 7, 'Step', 294.0, 'Epsilon', 0.9605966666664085, 'Action', array([-0.29919631, 0.46378079, 0. ]), 'Reward', -0.75532944614351927)
('Episode', 7, 'Step', 309.0, 'Epsilon', 0.9605466666664082, 'Action', array([-0.8250363 , 0.48245666, 0. ]), 'Reward', -0.68468946602577829)
('Episode', 7, 'Step', 324.0, 'Epsilon', 0.9604966666664079, 'Action', array([-1. , 0.44224268, 0. ]), 'Reward', -0.661904378347832)
('Episode', 7, 'Step', 339.0, 'Epsilon', 0.9604466666664075, 'Action', array([-1. , 0.46237886, 0. ]), 'Reward', -0.46910006775612478)
('Episode', 7, 'Step', 354.0, 'Epsilon', 0.9603966666664072, 'Action', array([ 0.27772644, 0.41315437, 0. ]), 'Reward', -1.2440659657848099)
('Episode', 7, 'Step', 369.0, 'Epsilon', 0.9603466666664069, 'Action', array([-0.88263336, 0.66820364, 0. ]), 'Reward', -1.387968125920493)
('Episode', 7, 'Step', 384.0, 'Epsilon', 0.9602966666664066, 'Action', array([-1. , 0.59148614, 0. ]), 'Reward', -0.87997182028044096)
('Episode', 7, 'Step', 399.0, 'Epsilon', 0.9602466666664062, 'Action', array([-0.63930923, 0.50800196, 0. ]), 'Reward', -1.2533565664299924)
('Episode', 7, 'Step', 414.0, 'Epsilon', 0.9601966666664059, 'Action', array([ 0.04330672, 0.50736807, 0. ]), 'Reward', -1.9917804766547778)
('Episode', 7, 'Step', 429.0, 'Epsilon', 0.9601466666664056, 'Action', array([-0.32860418, 0.5944005 , 0. ]), 'Reward', -1.8469372878625254)
('Episode', 7, 'Step', 444.0, 'Epsilon', 0.9600966666664053, 'Action', array([-1. , 0.34400508, 0. ]), 'Reward', -0.27433011475267893)
('Episode', 7, 'Step', 459.0, 'Epsilon', 0.9600466666664049, 'Action', array([ 0.23718339, 0.39549617, 0. ]), 'Reward', -2.600026435495856)
('Episode', 7, 'Step', 474.0, 'Epsilon', 0.9599966666664046, 'Action', array([-0.76905728, 0.21761838, 0.03999264]), 'Reward', -0.047150766485336157)
('Episode', 7, 'Step', 489.0, 'Epsilon', 0.9599466666664043, 'Action', array([-0.0746662 , 0.43417216, 0. ]), 'Reward', -1.351296629836656)
('Episode', 7, 'Step', 504.0, 'Epsilon', 0.9598966666664039, 'Action', array([-1. , 0.59983615, 0. ]), 'Reward', -1.2552768643445049)
('Episode', 7, 'Step', 519.0, 'Epsilon', 0.9598466666664036, 'Action', array([-0.26717636, 0.38576308, 0. ]), 'Reward', -2.4313601780531684)
('Episode', 7, 'Step', 534.0, 'Epsilon', 0.9597966666664033, 'Action', array([ 0.69688597, 0.51682653, 0. ]), 'Reward', -2.8926429887808816)
('Episode', 7, 'Step', 549.0, 'Epsilon', 0.959746666666403, 'Action', array([-1. , 0.45597983, 0. ]), 'Reward', -2.1576877117922488)
('Episode', 7, 'Step', 564.0, 'Epsilon', 0.9596966666664026, 'Action', array([ 1. , 0.47668034, 0. ]), 'Reward', -3.9964961118492179)
('Episode', 7, 'Step', 579.0, 'Epsilon', 0.9596466666664023, 'Action', array([ 0.49357511, 0.42283634, 0.02485279]), 'Reward', -3.0605281648689964)
('Episode', 7, 'Step', 594.0, 'Epsilon', 0.959596666666402, 'Action', array([ 0.96385971, 0.41772116, 0. ]), 'Reward', -6.3922303342125986)
('Episode', 7, 'Step', 609.0, 'Epsilon', 0.9595466666664016, 'Action', array([ 1. , 0.33339983, 0. ]), 'Reward', -2.3498646575495172)
('Episode', 7, 'Step', 624.0, 'Epsilon', 0.9594966666664013, 'Action', array([-0.67469903, 0.53665917, 0.01282115]), 'Reward', -10.119271403850817)
('Episode', 7, 'Step', 639.0, 'Epsilon', 0.959446666666401, 'Action', array([-0.20052954, 0.54754026, 0. ]), 'Reward', -10.613756142364974)
('Episode', 7, 'Step', 654.0, 'Epsilon', 0.9593966666664007, 'Action', array([-0.09235049, 0.36417766, 0.01379638]), 'Reward', -11.962718295363135)
('Episode', 7, 'Step', 669.0, 'Epsilon', 0.9593466666664003, 'Action', array([ 0.00576772, 0.59998205, 0. ]), 'Reward', -8.1793551238486568)
('Episode', 7, 'Step', 684.0, 'Epsilon', 0.9592966666664, 'Action', array([ 0.27025722, 0.51869806, 0. ]), 'Reward', -4.883981741097644)
('Episode', 7, 'Step', 699.0, 'Epsilon', 0.9592466666663997, 'Action', array([-0.83687457, 0.55533007, 0. ]), 'Reward', -5.5022344428193168)
('Episode', 7, 'Step', 714.0, 'Epsilon', 0.9591966666663994, 'Action', array([ 0.43443574, 0.48134406, 0.02188136]), 'Reward', -7.0435706571345582)
('Episode', 7, 'Step', 729.0, 'Epsilon', 0.959146666666399, 'Action', array([-1. , 0.42848001, 0. ]), 'Reward', -6.0223072194058123)
('Episode', 7, 'Step', 744.0, 'Epsilon', 0.9590966666663987, 'Action', array([ 0.51854804, 0.32208452, 0.0277097 ]), 'Reward', -3.7596723263898335)
('Episode', 7, 'Step', 759.0, 'Epsilon', 0.9590466666663984, 'Action', array([ 0.61563558, 0.40418956, 0.05476596]), 'Reward', -3.204972911446442)
('Episode', 7, 'Step', 774.0, 'Epsilon', 0.958996666666398, 'Action', array([-0.95363219, 0.56602732, 0. ]), 'Reward', -7.176206256310981)
('Episode', 7, 'Step', 789.0, 'Epsilon', 0.9589466666663977, 'Action', array([-0.41653442, 0.54375416, 0. ]), 'Reward', -5.0648728108200283)
('Episode', 7, 'Step', 804.0, 'Epsilon', 0.9588966666663974, 'Action', array([-0.13385529, 0.5481912 , 0. ]), 'Reward', -8.5113477624831191)
('Episode', 7, 'Step', 819.0, 'Epsilon', 0.9588466666663971, 'Action', array([ 0.03519107, 0.55677102, 0. ]), 'Reward', -16.022876488489217)
('Episode', 7, 'Step', 834.0, 'Epsilon', 0.9587966666663967, 'Action', array([ 1.11624055e-01, 5.56811346e-01, 2.01012154e-05]), 'Reward', -13.362288129736745)
('Episode', 7, 'Step', 849.0, 'Epsilon', 0.9587466666663964, 'Action', array([ 0.12074657, 0.36475389, 0. ]), 'Reward', -21.357819322766595)
('Episode', 7, 'Step', 864.0, 'Epsilon', 0.9586966666663961, 'Action', array([-1. , 0.3435461, 0. ]), 'Reward', -12.522538153104534)
('Episode', 7, 'Step', 879.0, 'Epsilon', 0.9586466666663958, 'Action', array([ 0.45558407, 0.48408638, 0. ]), 'Reward', -31.550182942535237)
('Episode', 7, 'Step', 894.0, 'Epsilon', 0.9585966666663954, 'Action', array([-0.24969239, 0.41077806, 0. ]), 'Reward', -78.834928342623755)
('Episode', 7, 'Step', 909.0, 'Epsilon', 0.9585466666663951, 'Action', array([-1. , 0.5311903, 0. ]), 'Reward', -106.73705644740114)
('Episode', 7, 'Step', 924.0, 'Epsilon', 0.9584966666663948, 'Action', array([-1. , 0.4661485, 0. ]), 'Reward', -84.368367267732907)
('Episode', 7, 'Step', 939.0, 'Epsilon', 0.9584466666663944, 'Action', array([-1. , 0.52327156, 0. ]), 'Reward', -1)
('Episode', 7, 'Step', 954.0, 'Epsilon', 0.9583966666663941, 'Action', array([ 1. , 0.58668862, 0. ]), 'Reward', 0.036111284565679552)
('Episode', 7, 'Step', 969.0, 'Epsilon', 0.9583466666663938, 'Action', array([ 0.58359597, 0.31973098, 0. ]), 'Reward', -0.57621272138037405)
('Episode', 7, 'Step', 984.0, 'Epsilon', 0.9582966666663935, 'Action', array([-0.11834378, 0.46884575, 0. ]), 'Reward', -0.41881335212244708)
('Episode', 7, 'Step', 999.0, 'Epsilon', 0.9582466666663931, 'Action', array([ 1. , 0.44948964, 0. ]), 'Reward', -0.42997891666037685)
('Episode', 7, 'Step', 1014.0, 'Epsilon', 0.9581966666663928, 'Action', array([ 0.91046585, 0.25244396, 0. ]), 'Reward', 0.0092889027285927295)
('Episode', 7, 'Step', 1029.0, 'Epsilon', 0.9581466666663925, 'Action', array([ 0.60005303, 0.57327775, 0. ]), 'Reward', -0.41180069745972575)
('Episode', 7, 'Step', 1044.0, 'Epsilon', 0.9580966666663921, 'Action', array([-0.86686503, 0.62174346, 0. ]), 'Reward', -0.27786411045766457)
('Episode', 7, 'Step', 1059.0, 'Epsilon', 0.9580466666663918, 'Action', array([ 1. , 0.50547711, 0. ]), 'Reward', -0.34033429322054465)
('Episode', 7, 'Step', 1074.0, 'Epsilon', 0.9579966666663915, 'Action', array([-0.28407424, 0.6457937 , 0. ]), 'Reward', -0.72202126723583337)
('Episode', 7, 'Step', 1089.0, 'Epsilon', 0.9579466666663912, 'Action', array([ 0.18872556, 0.62282834, 0. ]), 'Reward', -0.45471388046739464)
('Episode', 7, 'Step', 1104.0, 'Epsilon', 0.9578966666663908, 'Action', array([-0.53150597, 0.43230017, 0. ]), 'Reward', -0.61864314030340628)
('Episode', 7, 'Step', 1119.0, 'Epsilon', 0.9578466666663905, 'Action', array([ 0.08784029, 0.50795309, 0. ]), 'Reward', -0.49044346889089918)
('Episode', 7, 'Step', 1134.0, 'Epsilon', 0.9577966666663902, 'Action', array([ 0.31766282, 0.48111711, 0. ]), 'Reward', -0.52785575110987137)
('Episode', 7, 'Step', 1149.0, 'Epsilon', 0.9577466666663899, 'Action', array([-1. , 0.25680722, 0. ]), 'Reward', -0.53626179623968162)
('Episode', 7, 'Step', 1164.0, 'Epsilon', 0.9576966666663895, 'Action', array([ 0.83576178, 0.48741358, 0. ]), 'Reward', -0.50614464224206834)
('Episode', 7, 'Step', 1179.0, 'Epsilon', 0.9576466666663892, 'Action', array([ 1. , 0.36363098, 0. ]), 'Reward', -0.35066652621321159)
('Episode', 7, 'Step', 1194.0, 'Epsilon', 0.9575966666663889, 'Action', array([-0.61751529, 0.47865824, 0. ]), 'Reward', -0.62112872505238692)
('Episode', 7, 'Step', 1209.0, 'Epsilon', 0.9575466666663885, 'Action', array([ 1. , 0.40678836, 0. ]), 'Reward', -0.27064717059075677)
('Episode', 7, 'Step', 1224.0, 'Epsilon', 0.9574966666663882, 'Action', array([-1. , 0.59486736, 0. ]), 'Reward', -1.0545668936199384)
('Episode', 7, 'Step', 1239.0, 'Epsilon', 0.9574466666663879, 'Action', array([-0.68331369, 0.28073834, 0.00965428]), 'Reward', -0.51967379824498583)
('Episode', 7, 'Step', 1254.0, 'Epsilon', 0.9573966666663876, 'Action', array([ 1. , 0.54170689, 0. ]), 'Reward', -0.37873411097757131)
('Episode', 7, 'Step', 1269.0, 'Epsilon', 0.9573466666663872, 'Action', array([ 1. , 0.5205659 , 0.03492186]), 'Reward', -0.25925253725692365)
('Episode', 7, 'Step', 1284.0, 'Epsilon', 0.9572966666663869, 'Action', array([ 0.93730241, 0.61198159, 0. ]), 'Reward', -0.33328202246098165)
('Episode', 7, 'Step', 1299.0, 'Epsilon', 0.9572466666663866, 'Action', array([-0.24681415, 0.3864277 , 0. ]), 'Reward', -0.49327774931402624)
('Episode', 7, 'Step', 1314.0, 'Epsilon', 0.9571966666663863, 'Action', array([-0.09427508, 0.59561449, 0. ]), 'Reward', -0.70299129746041134)
('Episode', 7, 'Step', 1329.0, 'Epsilon', 0.9571466666663859, 'Action', array([ 0.07187269, 0.4219616 , 0. ]), 'Reward', -0.57598748048985948)
('Episode', 7, 'Step', 1344.0, 'Epsilon', 0.9570966666663856, 'Action', array([ 0.47239705, 0.41613333, 0. ]), 'Reward', -0.29420848723806203)
('Episode', 7, 'Step', 1359.0, 'Epsilon', 0.9570466666663853, 'Action', array([-0.1446814 , 0.49781619, 0. ]), 'Reward', -0.51998874452457233)
('Episode', 7, 'Step', 1374.0, 'Epsilon', 0.9569966666663849, 'Action', array([ 0.38107252, 0.3673363 , 0. ]), 'Reward', -0.3493624948295222)
('Episode', 7, 'Step', 1389.0, 'Epsilon', 0.9569466666663846, 'Action', array([ 0.58871601, 0.5318817 , 0. ]), 'Reward', -1.9927340416179922)
('Episode', 7, 'Step', 1404.0, 'Epsilon', 0.9568966666663843, 'Action', array([ 0.29898655, 0.48798831, 0. ]), 'Reward', -3.3901490083905532)
('Episode', 7, 'Step', 1419.0, 'Epsilon', 0.956846666666384, 'Action', array([ 0.99650442, 0.1710446 , 0.02785745]), 'Reward', -0.70695501363940272)
('Episode', 7, 'Step', 1434.0, 'Epsilon', 0.9567966666663836, 'Action', array([ 0.8837717 , 0.44766986, 0. ]), 'Reward', -1.8084806626577201)
('Episode', 7, 'Step', 1449.0, 'Epsilon', 0.9567466666663833, 'Action', array([ 0.35596623, 0.41039535, 0. ]), 'Reward', -1.0485377609017745)
('Episode', 7, 'Step', 1464.0, 'Epsilon', 0.956696666666383, 'Action', array([-0.90520273, 0.44529901, 0. ]), 'Reward', -1.3511782604233811)
('Episode', 7, 'Step', 1479.0, 'Epsilon', 0.9566466666663827, 'Action', array([ 0.86892148, 0.42081393, 0. ]), 'Reward', -2.1836112140982138)
('Episode', 7, 'Step', 1494.0, 'Epsilon', 0.9565966666663823, 'Action', array([-0.34099229, 0.63758888, 0. ]), 'Reward', -3.113382309488145)
('Episode', 7, 'Step', 1509.0, 'Epsilon', 0.956546666666382, 'Action', array([-0.01096187, 0.47594153, 0. ]), 'Reward', 19.12068894541374)
('Episode', 7, 'Step', 1524.0, 'Epsilon', 0.9564966666663817, 'Action', array([-0.94900119, 0.25334754, 0. ]), 'Reward', -0.26676699998303433)
('Episode', 7, 'Step', 1539.0, 'Epsilon', 0.9564466666663813, 'Action', array([-0.0035195 , 0.64337805, 0. ]), 'Reward', -0.54800266227185124)
('Episode', 7, 'Step', 1554.0, 'Epsilon', 0.956396666666381, 'Action', array([-0.87216082, 0.2354265 , 0.01377198]), 'Reward', -0.18486932251002214)
('Episode', 7, 'Step', 1569.0, 'Epsilon', 0.9563466666663807, 'Action', array([-0.41828945, 0.39325583, 0. ]), 'Reward', -0.19182914598422957)
('Episode', 7, 'Step', 1584.0, 'Epsilon', 0.9562966666663804, 'Action', array([-1. , 0.34397954, 0. ]), 'Reward', -0.2937348616027754)
('Episode', 7, 'Step', 1599.0, 'Epsilon', 0.95624666666638, 'Action', array([-0.69574714, 0.38747992, 0. ]), 'Reward', -0.33698753496453804)
('Episode', 7, 'Step', 1614.0, 'Epsilon', 0.9561966666663797, 'Action', array([-0.83154285, 0.49207152, 0. ]), 'Reward', -0.31924181275539121)
('Episode', 7, 'Step', 1629.0, 'Epsilon', 0.9561466666663794, 'Action', array([-0.01145087, 0.6149766 , 0. ]), 'Reward', -0.55160642434874074)
('Episode', 7, 'Step', 1644.0, 'Epsilon', 0.956096666666379, 'Action', array([-0.03235341, 0.52544277, 0. ]), 'Reward', -0.4904776521615305)
('Episode', 7, 'Step', 1659.0, 'Epsilon', 0.9560466666663787, 'Action', array([-1. , 0.46205631, 0. ]), 'Reward', -0.16493270400107291)
('Episode', 7, 'Step', 1674.0, 'Epsilon', 0.9559966666663784, 'Action', array([ 0.10680864, 0.41731277, 0.01064063]), 'Reward', -0.26043715211816165)
('Episode', 7, 'Step', 1689.0, 'Epsilon', 0.9559466666663781, 'Action', array([-0.04042453, 0.55752157, 0. ]), 'Reward', -0.48090997590748907)
('Episode', 7, 'Step', 1704.0, 'Epsilon', 0.9558966666663777, 'Action', array([-0.53447112, 0.5101927 , 0. ]), 'Reward', -0.74700994607889926)
('Episode', 7, 'Step', 1719.0, 'Epsilon', 0.9558466666663774, 'Action', array([ 0.20768129, 0.42395412, 0. ]), 'ReWaiting for request on port 3101
******* RESTARTING *****
ward', -0.99295569119212845)
('Episode', 7, 'Step', 1734.0, 'Epsilon', 0.9557966666663771, 'Action', array([-0.99037139, 0.64133345, 0. ]), 'Reward', -0.81716075305851299)
('Episode', 7, 'Step', 1749.0, 'Epsilon', 0.9557466666663768, 'Action', array([-0.22981971, 0.54919937, 0. ]), 'Reward', -0.77515079204486037)
('Episode', 7, 'Step', 1764.0, 'Epsilon', 0.9556966666663764, 'Action', array([ 0.03673034, 0.43840769, 0. ]), 'Reward', -0.73024430861619072)
('Episode', 7, 'Step', 1779.0, 'Epsilon', 0.9556466666663761, 'Action', array([-0.09021953, 0.47308313, 0. ]), 'Reward', -0.76979554075835588)
('Episode', 7, 'Step', 1794.0, 'Epsilon', 0.9555966666663758, 'Action', array([-0.21401817, 0.43302149, 0. ]), 'Reward', -1.0252797005130629)
('Episode', 7, 'Step', 1809.0, 'Epsilon', 0.9555466666663754, 'Action', array([ 0.19328832, 0.38882148, 0. ]), 'Reward', -1.5936138184603506)
('Episode', 7, 'Step', 1824.0, 'Epsilon', 0.9554966666663751, 'Action', array([-0.98821021, 0.61852637, 0. ]), 'Reward', -0.53237759512871707)
('Episode', 7, 'Step', 1839.0, 'Epsilon', 0.9554466666663748, 'Action', array([-0.10071132, 0.436809 , 0.04815257]), 'Reward', -0.53107755202985762)
('Episode', 7, 'Step', 1854.0, 'Epsilon', 0.9553966666663745, 'Action', array([ 0.28476709, 0.53436826, 0. ]), 'Reward', -1.2994423159790496)
('Episode', 7, 'Step', 1869.0, 'Epsilon', 0.9553466666663741, 'Action', array([-1. , 0.50640053, 0. ]), 'Reward', -1.2986250527811314)
('Episode', 7, 'Step', 1884.0, 'Epsilon', 0.9552966666663738, 'Action', array([-0.39510894, 0.44182184, 0. ]), 'Reward', -1.1808510684020721)
('Episode', 7, 'Step', 1899.0, 'Epsilon', 0.9552466666663735, 'Action', array([ 0.34714828, 0.60501386, 0.07153318]), 'Reward', -1.7077563362151755)
('Episode', 7, 'Step', 1914.0, 'Epsilon', 0.9551966666663732, 'Action', array([-1. , 0.47030295, 0. ]), 'Reward', -1.9022530207348272)
('Episode', 7, 'Step', 1929.0, 'Epsilon', 0.9551466666663728, 'Action', array([-0.70972868, 0.36113165, 0. ]), 'Reward', -1.4203710412194397)
('Episode', 7, 'Step', 1944.0, 'Epsilon', 0.9550966666663725, 'Action', array([-1. , 0.33704069, 0. ]), 'Reward', -1.2915570217395747)
('Episode', 7, 'Step', 1959.0, 'Epsilon', 0.9550466666663722, 'Action', array([-0.857862 , 0.64653197, 0. ]), 'Reward', -2.7637076920644024)
('Episode', 7, 'Step', 1974.0, 'Epsilon', 0.9549966666663718, 'Action', array([-1. , 0.41503463, 0.03257087]), 'Reward', -3.4360324359783743)
('Episode', 7, 'Step', 1989.0, 'Epsilon', 0.9549466666663715, 'Action', array([-0.98248126, 0.41954133, 0. ]), 'Reward', -0.29154791462708518)
TOTAL REWARD @ 7-th Episode : Reward -9130.07800835
Total Step: 13526