-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathbot-0.log
1139 lines (1139 loc) · 213 KB
/
bot-0.log
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
INFO:root:Successfully created bot! My Player ID is 0.
INFO:root:=============== TURN 001 ================
INFO:root:Time: 0.0
INFO:root:=============== TURN 002 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 3), (4, 5), (4, 7), (4, 8), (5, 1), (5, 2), (5, 4), (5, 5), (5, 6), (5, 8), (6, 3), (6, 5), (6, 7), (6, 8), (7, 3), (7, 5), (7, 6), (7, 7), (7, 8), (8, 2), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[5340, 2780, 2520, 2960, 6700, 4560, 1420, 3160, 2960], [1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800, 700], [320, 380, 140, 320, 920, 420, 180, 920, -12], [2480, 20, 1400, 2280, 320, 400, 1920, 240, 1520], [2540, -12, -88, 1100, -160, 1240, -36, 420, 780], [-84, 620, 160, -52, 520, 1000, 600, -24, 740], [-160, -156, -148, 1120, -24, 360, -12, 20, 400], [-76, -4, -108, 820, -32, 1960, 560, 440, 1500], [-40, -64, 140, -36, -72, 20, 3340, 820, 880]]
INFO:root:Count MDP: 5
INFO:root:Ship 0 command: s actual position: Position(14, 28) new position: Position(14, 29)
INFO:root:Time: 0.009771585464477539
INFO:root:=============== TURN 003 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 2), (4, 4), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 3), (5, 4), (5, 5), (5, 7), (5, 8), (6, 2), (6, 4), (6, 6), (6, 7), (6, 8), (7, 2), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2780, 2520, 2960, 6700, 4560, 1420, 3160, 2960, 3160], [2000, 2140, 1580, 4600, 1660, 2440, 1800, 700, 1900], [380, 140, 320, 920, 420, 180, 920, -12, 860], [20, 1400, 2280, 320, 400, 1920, 240, 1520, 1600], [-12, -88, 1100, -160, 20000, -36, 420, 780, 1380], [620, 160, -52, 520, 1000, 600, -24, 740, 2980], [-156, -148, 1120, -24, 360, -12, 20, 400, 780], [-4, -108, 820, -32, 1960, 560, 440, 1500, 940], [-64, 140, -36, -72, 20, 3340, 820, 880, 2520]]
INFO:root:Count MDP: 3
INFO:root:Ship 0 command: o actual position: Position(14, 29) new position: Position(14, 29)
INFO:root:Time: 0.00684046745300293
INFO:root:=============== TURN 004 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 2), (4, 4), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 3), (5, 4), (5, 5), (5, 7), (5, 8), (6, 2), (6, 4), (6, 6), (6, 7), (6, 8), (7, 2), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2780, 2520, 2960, 6700, 4560, 1420, 3160, 2960, 3160], [2000, 2140, 1580, 4600, 1660, 2440, 1800, 700, 1900], [380, 140, 320, 920, 420, 180, 920, -12, 860], [20, 1400, 2280, 320, 400, 1920, 240, 1520, 1600], [-12, -88, 1100, -8000, 720, -36, 420, 780, 1380], [620, 160, -52, 520, 1000, 600, -24, 740, 2980], [-156, -148, 1120, -24, 360, -12, 20, 400, 780], [-4, -108, 820, -32, 1960, 560, 440, 1500, 940], [-64, 140, -36, -72, 20, 3340, 820, 880, 2520]]
INFO:root:Count MDP: 3
INFO:root:Ship 0 command: o actual position: Position(14, 29) new position: Position(14, 29)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 3), (4, 5), (4, 7), (4, 8), (5, 1), (5, 2), (5, 4), (5, 5), (5, 6), (5, 8), (6, 3), (6, 5), (6, 7), (6, 8), (7, 3), (7, 5), (7, 6), (7, 7), (7, 8), (8, 2), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[5340, 2780, 2520, 2960, 6700, 4560, 1420, 3160, 2960], [1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800, 700], [320, 380, 140, 320, 920, 420, 180, 920, -12], [2480, 20, 1400, 2280, 320, 400, 1920, 240, 1520], [2540, -12, -88, 1100, -160, -40000, -36, 420, 780], [-84, 620, 160, -52, 520, 1000, 600, -24, 740], [-160, -156, -148, 1120, -24, 360, -12, 20, 400], [-76, -4, -108, 820, -32, 1960, 560, 440, 1500], [-40, -64, 140, -36, -72, 20, 3340, 820, 880]]
INFO:root:Count MDP: 5
INFO:root:Ship 2 command: n actual position: Position(14, 28) new position: Position(14, 27)
INFO:root:Time: 0.01661205291748047
INFO:root:=============== TURN 005 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 2), (4, 4), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 3), (5, 4), (5, 5), (5, 7), (5, 8), (6, 2), (6, 4), (6, 6), (6, 7), (6, 8), (7, 2), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2780, 2520, 2960, 6700, 4560, 1420, 3160, 2960, 3160], [2000, 2140, 1580, 4600, 1660, 2440, 1800, 700, 1900], [380, 140, 320, 920, 420, 180, 920, -12, 860], [20, 1400, 2280, 320, 400, 1920, 240, 1520, 1600], [-12, -88, -40000, -160, 340, -36, 420, 780, 1380], [620, 160, -52, 520, 1000, 600, -24, 740, 2980], [-156, -148, 1120, -24, 360, -12, 20, 400, 780], [-4, -108, 820, -32, 1960, 560, 440, 1500, 940], [-64, 140, -36, -72, 20, 3340, 820, 880, 2520]]
INFO:root:Count MDP: 3
INFO:root:Ship 0 command: o actual position: Position(14, 29) new position: Position(14, 29)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 4), (4, 6), (4, 8), (5, 0), (5, 2), (5, 3), (5, 5), (5, 6), (5, 7), (6, 4), (6, 6), (6, 8), (7, 4), (7, 6), (7, 7), (7, 8), (8, 3), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[3600, 5340, 2780, 2520, 2960, 6700, 4560, 1420, 3160], [1460, 1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800], [700, 320, 380, 140, 320, 920, 420, 180, 920], [1200, 2480, 20, 1400, 2280, 320, 400, 1920, 240], [320, 2540, -12, -88, 20000, -160, -40000, -36, 420], [1160, -84, 620, 160, -52, 520, 1000, 600, -24], [0, -160, -156, -148, 1120, -24, 360, -12, 20], [-84, -76, -4, -108, 820, -32, 1960, 560, 440], [-80, -40, -64, 140, -36, -72, 20, 3340, 820]]
INFO:root:Count MDP: 3
INFO:root:Ship 2 command: o actual position: Position(14, 27) new position: Position(14, 27)
INFO:root:Time: 0.014657020568847656
INFO:root:=============== TURN 006 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 2), (4, 4), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 3), (5, 4), (5, 5), (5, 7), (5, 8), (6, 2), (6, 4), (6, 6), (6, 7), (6, 8), (7, 2), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2780, 2520, 2960, 6700, 4560, 1420, 3160, 2960, 3160], [2000, 2140, 1580, 4600, 1660, 2440, 1800, 700, 1900], [380, 140, 320, 920, 420, 180, 920, -12, 860], [20, 1400, 2280, 320, 400, 1920, 240, 1520, 1600], [-12, -88, -40000, -8000, 40, -36, 420, 780, 1380], [620, 160, -52, 520, 1000, 600, -24, 740, 2980], [-156, -148, 1120, -24, 360, -12, 20, 400, 780], [-4, -108, 820, -32, 1960, 560, 440, 1500, 940], [-64, 140, -36, -72, 20, 3340, 820, 880, 2520]]
INFO:root:Count MDP: 3
INFO:root:Ship 0 command: o actual position: Position(14, 29) new position: Position(14, 29)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 4), (4, 6), (4, 8), (5, 0), (5, 2), (5, 3), (5, 5), (5, 6), (5, 7), (6, 4), (6, 6), (6, 8), (7, 4), (7, 6), (7, 7), (7, 8), (8, 3), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[3600, 5340, 2780, 2520, 2960, 6700, 4560, 1420, 3160], [1460, 1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800], [700, 320, 380, 140, 320, 920, 420, 180, 920], [1200, 2480, 20, 1400, 2280, 320, 400, 1920, 240], [320, 2540, -12, -88, 620, -8000, -40000, -36, 420], [1160, -84, 620, 160, -52, 520, 1000, 600, -24], [0, -160, -156, -148, 1120, -24, 360, -12, 20], [-84, -76, -4, -108, 820, -32, 1960, 560, 440], [-80, -40, -64, 140, -36, -72, 20, 3340, 820]]
INFO:root:Count MDP: 4
INFO:root:Ship 2 command: o actual position: Position(14, 27) new position: Position(14, 27)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 3), (4, 5), (4, 7), (4, 8), (5, 1), (5, 2), (5, 4), (5, 5), (5, 6), (5, 8), (6, 3), (6, 5), (6, 7), (6, 8), (7, 3), (7, 5), (7, 6), (7, 7), (7, 8), (8, 2), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[5340, 2780, 2520, 2960, 6700, 4560, 1420, 3160, 2960], [1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800, 700], [320, 380, 140, 320, 920, 420, 180, 920, -12], [2480, 20, 1400, 2280, 320, 400, 1920, 240, 1520], [2540, -12, -88, -40000, -160, -40000, -36, 420, 780], [-84, 620, 160, -52, 520, 1000, 600, -24, 740], [-160, -156, -148, 1120, -24, 360, -12, 20, 400], [-76, -4, -108, 820, -32, 1960, 560, 440, 1500], [-40, -64, 140, -36, -72, 20, 3340, 820, 880]]
INFO:root:Count MDP: 4
INFO:root:Ship 4 command: e actual position: Position(14, 28) new position: Position(15, 28)
INFO:root:Time: 0.024438858032226562
INFO:root:=============== TURN 007 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 2), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 3), (5, 4), (5, 5), (5, 7), (5, 8), (6, 2), (6, 4), (6, 6), (6, 7), (6, 8), (7, 2), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2780, 2520, 2960, 6700, 4560, 1420, 3160, 2960, 3160], [2000, 2140, 1580, 4600, 1660, 2440, 1800, 700, 1900], [380, 140, 320, 920, 420, 180, 920, -12, 860], [20, 1400, 2280, 320, 400, 1920, 240, 1520, 1600], [-12, -88, -40000, -160, -36, -36, 420, 780, 1380], [620, 160, -52, -40000, 1000, 600, -24, 740, 2980], [-156, -148, 1120, -24, 360, -12, 20, 400, 780], [-4, -108, 820, -32, 1960, 560, 440, 1500, 940], [-64, 140, -36, -72, 20, 3340, 820, 880, 2520]]
INFO:root:Count MDP: 2
INFO:root:Ship 0 command: s actual position: Position(14, 29) new position: Position(14, 30)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 4), (4, 8), (5, 0), (5, 2), (5, 3), (5, 5), (5, 6), (5, 7), (6, 4), (6, 6), (6, 8), (7, 4), (7, 6), (7, 7), (7, 8), (8, 3), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[3600, 5340, 2780, 2520, 2960, 6700, 4560, 1420, 3160], [1460, 1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800], [700, 320, 380, 140, 320, 920, 420, 180, 920], [1200, 2480, 20, 1400, 2280, 320, 400, 1920, 240], [320, 2540, -12, -88, 260, -160, -36, -8000, 420], [1160, -84, 620, 160, -52, -40000, 1000, 600, -24], [0, -160, -156, -148, 1120, -24, 360, -12, 20], [-84, -76, -4, -108, 820, -32, 1960, 560, 440], [-80, -40, -64, 140, -36, -72, 20, 3340, 820]]
INFO:root:Count MDP: 4
INFO:root:Ship 2 command: o actual position: Position(14, 27) new position: Position(14, 27)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 3), (3, 7), (3, 8), (4, 1), (4, 2), (4, 4), (4, 5), (4, 6), (4, 8), (5, 3), (5, 5), (5, 7), (5, 8), (6, 3), (6, 5), (6, 6), (6, 7), (6, 8), (7, 2), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 2), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800, 700], [320, 380, 140, 320, 920, 420, 180, 920, -12], [2480, 20, 1400, 2280, 320, 400, 1920, 240, 1520], [2540, -12, -88, -40000, -160, -36, -8000, 420, 780], [-84, 620, 160, -52, 20000, 1000, 600, -24, 740], [-160, -156, -148, 1120, -24, 360, -12, 20, 400], [-76, -4, -108, 820, -32, 1960, 560, 440, 1500], [-40, -64, 140, -36, -72, 20, 3340, 820, 880], [2440, -40, 440, -88, -96, 0, 920, 5040, 3580]]
INFO:root:Count MDP: 3
INFO:root:Ship 4 command: o actual position: Position(15, 28) new position: Position(15, 28)
INFO:root:Time: 0.021502256393432617
INFO:root:=============== TURN 008 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 8), (5, 0), (5, 2), (5, 3), (5, 5), (5, 6), (5, 7), (6, 4), (6, 6), (6, 8), (7, 4), (7, 6), (7, 7), (7, 8), (8, 3), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[3600, 5340, 2780, 2520, 2960, 6700, 4560, 1420, 3160], [1460, 1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800], [700, 320, 380, 140, 320, 920, 420, 180, 920], [1200, 2480, 20, 1400, 2280, 320, 400, 1920, 240], [320, 2540, -12, -88, -4, -8000, -36, -8000, 420], [1160, -84, 620, 160, -52, -40000, 1000, 600, -24], [0, -160, -156, -148, 1120, -24, 360, -12, 20], [-84, -76, -4, -108, 820, -32, 1960, 560, 440], [-80, -40, -64, 140, -36, -72, 20, 3340, 820]]
INFO:root:Count MDP: 4
INFO:root:Ship 2 command: w actual position: Position(14, 27) new position: Position(13, 27)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 7), (3, 8), (4, 1), (4, 2), (4, 4), (4, 5), (4, 6), (4, 8), (5, 3), (5, 5), (5, 7), (5, 8), (6, 3), (6, 5), (6, 6), (6, 7), (6, 8), (7, 2), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 2), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800, 700], [320, 380, 140, 320, 920, 420, 180, 920, -12], [2480, 20, 1400, -40000, 320, 400, 1920, 240, 1520], [2540, -12, -88, -4, -8000, -36, -8000, 420, 780], [-84, 620, 160, -52, 180, 1000, 600, -24, 740], [-160, -156, -148, 1120, -24, 360, -12, 20, 400], [-76, -4, -108, 820, -32, 1960, 560, 440, 1500], [-40, -64, 140, -36, -72, 20, 3340, 820, 880], [2440, -40, 440, -88, -96, 0, 920, 5040, 3580]]
INFO:root:Count MDP: 4
INFO:root:Ship 4 command: o actual position: Position(15, 28) new position: Position(15, 28)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 2), (5, 3), (5, 4), (5, 6), (5, 7), (5, 8), (6, 1), (6, 3), (6, 5), (6, 6), (6, 7), (6, 8), (7, 1), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2520, 2960, 6700, 4560, 1420, 3160, 2960, 3160, 7080], [2140, 1580, 4600, 1660, 2440, 1800, 700, 1900, 5900], [140, 320, 920, 420, 180, 920, -12, 860, 4340], [1400, -40000, 320, 400, 1920, 240, 1520, 1600, 2080], [-88, -4, -8000, -36, -36, 420, 780, 1380, 1760], [160, -52, -40000, 1000, 600, -24, 740, 2980, 2140], [-148, 1120, -24, 360, -12, 20, 400, 780, 660], [-108, 820, -32, 1960, 560, 440, 1500, 940, 1880], [140, -36, -72, 20, 3340, 820, 880, 2520, 6740]]
INFO:root:Count MDP: 3
INFO:root:Ship 0 command: w actual position: Position(14, 30) new position: Position(13, 30)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 7), (4, 8), (5, 1), (5, 2), (5, 4), (5, 5), (5, 6), (5, 8), (6, 3), (6, 5), (6, 7), (6, 8), (7, 3), (7, 5), (7, 6), (7, 7), (7, 8), (8, 2), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[5340, 2780, 2520, 2960, 6700, 4560, 1420, 3160, 2960], [1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800, 700], [320, 380, 140, 320, 920, 420, 180, 920, -12], [2480, 20, 1400, -40000, 320, 400, -40000, 240, 1520], [2540, -12, -88, -4, -160, -36, -36, 420, 780], [-84, 620, 160, -52, -40000, 1000, 600, -24, 740], [-160, -156, -148, 1120, -24, 360, -12, 20, 400], [-76, -4, -108, 820, -32, 1960, 560, 440, 1500], [-40, -64, 140, -36, -72, 20, 3340, 820, 880]]
INFO:root:Count MDP: 4
INFO:root:Ship 6 command: n actual position: Position(14, 28) new position: Position(14, 27)
INFO:root:Time: 0.03322410583496094
INFO:root:=============== TURN 009 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 7), (3, 8), (4, 1), (4, 2), (4, 5), (4, 6), (4, 8), (5, 3), (5, 5), (5, 7), (5, 8), (6, 3), (6, 5), (6, 6), (6, 7), (6, 8), (7, 2), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 2), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800, 700], [320, 380, 140, 320, 920, 420, 180, 920, -12], [2480, 20, 1400, -40000, 320, 400, -40000, 240, 1520], [2540, -12, -88, -8000, -160, -36, -36, 420, 780], [-84, 620, 160, -52, -16, 1000, 600, -24, 740], [-160, -156, -148, 1120, -24, 360, -12, 20, 400], [-76, -4, -108, 820, -32, 1960, 560, 440, 1500], [-40, -64, 140, -36, -72, 20, 3340, 820, 880], [2440, -40, 440, -88, -96, 0, 920, 5040, 3580]]
INFO:root:Count MDP: 4
INFO:root:Ship 4 command: e actual position: Position(15, 28) new position: Position(16, 28)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 8), (6, 0), (6, 2), (6, 3), (6, 6), (6, 7), (7, 4), (7, 6), (7, 8), (8, 4), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[5400, 10060, 9180, 3360, 3600, 2900, 2800, 1700, 2520], [3600, 5340, 2780, 2520, 2960, 6700, 4560, 1420, 3160], [1460, 1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800], [700, 320, 380, 140, 320, 920, 420, 180, 920], [1200, 2480, 20, 1400, 2280, 320, 400, -40000, 240], [320, 2540, -12, -88, -8000, -160, -36, -36, 420], [1160, -84, 620, 160, -52, -16, 1000, 600, -24], [0, -160, -156, -148, 1120, -8000, 360, -12, 20], [-84, -76, -4, -108, 820, -32, 1960, 560, 440]]
INFO:root:Count MDP: 2
INFO:root:Ship 2 command: o actual position: Position(13, 27) new position: Position(13, 27)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 3), (6, 4), (6, 6), (6, 7), (6, 8), (7, 1), (7, 3), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[3360, 3600, 2900, 2800, 1700, 2520, 3880, 7680, 3400], [2520, 2960, 6700, 4560, 1420, 3160, 2960, 3160, 7080], [2140, 1580, 4600, 1660, 2440, 1800, 700, 1900, 5900], [140, 320, 920, 420, 180, 920, -12, 860, 4340], [1400, -40000, 320, 400, 1920, 240, 1520, 1600, 2080], [-88, -8000, -160, -36, -36, 420, 780, 1380, 1760], [160, -52, -16, 1000, 600, -24, 740, 2980, 2140], [-148, 1120, -8000, 360, -12, 20, 400, 780, 660], [-108, 820, -32, 1960, 560, 440, 1500, 940, 1880]]
INFO:root:Count MDP: 4
INFO:root:Ship 0 command: o actual position: Position(13, 30) new position: Position(13, 30)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 8), (5, 0), (5, 2), (5, 3), (5, 6), (5, 7), (6, 4), (6, 6), (6, 8), (7, 4), (7, 6), (7, 7), (7, 8), (8, 3), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[3600, 5340, 2780, 2520, 2960, 6700, 4560, 1420, 3160], [1460, 1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800], [700, 320, 380, 140, 320, 920, 420, 180, 920], [1200, 2480, 20, 1400, -40000, 320, 400, -40000, 240], [320, 2540, -12, -88, 4000, -160, -36, -36, 420], [1160, -84, 620, 160, -52, -16, 1000, 600, -24], [0, -160, -156, -148, 1120, -8000, 360, -12, 20], [-84, -76, -4, -108, 820, -32, 1960, 560, 440], [-80, -40, -64, 140, -36, -72, 20, 3340, 820]]
INFO:root:Count MDP: 4
INFO:root:Ship 6 command: o actual position: Position(14, 27) new position: Position(14, 27)
INFO:root:Time: 0.033734798431396484
INFO:root:=============== TURN 010 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 8), (6, 0), (6, 2), (6, 3), (6, 6), (6, 7), (7, 4), (7, 6), (7, 8), (8, 4), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[5400, 10060, 9180, 3360, 3600, 2900, 2800, 1700, 2520], [3600, 5340, 2780, 2520, 2960, 6700, 4560, 1420, 3160], [1460, 1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800], [700, 320, 380, 140, 320, 920, 420, 180, 920], [1200, 2480, 20, 1400, 1500, 320, 400, -40000, 240], [320, 2540, -12, -88, -8000, -8000, -36, -36, 420], [1160, -84, 620, 160, -52, -16, 1000, 600, -24], [0, -160, -156, -148, 1120, -8000, 360, -12, 20], [-84, -76, -4, -108, 820, -32, 1960, 560, 440]]
INFO:root:Count MDP: 4
INFO:root:Ship 2 command: o actual position: Position(13, 27) new position: Position(13, 27)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 3), (6, 4), (6, 6), (6, 7), (6, 8), (7, 1), (7, 3), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[3360, 3600, 2900, 2800, 1700, 2520, 3880, 7680, 3400], [2520, 2960, 6700, 4560, 1420, 3160, 2960, 3160, 7080], [2140, 1580, 4600, 1660, 2440, 1800, 700, 1900, 5900], [140, 320, 920, 420, 180, 920, -12, 860, 4340], [1400, -40000, 320, 400, 1240, 240, 1520, 1600, 2080], [-88, -8000, -8000, -36, -36, 420, 780, 1380, 1760], [160, -52, -16, 1000, 600, -24, 740, 2980, 2140], [-148, 1120, -8000, 360, -12, 20, 400, 780, 660], [-108, 820, -32, 1960, 560, 440, 1500, 940, 1880]]
INFO:root:Count MDP: 2
INFO:root:Ship 0 command: o actual position: Position(13, 30) new position: Position(13, 30)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 7), (2, 8), (3, 1), (3, 2), (3, 5), (3, 6), (3, 8), (4, 3), (4, 5), (4, 7), (4, 8), (5, 3), (5, 5), (5, 6), (5, 7), (5, 8), (6, 2), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 2), (7, 6), (7, 7), (7, 8), (8, 0), (8, 1), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[320, 380, 140, 320, 920, 420, 180, 920, -12], [2480, 20, 1400, -40000, 320, 400, -40000, 240, 1520], [2540, -12, -88, -8000, -8000, -36, -36, 420, 780], [-84, 620, 160, -52, -16, 1000, 600, -24, 740], [-160, -156, -148, 1120, -24, 360, -12, 20, 400], [-76, -4, -108, 820, -32, 1960, 560, 440, 1500], [-40, -64, 140, -36, -72, 20, 3340, 820, 880], [2440, -40, 440, -88, -96, 0, 920, 5040, 3580], [2820, 1920, -88, -60, -100, 840, 2760, 2500, 8920]]
INFO:root:Count MDP: 4
INFO:root:Ship 4 command: e actual position: Position(16, 28) new position: Position(17, 28)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 7), (4, 8), (5, 1), (5, 2), (5, 5), (5, 6), (5, 8), (6, 3), (6, 5), (6, 7), (6, 8), (7, 3), (7, 5), (7, 6), (7, 7), (7, 8), (8, 2), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[5340, 2780, 2520, 2960, 6700, 4560, 1420, 3160, 2960], [1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800, 700], [320, 380, 140, 320, 920, 420, 180, 920, -12], [2480, 20, 1400, -40000, 320, 400, -40000, 240, 1520], [2540, -12, -88, -8000, -160, -36, -36, 420, 780], [-84, 620, 160, -52, -16, 1000, 600, -24, 740], [-160, -156, -148, 1120, -24, 360, -12, 20, 400], [-76, -4, -108, 820, -8000, 1960, 560, 440, 1500], [-40, -64, 140, -36, -72, 20, 3340, 820, 880]]
INFO:root:Count MDP: 4
INFO:root:Ship 8 command: e actual position: Position(14, 28) new position: Position(15, 28)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 8), (5, 0), (5, 2), (5, 3), (5, 6), (5, 7), (6, 4), (6, 6), (6, 8), (7, 4), (7, 6), (7, 7), (7, 8), (8, 3), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[3600, 5340, 2780, 2520, 2960, 6700, 4560, 1420, 3160], [1460, 1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800], [700, 320, 380, 140, 320, 920, 420, 180, 920], [1200, 2480, 20, 1400, -40000, 320, 400, -40000, 240], [320, 2540, -12, -88, -44, -160, -36, -36, 420], [1160, -84, 620, 160, -52, -8000, 1000, 600, -24], [0, -160, -156, -148, 1120, -24, 360, -12, 20], [-84, -76, -4, -108, 820, -8000, 1960, 560, 440], [-80, -40, -64, 140, -36, -72, 20, 3340, 820]]
INFO:root:Count MDP: 4
INFO:root:Ship 6 command: n actual position: Position(14, 27) new position: Position(14, 26)
INFO:root:Time: 0.04450845718383789
INFO:root:=============== TURN 011 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 8), (6, 0), (6, 2), (6, 3), (6, 6), (6, 7), (7, 4), (7, 6), (7, 8), (8, 4), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[5400, 10060, 9180, 3360, 3600, 2900, 2800, 1700, 2520], [3600, 5340, 2780, 2520, 2960, 6700, 4560, 1420, 3160], [1460, 1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800], [700, 320, 380, 140, 320, 920, 420, 180, 920], [1200, 2480, 20, 1400, 920, 320, 400, -40000, 240], [320, 2540, -12, -8000, -44, -160, -36, -36, 420], [1160, -84, 620, 160, -52, -8000, 1000, 600, -24], [0, -160, -156, -148, 1120, -24, 360, -12, 20], [-84, -76, -4, -108, 820, -8000, 1960, 560, 440]]
INFO:root:Count MDP: 4
INFO:root:Ship 2 command: o actual position: Position(13, 27) new position: Position(13, 27)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 3), (6, 4), (6, 6), (6, 7), (6, 8), (7, 1), (7, 3), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[3360, 3600, 2900, 2800, 1700, 2520, 3880, 7680, 3400], [2520, 2960, 6700, 4560, 1420, 3160, 2960, 3160, 7080], [2140, 1580, 4600, 1660, 2440, 1800, 700, 1900, 5900], [140, 320, 920, 420, 180, 920, -12, 860, 4340], [1400, -40000, 320, 400, 720, 240, 1520, 1600, 2080], [-8000, -44, -160, -36, -36, 420, 780, 1380, 1760], [160, -52, -8000, 1000, 600, -24, 740, 2980, 2140], [-148, 1120, -24, 360, -12, 20, 400, 780, 660], [-108, 820, -8000, 1960, 560, 440, 1500, 940, 1880]]
INFO:root:Count MDP: 2
INFO:root:Ship 0 command: o actual position: Position(13, 30) new position: Position(13, 30)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 7), (1, 8), (2, 1), (2, 2), (2, 5), (2, 6), (2, 8), (3, 3), (3, 5), (3, 7), (3, 8), (4, 3), (4, 5), (4, 6), (4, 7), (4, 8), (5, 2), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 2), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 2), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2480, 20, 1400, -40000, 320, 400, -40000, 240, 1520], [2540, -12, -8000, -44, -160, -36, -36, 420, 780], [-84, 620, 160, -52, -8000, 1000, 600, -24, 740], [-160, -156, -148, 1120, -24, 360, -12, 20, 400], [-76, -4, -108, 820, -32, 1960, 560, 440, 1500], [-40, -64, 140, -36, -72, 20, 3340, 820, 880], [2440, -40, 440, -88, -96, 0, 920, 5040, 3580], [2820, 1920, -88, -60, -100, 840, 2760, 2500, 8920], [460, -12, 660, -20, -44, -44, 460, 2140, 5240]]
INFO:root:Count MDP: 4
INFO:root:Ship 4 command: s actual position: Position(17, 28) new position: Position(17, 29)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 7), (3, 8), (4, 1), (4, 2), (4, 5), (4, 6), (4, 8), (5, 3), (5, 5), (5, 7), (5, 8), (6, 3), (6, 5), (6, 6), (6, 7), (6, 8), (7, 2), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 2), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800, 700], [320, 380, 140, 320, 920, 420, 180, 920, -12], [2480, 20, 1400, -40000, 320, 400, -40000, 240, 1520], [2540, -12, -8000, -44, -160, -36, -36, 420, 780], [-84, 620, 160, -52, 4000, 1000, 600, -24, 740], [-160, -156, -148, 1120, -24, 360, -12, 20, 400], [-76, -4, -108, 820, -32, -40000, 560, 440, 1500], [-40, -64, 140, -36, -72, 20, 3340, 820, 880], [2440, -40, 440, -88, -96, 0, 920, 5040, 3580]]
INFO:root:Count MDP: 4
INFO:root:Ship 8 command: o actual position: Position(15, 28) new position: Position(15, 28)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (5, 0), (5, 1), (5, 3), (5, 4), (5, 7), (5, 8), (6, 0), (6, 5), (6, 7), (7, 0), (7, 5), (7, 7), (7, 8), (8, 0), (8, 4), (8, 7), (8, 8)]
INFO:root:Rewards:
[[5560, 3600, 5340, 2780, 2520, 2960, 6700, 4560, 1420], [3880, 1460, 1700, 2000, 2140, 1580, 4600, 1660, 2440], [-12, 700, 320, 380, 140, 320, 920, 420, 180], [2140, 1200, 2480, 20, 1400, -40000, 320, 400, -40000], [1860, 320, 2540, -12, -88, -44, -160, -36, -36], [900, 1160, -84, 620, 160, -52, -8000, 1000, 600], [980, 0, -160, -156, -148, 1120, -24, 360, -12], [360, -84, -76, -4, -108, 820, -32, -40000, 560], [180, -80, -40, -64, 140, -36, -72, 20, 3340]]
INFO:root:Count MDP: 4
INFO:root:Ship 6 command: n actual position: Position(14, 26) new position: Position(14, 25)
INFO:root:Time: 0.046716928482055664
INFO:root:=============== TURN 012 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 8), (6, 0), (6, 2), (6, 3), (6, 6), (6, 7), (7, 4), (7, 6), (7, 8), (8, 4), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[5400, 10060, 9180, 3360, 3600, 2900, 2800, 1700, 2520], [3600, 5340, 2780, 2520, 2960, 6700, 4560, 1420, 3160], [1460, 1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800], [700, 320, 380, 140, 320, 920, 420, 180, 920], [1200, 2480, 20, 1400, 480, 320, 400, -40000, 240], [320, 2540, -8000, -88, -44, -160, -36, -36, 420], [1160, -84, 620, 160, -52, -8000, 1000, 600, -24], [0, -160, -156, -148, 1120, -24, 360, -12, 20], [-84, -76, -4, -108, 820, -32, -40000, 560, 440]]
INFO:root:Count MDP: 3
INFO:root:Ship 2 command: o actual position: Position(13, 27) new position: Position(13, 27)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 3), (6, 4), (6, 6), (6, 7), (6, 8), (7, 1), (7, 3), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[3360, 3600, 2900, 2800, 1700, 2520, 3880, 7680, 3400], [2520, 2960, 6700, 4560, 1420, 3160, 2960, 3160, 7080], [2140, 1580, 4600, 1660, 2440, 1800, 700, 1900, 5900], [140, 320, 920, 420, 180, 920, -12, 860, 4340], [1400, -40000, 320, 400, 340, 240, 1520, 1600, 2080], [-88, -44, -160, -36, -36, 420, 780, 1380, 1760], [160, -52, -8000, 1000, 600, -24, 740, 2980, 2140], [-148, 1120, -24, 360, -12, 20, 400, 780, 660], [-108, 820, -32, -40000, 560, 440, 1500, 940, 1880]]
INFO:root:Count MDP: 2
INFO:root:Ship 0 command: o actual position: Position(13, 30) new position: Position(13, 30)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 4), (2, 5), (2, 7), (2, 8), (3, 2), (3, 4), (3, 6), (3, 7), (3, 8), (4, 2), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 1), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 1), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[20, 1400, -40000, 320, 400, -40000, 240, 1520, 1600], [-8000, -88, -44, -160, -36, -36, 420, 780, 1380], [620, 160, -52, -8000, 1000, 600, -24, 740, 2980], [-156, -148, 1120, -24, 360, -12, 20, 400, 780], [-4, -108, 820, -32, 1960, 560, 440, 1500, 940], [-64, 140, -36, -72, 20, 3340, 820, 880, 2520], [-40, 440, -88, -96, 0, 920, 5040, 3580, 2420], [1920, -88, -60, -100, 840, 2760, 2500, 8920, 3180], [-12, 660, -20, -44, -44, 460, 2140, 5240, 2800]]
INFO:root:Count MDP: 4
INFO:root:Ship 4 command: o actual position: Position(17, 29) new position: Position(17, 29)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 7), (3, 8), (4, 1), (4, 2), (4, 5), (4, 6), (4, 8), (5, 3), (5, 5), (5, 7), (5, 8), (6, 3), (6, 5), (6, 6), (6, 7), (6, 8), (7, 2), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 2), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800, 700], [320, 380, 140, 320, 920, 420, 180, 920, -12], [2480, 20, 1400, -40000, 320, 400, -40000, 240, 1520], [2540, -8000, -88, -44, -160, -36, -36, 420, 780], [-84, 620, 160, -52, -52, 1000, 600, -24, 740], [-160, -156, -148, 1120, -24, 360, -12, 20, 400], [-76, -4, -108, 820, -32, -40000, 560, 440, 1500], [-40, -64, 140, -36, -72, 20, 3340, 820, 880], [2440, -40, 440, -88, -96, 0, 920, 5040, 3580]]
INFO:root:Count MDP: 3
INFO:root:Ship 8 command: s actual position: Position(15, 28) new position: Position(15, 29)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (5, 1), (5, 2), (5, 4), (5, 5), (5, 8), (6, 1), (6, 6), (6, 8), (7, 0), (7, 1), (7, 6), (7, 8), (8, 1), (8, 5), (8, 8)]
INFO:root:Rewards:
[[1880, 5560, 3600, 5340, 2780, 2520, 2960, 6700, 4560], [3840, 3880, 1460, 1700, 2000, 2140, 1580, 4600, 1660], [140, -12, 700, 320, 380, 140, 320, 920, 420], [-4, 2140, 1200, 2480, 20, 1400, -40000, 320, 400], [1600, 1860, 320, 2540, -12, -88, -44, -160, -36], [-84, 900, 1160, -84, 620, 160, -52, -52, -40000], [-32, 980, 0, -160, -156, -148, 1120, -24, 360], [280, 360, -84, -76, -4, -108, 820, -32, -40000], [-52, 180, -80, -40, -64, 140, -36, -72, 20]]
INFO:root:Count MDP: 5
INFO:root:Ship 6 command: n actual position: Position(14, 25) new position: Position(14, 24)
INFO:root:Time: 0.04105114936828613
INFO:root:=============== TURN 013 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 8), (6, 0), (6, 2), (6, 3), (6, 6), (6, 7), (7, 4), (7, 6), (7, 8), (8, 4), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[5400, 10060, 9180, 3360, 3600, 2900, 2800, 1700, 2520], [3600, 5340, 2780, 2520, 2960, 6700, 4560, 1420, 3160], [1460, 1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800], [700, 320, 380, 140, 320, 920, 420, 180, 920], [1200, 2480, 20, 1400, 160, 320, 400, -40000, 240], [320, -40000, -12, -88, -44, -160, -36, -36, 420], [1160, -84, 620, 160, -52, -52, -40000, 600, -24], [0, -160, -156, -148, 1120, -24, 360, -12, 20], [-84, -76, -4, -108, 820, -32, -40000, 560, 440]]
INFO:root:Count MDP: 4
INFO:root:Ship 2 command: o actual position: Position(13, 27) new position: Position(13, 27)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 4), (4, 5), (4, 7), (4, 8), (5, 2), (5, 4), (5, 6), (5, 7), (5, 8), (6, 2), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 1), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2000, 2140, 1580, 4600, 1660, 2440, 1800, 700, 1900], [380, 140, 320, 920, 420, 180, 920, -12, 860], [20, 1400, -40000, 320, 400, -40000, 240, 1520, 1600], [-12, -88, -44, -160, -36, -36, 420, 780, 1380], [620, 160, -52, -52, 20000, 600, -24, 740, 2980], [-156, -148, 1120, -24, 360, -12, 20, 400, 780], [-4, -108, 820, -32, -40000, 560, 440, 1500, 940], [-64, 140, -36, -72, 20, 3340, 820, 880, 2520], [-40, 440, -88, -96, 0, 920, 5040, 3580, 2420]]
INFO:root:Count MDP: 4
INFO:root:Ship 8 command: o actual position: Position(15, 29) new position: Position(15, 29)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 3), (6, 4), (6, 6), (6, 7), (6, 8), (7, 1), (7, 3), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[3360, 3600, 2900, 2800, 1700, 2520, 3880, 7680, 3400], [2520, 2960, 6700, 4560, 1420, 3160, 2960, 3160, 7080], [2140, 1580, 4600, 1660, 2440, 1800, 700, 1900, 5900], [140, 320, 920, 420, 180, 920, -12, 860, 4340], [1400, -40000, 320, 400, 40, 240, 1520, 1600, 2080], [-88, -44, -160, -36, -36, 420, 780, 1380, 1760], [160, -52, -52, -40000, 600, -24, 740, 2980, 2140], [-148, 1120, -24, 360, -12, 20, 400, 780, 660], [-108, 820, -32, -40000, 560, 440, 1500, 940, 1880]]
INFO:root:Count MDP: 4
INFO:root:Ship 0 command: o actual position: Position(13, 30) new position: Position(13, 30)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 4), (2, 5), (2, 7), (2, 8), (3, 2), (3, 4), (3, 6), (3, 7), (3, 8), (4, 2), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 1), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 1), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[20, 1400, -40000, 320, 400, -40000, 240, 1520, 1600], [-12, -88, -44, -160, -36, -36, 420, 780, 1380], [620, 160, -52, -52, -40000, 600, -24, 740, 2980], [-156, -148, 1120, -24, 360, -12, 20, 400, 780], [-4, -108, 820, -32, 1260, 560, 440, 1500, 940], [-64, 140, -36, -72, 20, 3340, 820, 880, 2520], [-40, 440, -88, -96, 0, 920, 5040, 3580, 2420], [1920, -88, -60, -100, 840, 2760, 2500, 8920, 3180], [-12, 660, -20, -44, -44, 460, 2140, 5240, 2800]]
INFO:root:Count MDP: 4
INFO:root:Ship 4 command: o actual position: Position(17, 29) new position: Position(17, 29)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 1), (4, 2), (4, 3), (4, 4), (5, 0), (5, 2), (5, 3), (5, 5), (5, 6), (6, 2), (6, 7), (7, 1), (7, 2), (7, 7), (8, 2), (8, 6)]
INFO:root:Rewards:
[[1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960, 6700], [1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580, 4600], [1060, 140, -12, 700, 320, 380, 140, 320, 920], [860, -4, 2140, 1200, 2480, 20, 1400, -40000, 320], [-120, 1600, 1860, 320, 20000, -12, -88, -44, -160], [40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, 1120, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72]]
INFO:root:Count MDP: 6
INFO:root:Ship 6 command: o actual position: Position(14, 24) new position: Position(14, 24)
INFO:root:Time: 0.04690241813659668
INFO:root:=============== TURN 014 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 5), (4, 6), (4, 8), (5, 0), (5, 1), (5, 8), (6, 0), (6, 2), (6, 3), (6, 6), (6, 7), (7, 4), (7, 6), (7, 8), (8, 4), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[5400, 10060, 9180, 3360, 3600, 2900, 2800, 1700, 2520], [3600, 5340, 2780, 2520, 2960, 6700, 4560, 1420, 3160], [1460, 1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800], [700, 320, 380, 140, 320, 920, 420, 180, 920], [1200, 2480, 20, 1400, -16, 320, 400, -8000, 240], [320, -40000, -12, -88, -44, -160, -36, -36, 420], [1160, -84, 620, 160, -52, -52, -40000, 600, -24], [0, -160, -156, -148, 1120, -24, 360, -12, 20], [-84, -76, -4, -108, 820, -32, -40000, 560, 440]]
INFO:root:Count MDP: 4
INFO:root:Ship 2 command: n actual position: Position(13, 27) new position: Position(13, 26)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 8), (2, 0), (2, 1), (2, 3), (2, 4), (2, 6), (2, 7), (2, 8), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 4), (4, 5), (4, 7), (4, 8), (5, 2), (5, 4), (5, 6), (5, 7), (5, 8), (6, 2), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 1), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2000, 2140, 1580, 4600, 1660, 2440, 1800, 700, 1900], [380, 140, 320, 920, 420, 180, 920, -12, 860], [20, -40000, -16, 320, 400, -8000, 240, 1520, 1600], [-12, -88, -44, -160, -36, -36, 420, 780, 1380], [620, 160, -52, -52, 540, 600, -24, 740, 2980], [-156, -148, 1120, -24, 360, -12, 20, 400, 780], [-4, -108, 820, -32, -40000, 560, 440, 1500, 940], [-64, 140, -36, -72, 20, 3340, 820, 880, 2520], [-40, 440, -88, -96, 0, 920, 5040, 3580, 2420]]
INFO:root:Count MDP: 4
INFO:root:Ship 8 command: o actual position: Position(15, 29) new position: Position(15, 29)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 7), (3, 8), (4, 0), (4, 2), (4, 3), (4, 5), (4, 6), (4, 7), (4, 8), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 3), (6, 4), (6, 6), (6, 7), (6, 8), (7, 1), (7, 3), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[3360, 3600, 2900, 2800, 1700, 2520, 3880, 7680, 3400], [2520, 2960, 6700, 4560, 1420, 3160, 2960, 3160, 7080], [2140, 1580, 4600, 1660, 2440, 1800, 700, 1900, 5900], [140, 320, 920, 420, 180, 920, -12, 860, 4340], [-40000, -16, 320, 400, -36, 240, 1520, 1600, 2080], [-88, -44, -160, -36, -36, 420, 780, 1380, 1760], [160, -52, -52, -40000, 600, -24, 740, 2980, 2140], [-148, 1120, -24, 360, -12, 20, 400, 780, 660], [-108, 820, -32, -40000, 560, 440, 1500, 940, 1880]]
INFO:root:Count MDP: 3
INFO:root:Ship 0 command: e actual position: Position(13, 30) new position: Position(14, 30)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 3), (0, 4), (0, 6), (0, 7), (0, 8), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 4), (2, 5), (2, 7), (2, 8), (3, 2), (3, 4), (3, 6), (3, 7), (3, 8), (4, 2), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 1), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 1), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[20, -40000, -16, 320, 400, -36, 240, 1520, 1600], [-12, -88, -44, -160, -36, -8000, 420, 780, 1380], [620, 160, -52, -52, -40000, 600, -24, 740, 2980], [-156, -148, 1120, -24, 360, -12, 20, 400, 780], [-4, -108, 820, -32, 740, 560, 440, 1500, 940], [-64, 140, -36, -72, 20, 3340, 820, 880, 2520], [-40, 440, -88, -96, 0, 920, 5040, 3580, 2420], [1920, -88, -60, -100, 840, 2760, 2500, 8920, 3180], [-12, 660, -20, -44, -44, 460, 2140, 5240, 2800]]
INFO:root:Count MDP: 4
INFO:root:Ship 4 command: o actual position: Position(17, 29) new position: Position(17, 29)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 8), (4, 1), (4, 2), (4, 3), (4, 4), (5, 0), (5, 2), (5, 3), (5, 5), (5, 6), (6, 2), (6, 7), (7, 1), (7, 2), (7, 7), (8, 2), (8, 6)]
INFO:root:Rewards:
[[1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960, 6700], [1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580, 4600], [1060, 140, -12, 700, 320, 380, 140, 320, 920], [860, -4, 2140, 1200, 2480, 20, -40000, -16, 320], [-120, 1600, 1860, 320, 1700, -12, -88, -44, -160], [40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, 1120, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72]]
INFO:root:Count MDP: 5
INFO:root:Ship 6 command: o actual position: Position(14, 24) new position: Position(14, 24)
INFO:root:Time: 0.04690122604370117
INFO:root:=============== TURN 015 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 7), (2, 8), (3, 0), (3, 2), (3, 3), (3, 5), (3, 6), (3, 7), (3, 8), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 3), (5, 4), (5, 6), (5, 7), (5, 8), (6, 1), (6, 3), (6, 5), (6, 6), (6, 7), (6, 8), (7, 1), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2520, 2960, 6700, 4560, 1420, 3160, 2960, 3160, 7080], [2140, 1580, 4600, 1660, 2440, 1800, 700, 1900, 5900], [140, 320, 920, 420, 180, 920, -12, 860, 4340], [-40000, -16, 320, 400, -36, 240, 1520, 1600, 2080], [-88, -44, -160, -36, -36, 420, 780, 1380, 1760], [160, -52, -52, -40000, 600, -24, 740, 2980, 2140], [-148, 1120, -24, 360, -12, 20, 400, 780, 660], [-108, 820, -32, -40000, 560, 440, 1500, 940, 1880], [140, -36, -72, 20, 3340, 820, 880, 2520, 6740]]
INFO:root:Count MDP: 4
INFO:root:Ship 0 command: e actual position: Position(14, 30) new position: Position(15, 30)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 8), (2, 0), (2, 1), (2, 3), (2, 4), (2, 6), (2, 7), (2, 8), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 4), (4, 5), (4, 7), (4, 8), (5, 2), (5, 4), (5, 6), (5, 7), (5, 8), (6, 2), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 1), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2000, 2140, 1580, 4600, 1660, 2440, 1800, 700, 1900], [380, 140, 320, 920, 420, 180, 920, -12, 860], [20, -40000, -16, 320, 400, -36, 240, 1520, 1600], [-12, -88, -44, -160, -36, -36, 420, 780, 1380], [620, 160, -52, -52, 200, -40000, -24, 740, 2980], [-156, -148, 1120, -24, 360, -12, 20, 400, 780], [-4, -108, 820, -32, -40000, 560, 440, 1500, 940], [-64, 140, -36, -72, 20, 3340, 820, 880, 2520], [-40, 440, -88, -96, 0, 920, 5040, 3580, 2420]]
INFO:root:Count MDP: 5
INFO:root:Ship 8 command: o actual position: Position(15, 29) new position: Position(15, 29)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 3), (0, 4), (0, 6), (0, 7), (0, 8), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 4), (2, 5), (2, 7), (2, 8), (3, 2), (3, 4), (3, 6), (3, 7), (3, 8), (4, 2), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 1), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 1), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[20, -40000, -16, 320, 400, -36, 240, 1520, 1600], [-12, -88, -44, -160, -36, -36, 420, 780, 1380], [620, 160, -52, -52, -40000, -40000, -24, 740, 2980], [-156, -148, 1120, -24, 360, -12, 20, 400, 780], [-4, -108, 820, -32, 340, 560, 440, 1500, 940], [-64, 140, -36, -72, 20, 3340, 820, 880, 2520], [-40, 440, -88, -96, 0, 920, 5040, 3580, 2420], [1920, -88, -60, -100, 840, 2760, 2500, 8920, 3180], [-12, 660, -20, -44, -44, 460, 2140, 5240, 2800]]
INFO:root:Count MDP: 5
INFO:root:Ship 4 command: o actual position: Position(17, 29) new position: Position(17, 29)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 8), (4, 1), (4, 2), (4, 3), (4, 4), (5, 0), (5, 2), (5, 3), (5, 5), (5, 6), (6, 2), (6, 7), (7, 1), (7, 2), (7, 7), (8, 2), (8, 6)]
INFO:root:Rewards:
[[1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960, 6700], [1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580, 4600], [1060, 140, -12, 700, 320, 380, 140, 320, 920], [860, -4, 2140, 1200, 2480, 20, -40000, -16, 320], [-120, 1600, 1860, 320, 1060, -12, -88, -44, -160], [40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, 1120, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72]]
INFO:root:Count MDP: 5
INFO:root:Ship 6 command: o actual position: Position(14, 24) new position: Position(14, 24)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 4), (4, 6), (4, 7), (5, 0), (5, 1), (5, 2), (6, 0), (6, 1), (6, 3), (6, 4), (6, 7), (6, 8), (7, 0), (7, 5), (7, 7), (8, 0), (8, 5), (8, 7), (8, 8)]
INFO:root:Rewards:
[[5700, 5400, 10060, 9180, 3360, 3600, 2900, 2800, 1700], [5560, 3600, 5340, 2780, 2520, 2960, 6700, 4560, 1420], [3880, 1460, 1700, 2000, 2140, 1580, 4600, 1660, 2440], [-12, 700, 320, 380, 140, 320, 920, 420, 180], [2140, 1200, 2480, 20, 1400, -16, 320, 400, -36], [1860, 320, -40000, -12, -88, -44, -160, -36, -36], [900, 1160, -84, 620, 160, -52, -52, -40000, -40000], [980, 0, -160, -156, -148, 1120, -24, 360, -12], [360, -84, -76, -4, -108, 820, -32, -40000, 560]]
INFO:root:Count MDP: 4
INFO:root:Ship 2 command: o actual position: Position(13, 26) new position: Position(13, 26)
INFO:root:Time: 0.05375194549560547
INFO:root:=============== TURN 016 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 7), (1, 8), (2, 0), (2, 2), (2, 3), (2, 5), (2, 6), (2, 7), (2, 8), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 4), (4, 6), (4, 7), (4, 8), (5, 1), (5, 3), (5, 5), (5, 6), (5, 7), (5, 8), (6, 1), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2140, 1580, 4600, 1660, 2440, 1800, 700, 1900, 5900], [140, 320, 920, 420, 180, 920, -12, 860, 4340], [-40000, -16, 320, 400, -36, 240, 1520, 1600, 2080], [-88, -44, -160, -36, -36, 420, 780, 1380, 1760], [160, -52, -52, -8000, 600, -24, 740, 2980, 2140], [-148, 1120, -24, 360, -12, 20, 400, 780, 660], [-108, 820, -32, -40000, 560, 440, 1500, 940, 1880], [140, -36, -72, 20, 3340, 820, 880, 2520, 6740], [440, -88, -96, 0, 920, 5040, 3580, 2420, 4620]]
INFO:root:Count MDP: 4
INFO:root:Ship 0 command: o actual position: Position(15, 30) new position: Position(15, 30)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 8), (2, 0), (2, 1), (2, 3), (2, 4), (2, 6), (2, 7), (2, 8), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 5), (4, 7), (4, 8), (5, 2), (5, 4), (5, 6), (5, 7), (5, 8), (6, 2), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 1), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2000, 2140, 1580, 4600, 1660, 2440, 1800, 700, 1900], [380, 140, 320, 920, 420, 180, 920, -12, 860], [20, -40000, -16, 320, 400, -36, 240, 1520, 1600], [-12, -88, -44, -160, -36, -36, 420, 780, 1380], [620, 160, -52, -52, -12, -40000, -24, 740, 2980], [-156, -148, 1120, -24, 360, -12, 20, 400, 780], [-4, -108, 820, -32, -40000, 560, 440, 1500, 940], [-64, 140, -36, -72, 20, 3340, 820, 880, 2520], [-40, 440, -88, -96, 0, 920, 5040, 3580, 2420]]
INFO:root:Count MDP: 6
INFO:root:Ship 8 command: n actual position: Position(15, 29) new position: Position(15, 28)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 3), (0, 4), (0, 6), (0, 7), (0, 8), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 5), (2, 7), (2, 8), (3, 2), (3, 4), (3, 6), (3, 7), (3, 8), (4, 2), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 1), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 1), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[20, -40000, -16, 320, 400, -36, 240, 1520, 1600], [-12, -88, -44, -160, -36, -36, 420, 780, 1380], [620, 160, -52, -8000, -12, -40000, -24, 740, 2980], [-156, -148, 1120, -24, 360, -12, 20, 400, 780], [-4, -108, 820, -32, 40, 560, 440, 1500, 940], [-64, 140, -36, -72, 20, 3340, 820, 880, 2520], [-40, 440, -88, -96, 0, 920, 5040, 3580, 2420], [1920, -88, -60, -100, 840, 2760, 2500, 8920, 3180], [-12, 660, -20, -44, -44, 460, 2140, 5240, 2800]]
INFO:root:Count MDP: 5
INFO:root:Ship 4 command: o actual position: Position(17, 29) new position: Position(17, 29)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 8), (4, 1), (4, 2), (4, 3), (4, 4), (5, 0), (5, 2), (5, 3), (5, 5), (5, 6), (6, 2), (6, 7), (7, 1), (7, 2), (7, 7), (8, 2), (8, 6)]
INFO:root:Rewards:
[[1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960, 6700], [1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580, 4600], [1060, 140, -12, 700, 320, 380, 140, 320, 920], [860, -4, 2140, 1200, 2480, 20, -40000, -16, 320], [-120, 1600, 1860, 320, 580, -12, -88, -44, -160], [40, -84, 900, 1160, -84, 620, 160, -52, -8000], [-160, -32, 980, 0, -160, -156, -148, 1120, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72]]
INFO:root:Count MDP: 5
INFO:root:Ship 6 command: o actual position: Position(14, 24) new position: Position(14, 24)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 4), (4, 6), (4, 7), (5, 0), (5, 1), (5, 2), (6, 0), (6, 1), (6, 3), (6, 4), (6, 8), (7, 0), (7, 5), (7, 7), (8, 0), (8, 5), (8, 7), (8, 8)]
INFO:root:Rewards:
[[5700, 5400, 10060, 9180, 3360, 3600, 2900, 2800, 1700], [5560, 3600, 5340, 2780, 2520, 2960, 6700, 4560, 1420], [3880, 1460, 1700, 2000, 2140, 1580, 4600, 1660, 2440], [-12, 700, 320, 380, 140, 320, 920, 420, 180], [2140, 1200, 2480, 20, 840, -16, 320, 400, -36], [1860, 320, -40000, -12, -88, -44, -160, -36, -36], [900, 1160, -84, 620, 160, -52, -8000, -12, -40000], [980, 0, -160, -156, -148, 1120, -24, 360, -12], [360, -84, -76, -4, -108, 820, -32, -40000, 560]]
INFO:root:Count MDP: 4
INFO:root:Ship 2 command: o actual position: Position(13, 26) new position: Position(13, 26)
INFO:root:Time: 0.052774906158447266
INFO:root:=============== TURN 017 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (2, 0), (2, 1), (2, 2), (2, 4), (2, 5), (2, 7), (2, 8), (3, 0), (3, 7), (3, 8), (4, 1), (4, 2), (4, 6), (4, 8), (5, 3), (5, 5), (5, 7), (5, 8), (6, 3), (6, 6), (6, 7), (6, 8), (7, 2), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 2), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1700, 2000, 2140, 1580, 4600, 1660, 2440, 1800, 700], [320, 380, 140, 320, 920, 420, 180, 920, -12], [2480, 20, -40000, -16, 320, 400, -36, 240, 1520], [-40000, -12, -88, -44, -160, -36, -36, 420, 780], [-84, 620, 160, -52, -52, -12, -40000, -24, 740], [-160, -156, -148, 1120, -24, 360, -12, 20, 400], [-76, -4, -108, 820, -32, -8000, 560, 440, 1500], [-40, -64, 140, -36, -72, 20, 3340, 820, 880], [2440, -40, 440, -88, -96, 0, 920, 5040, 3580]]
INFO:root:Count MDP: 5
INFO:root:Ship 8 command: e actual position: Position(15, 28) new position: Position(16, 28)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 7), (1, 8), (2, 0), (2, 2), (2, 3), (2, 5), (2, 6), (2, 7), (2, 8), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 4), (4, 6), (4, 7), (4, 8), (5, 1), (5, 3), (5, 5), (5, 6), (5, 7), (5, 8), (6, 1), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2140, 1580, 4600, 1660, 2440, 1800, 700, 1900, 5900], [140, 320, 920, 420, 180, 920, -12, 860, 4340], [-40000, -16, 320, 400, -36, 240, 1520, 1600, 2080], [-88, -44, -160, -36, -36, 420, 780, 1380, 1760], [160, -52, -52, -12, 240, -24, 740, 2980, 2140], [-148, 1120, -8000, 360, -12, 20, 400, 780, 660], [-108, 820, -32, -8000, 560, 440, 1500, 940, 1880], [140, -36, -72, 20, 3340, 820, 880, 2520, 6740], [440, -88, -96, 0, 920, 5040, 3580, 2420, 4620]]
INFO:root:Count MDP: 5
INFO:root:Ship 0 command: o actual position: Position(15, 30) new position: Position(15, 30)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 3), (0, 4), (0, 6), (0, 7), (0, 8), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 5), (2, 7), (2, 8), (3, 2), (3, 4), (3, 6), (3, 7), (3, 8), (4, 2), (4, 5), (4, 6), (4, 7), (4, 8), (5, 1), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 1), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[20, -40000, -16, 320, 400, -36, 240, 1520, 1600], [-12, -88, -44, -160, -36, -36, 420, 780, 1380], [620, 160, -52, -52, -12, -40000, -24, 740, 2980], [-156, -148, 1120, -8000, 360, -12, 20, 400, 780], [-4, -108, 820, -32, -36, 560, 440, 1500, 940], [-64, 140, -36, -72, 20, 3340, 820, 880, 2520], [-40, 440, -88, -96, 0, 920, 5040, 3580, 2420], [1920, -88, -60, -100, 840, 2760, 2500, 8920, 3180], [-12, 660, -20, -44, -44, 460, 2140, 5240, 2800]]
INFO:root:Count MDP: 6
INFO:root:Ship 4 command: n actual position: Position(17, 29) new position: Position(17, 28)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 8), (4, 1), (4, 2), (4, 3), (4, 4), (5, 0), (5, 2), (5, 3), (5, 5), (5, 6), (6, 2), (6, 7), (7, 1), (7, 2), (7, 7), (8, 2), (8, 6)]
INFO:root:Rewards:
[[1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960, 6700], [1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580, 4600], [1060, 140, -12, 700, 320, 380, 140, 320, 920], [860, -4, 2140, 1200, 2480, 20, -40000, -16, 320], [-120, 1600, 1860, 320, 220, -12, -88, -44, -160], [40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, 1120, -8000], [-120, 280, 360, -84, -76, -4, -108, 820, -8000], [-120, -52, 180, -80, -40, -64, 140, -36, -72]]
INFO:root:Count MDP: 5
INFO:root:Ship 6 command: o actual position: Position(14, 24) new position: Position(14, 24)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 4), (4, 6), (4, 7), (5, 0), (5, 1), (5, 2), (6, 0), (6, 1), (6, 3), (6, 4), (6, 8), (7, 0), (7, 5), (7, 7), (8, 0), (8, 5), (8, 8)]
INFO:root:Rewards:
[[5700, 5400, 10060, 9180, 3360, 3600, 2900, 2800, 1700], [5560, 3600, 5340, 2780, 2520, 2960, 6700, 4560, 1420], [3880, 1460, 1700, 2000, 2140, 1580, 4600, 1660, 2440], [-12, 700, 320, 380, 140, 320, 920, 420, 180], [2140, 1200, 2480, 20, 420, -16, 320, 400, -36], [1860, 320, -40000, -12, -88, -44, -160, -36, -36], [900, 1160, -84, 620, 160, -52, -52, -12, -40000], [980, 0, -160, -156, -148, 1120, -8000, 360, -12], [360, -84, -76, -4, -108, 820, -8000, -36, 560]]
INFO:root:Count MDP: 5
INFO:root:Ship 2 command: o actual position: Position(13, 26) new position: Position(13, 26)
INFO:root:Time: 0.05569720268249512
INFO:root:=============== TURN 018 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (1, 0), (1, 1), (1, 2), (1, 4), (1, 5), (1, 7), (1, 8), (2, 7), (2, 8), (3, 1), (3, 2), (3, 8), (4, 3), (4, 5), (4, 7), (4, 8), (5, 3), (5, 6), (5, 7), (5, 8), (6, 2), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 2), (7, 6), (7, 7), (7, 8), (8, 0), (8, 1), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[320, 380, 140, 320, 920, 420, 180, 920, -12], [2480, 20, -40000, -16, 320, 400, -36, 240, 1520], [-8000, -12, -88, -44, -160, -36, -36, 420, 780], [-84, 620, 160, -52, -52, -12, -8000, -24, 740], [-160, -156, -148, 1120, -24, 360, -12, 20, 400], [-76, -4, -108, 820, -8000, -36, 560, 440, 1500], [-40, -64, 140, -36, -72, 20, 3340, 820, 880], [2440, -40, 440, -88, -96, 0, 920, 5040, 3580], [2820, 1920, -88, -60, -100, 840, 2760, 2500, 8920]]
INFO:root:Count MDP: 6
INFO:root:Ship 8 command: n actual position: Position(16, 28) new position: Position(16, 27)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 7), (1, 8), (2, 0), (2, 2), (2, 3), (2, 5), (2, 6), (2, 7), (2, 8), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 6), (4, 7), (4, 8), (5, 1), (5, 3), (5, 5), (5, 6), (5, 7), (5, 8), (6, 1), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2140, 1580, 4600, 1660, 2440, 1800, 700, 1900, 5900], [140, 320, 920, 420, 180, 920, -12, 860, 4340], [-40000, -16, 320, 400, -36, 240, 1520, 1600, 2080], [-88, -44, -160, -36, -36, 420, 780, 1380, 1760], [160, -52, -52, -12, -4, -24, 740, 2980, 2140], [-148, -40000, -24, 360, -12, 20, 400, 780, 660], [-108, 820, -8000, -36, 560, 440, 1500, 940, 1880], [140, -36, -72, 20, 3340, 820, 880, 2520, 6740], [440, -88, -96, 0, 920, 5040, 3580, 2420, 4620]]
INFO:root:Count MDP: 4
INFO:root:Ship 0 command: s actual position: Position(15, 30) new position: Position(15, 31)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 8), (4, 1), (4, 2), (4, 3), (5, 0), (5, 2), (5, 3), (5, 5), (5, 6), (6, 2), (6, 7), (7, 1), (7, 2), (7, 7), (8, 2), (8, 6)]
INFO:root:Rewards:
[[1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960, 6700], [1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580, 4600], [1060, 140, -12, 700, 320, 380, 140, 320, 920], [860, -4, 2140, 1200, 2480, 20, -40000, -16, 320], [-120, 1600, 1860, 320, -8, -12, -88, -44, -160], [40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, -40000, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -8000], [-120, -52, 180, -80, -40, -64, 140, -36, -72]]
INFO:root:Count MDP: 5
INFO:root:Ship 6 command: w actual position: Position(14, 24) new position: Position(13, 24)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 4), (4, 6), (4, 7), (5, 0), (5, 1), (6, 0), (6, 1), (6, 3), (6, 4), (7, 0), (7, 5), (7, 7), (8, 0), (8, 5), (8, 8)]
INFO:root:Rewards:
[[5700, 5400, 10060, 9180, 3360, 3600, 2900, 2800, 1700], [5560, 3600, 5340, 2780, 2520, 2960, 6700, 4560, 1420], [3880, 1460, 1700, 2000, 2140, 1580, 4600, 1660, 2440], [-12, 700, 320, 380, 140, 320, 920, 420, 180], [2140, 1200, -40000, 20, 100, -16, 320, 400, -36], [1860, 320, -8, -12, -88, -44, -160, -36, -36], [900, 1160, -84, 620, 160, -52, -52, -12, -4], [980, 0, -160, -156, -148, -40000, -24, 360, -12], [360, -84, -76, -4, -108, 820, -8000, -36, 560]]
INFO:root:Count MDP: 5
INFO:root:Ship 2 command: o actual position: Position(13, 26) new position: Position(13, 26)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 4), (0, 5), (0, 7), (0, 8), (1, 7), (1, 8), (2, 1), (2, 2), (2, 8), (3, 3), (3, 5), (3, 7), (3, 8), (4, 3), (4, 6), (4, 7), (4, 8), (5, 2), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 2), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 2), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[-40000, 20, -40000, -16, 320, 400, -36, 240, 1520], [-8, -12, -88, -44, -160, -36, -36, 420, 780], [-84, 620, 160, -52, -52, -12, -4, -8000, 740], [-160, -156, -148, -40000, -24, 360, -12, 20, 400], [-76, -4, -108, 820, -32, -36, 560, 440, 1500], [-40, -64, 140, -36, -72, 20, 3340, 820, 880], [2440, -40, 440, -88, -96, 0, 920, 5040, 3580], [2820, 1920, -88, -60, -100, 840, 2760, 2500, 8920], [460, -12, 660, -20, -44, -44, 460, 2140, 5240]]
INFO:root:Count MDP: 6
INFO:root:Ship 4 command: e actual position: Position(17, 28) new position: Position(18, 28)
INFO:root:Time: 0.05569577217102051
INFO:root:=============== TURN 019 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 6), (4, 7), (5, 0), (5, 1), (6, 0), (6, 1), (6, 3), (6, 4), (7, 0), (7, 5), (7, 7), (8, 0), (8, 5), (8, 8)]
INFO:root:Rewards:
[[5700, 5400, 10060, 9180, 3360, 3600, 2900, 2800, 1700], [5560, 3600, 5340, 2780, 2520, 2960, 6700, 4560, 1420], [3880, 1460, 1700, 2000, 2140, 1580, 4600, 1660, 2440], [-12, 700, 320, 380, 140, 320, 920, 420, 180], [2140, 1200, -40000, 20, -28, -16, 320, 400, -36], [1860, 320, -8, -12, -88, -44, -160, -36, -36], [900, 1160, -84, 620, 160, -52, -52, -12, -4], [980, 0, -160, -156, -148, -40000, -24, 360, -12], [360, -84, -76, -4, -108, 820, -32, -36, 560]]
INFO:root:Count MDP: 5
INFO:root:Ship 2 command: e actual position: Position(13, 26) new position: Position(14, 26)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 6), (1, 7), (1, 8), (2, 1), (2, 2), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 2), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1580, 4600, 1660, 2440, 1800, 700, 1900, 5900, 6160], [320, 920, 420, 180, 920, -12, 860, 4340, 4820], [-16, 320, 400, -36, 240, 1520, 1600, 2080, 2400], [-44, -160, -36, -36, 420, 780, 1380, 1760, 6240], [-52, -52, -12, -4, -24, 740, 2980, 2140, 2740], [-40000, -24, 360, -12, 20, 400, 780, 660, 2580], [820, -32, -36, 560, 440, 1500, 940, 1880, 2400], [-36, -8000, 20, 3340, 820, 880, 2520, 6740, 2700], [-88, -96, 0, 920, 5040, 3580, 2420, 4620, 6060]]
INFO:root:Count MDP: 3
INFO:root:Ship 0 command: s actual position: Position(15, 31) new position: Position(15, 32)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 5), (1, 6), (1, 8), (2, 0), (2, 8), (3, 0), (3, 2), (3, 3), (4, 4), (4, 6), (4, 8), (5, 4), (5, 7), (5, 8), (6, 3), (6, 6), (6, 7), (6, 8), (7, 1), (7, 3), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[700, 320, 380, 140, 320, 920, 420, 180, 920], [1200, -40000, 20, -28, -16, 320, 400, -36, 240], [320, -8, -12, -8000, -44, -160, -36, -36, 420], [1160, -84, 620, 160, -52, -52, -12, -4, -24], [0, -160, -156, -148, 1120, -24, 360, -12, 20], [-84, -76, -4, -108, 820, -32, -36, 560, 440], [-80, -40, -64, 140, -36, -8000, 20, 3340, 820], [-16, 2440, -40, 440, -88, -96, 0, 920, 5040], [420, 2820, 1920, -88, -60, -100, 840, 2760, 2500]]
INFO:root:Count MDP: 5
INFO:root:Ship 8 command: o actual position: Position(16, 27) new position: Position(16, 27)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 2), (4, 3), (4, 4), (4, 5), (4, 8), (5, 1), (5, 2), (5, 3), (6, 0), (6, 2), (6, 3), (6, 5), (6, 6), (7, 2), (7, 7), (8, 1), (8, 2), (8, 7)]
INFO:root:Rewards:
[[2760, 3300, 5700, 5400, 10060, 9180, 3360, 3600, 2900], [1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960, 6700], [1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580, 4600], [1060, 140, -12, 700, 320, 380, 140, 320, 920], [860, -4, 2140, 1200, 2480, 20, -28, -16, 320], [-120, 1600, 1860, 320, -8, -12, -8000, -44, -160], [40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, -40000, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32]]
INFO:root:Count MDP: 5
INFO:root:Ship 6 command: o actual position: Position(13, 24) new position: Position(13, 24)
INFO:root:Terminais: [(0, 7), (0, 8), (1, 1), (1, 2), (1, 8), (2, 3), (2, 5), (2, 7), (2, 8), (3, 3), (3, 6), (3, 7), (3, 8), (4, 2), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 2), (5, 6), (5, 7), (5, 8), (6, 0), (6, 1), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 2), (7, 6), (7, 7), (7, 8), (8, 1), (8, 2), (8, 3), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[-8, -12, -8000, -44, -160, -36, -36, 420, 780], [-84, 620, 160, -52, -52, -12, -4, -24, -40000], [-160, -156, -148, -40000, -24, 360, -12, 20, 400], [-76, -4, -108, 820, -32, -36, 560, 440, 1500], [-40, -64, 140, -36, -72, 20, 3340, 820, 880], [2440, -40, 440, -88, -96, 0, 920, 5040, 3580], [2820, 1920, -88, -60, -100, 840, 2760, 2500, 8920], [460, -12, 660, -20, -44, -44, 460, 2140, 5240], [-36, 800, 2240, 360, -132, -20, 1360, 1840, 3300]]
INFO:root:Count MDP: 6
INFO:root:Ship 4 command: n actual position: Position(18, 28) new position: Position(18, 27)
INFO:root:Time: 0.05862903594970703
INFO:root:=============== TURN 020 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 1), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[4600, 1660, 2440, 1800, 700, 1900, 5900, 6160, 3200], [920, 420, 180, 920, -12, 860, 4340, 4820, 4660], [320, 400, -36, 240, 1520, 1600, 2080, 2400, 4600], [-160, -36, -36, 420, 780, 1380, 1760, 6240, 6380], [-52, -12, -4, -24, 740, 2980, 2140, 2740, 8260], [-24, 360, -12, 20, 400, 780, 660, 2580, 7040], [-32, -36, 560, 440, 1500, 940, 1880, 2400, 3040], [-72, 20, 3340, 820, 880, 2520, 6740, 2700, 2160], [-96, 0, 920, 5040, 3580, 2420, 4620, 6060, 3540]]
INFO:root:Count MDP: 4
INFO:root:Ship 0 command: o actual position: Position(15, 32) new position: Position(15, 32)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 5), (1, 6), (1, 8), (2, 0), (2, 8), (3, 0), (3, 2), (3, 3), (4, 4), (4, 6), (4, 8), (5, 4), (5, 7), (5, 8), (6, 3), (6, 6), (6, 7), (6, 8), (7, 1), (7, 3), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[700, 320, 380, 140, 320, 920, 420, 180, 920], [1200, -40000, 20, -28, -16, 320, 400, -36, 240], [320, -8, -12, -8000, -44, -160, -36, -36, 420], [1160, -84, 620, 160, -52, -52, -12, -4, -24], [0, -160, -156, -148, 640, -24, 360, -12, 20], [-84, -76, -4, -108, 820, -32, -36, 560, 440], [-80, -40, -64, 140, -8000, -72, 20, 3340, 820], [-16, 2440, -40, 440, -88, -96, 0, 920, 5040], [420, 2820, 1920, -88, -60, -100, 840, 2760, 2500]]
INFO:root:Count MDP: 5
INFO:root:Ship 8 command: o actual position: Position(16, 27) new position: Position(16, 27)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 2), (4, 3), (4, 4), (4, 5), (4, 8), (5, 1), (5, 2), (5, 3), (6, 0), (6, 2), (6, 3), (6, 5), (6, 6), (7, 2), (7, 7), (8, 1), (8, 2), (8, 7)]
INFO:root:Rewards:
[[2760, 3300, 5700, 5400, 10060, 9180, 3360, 3600, 2900], [1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960, 6700], [1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580, 4600], [1060, 140, -12, 700, 320, 380, 140, 320, 920], [860, -4, 2140, 1200, 1660, 20, -28, -16, 320], [-120, 1600, 1860, 320, -8, -12, -8000, -44, -160], [40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, -40000, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32]]
INFO:root:Count MDP: 5
INFO:root:Ship 6 command: o actual position: Position(13, 24) new position: Position(13, 24)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 6), (3, 7), (4, 0), (4, 1), (5, 0), (5, 1), (5, 3), (5, 4), (6, 0), (6, 5), (6, 7), (7, 0), (7, 5), (7, 8), (8, 0), (8, 4), (8, 7), (8, 8)]
INFO:root:Rewards:
[[5560, 3600, 5340, 2780, 2520, 2960, 6700, 4560, 1420], [3880, 1460, 1700, 2000, 2140, 1580, 4600, 1660, 2440], [-12, 700, 320, 380, 140, 320, 920, 420, 180], [2140, 1200, -40000, 20, -28, -16, 320, 400, -36], [1860, 320, -8, -12, -88, -44, -160, -36, -36], [900, 1160, -84, 620, 160, -52, -52, -12, -4], [980, 0, -160, -156, -148, -40000, -24, 360, -12], [360, -84, -76, -4, -108, 820, -32, -36, 560], [180, -80, -40, -64, 140, -8000, -72, 20, 3340]]
INFO:root:Count MDP: 5
INFO:root:Ship 2 command: n actual position: Position(14, 26) new position: Position(14, 25)
INFO:root:Terminais: [(0, 0), (0, 8), (1, 0), (1, 2), (1, 3), (2, 4), (2, 6), (2, 8), (3, 4), (3, 7), (3, 8), (4, 3), (4, 6), (4, 7), (4, 8), (5, 1), (5, 3), (5, 7), (5, 8), (6, 0), (6, 1), (6, 2), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 3), (7, 7), (7, 8), (8, 2), (8, 3), (8, 4), (8, 7), (8, 8)]
INFO:root:Rewards:
[[320, -8, -8000, -88, -44, -160, -36, -36, 420], [1160, -84, 620, 160, -52, -52, -12, -4, -24], [0, -160, -156, -148, -40000, -24, 360, -12, 20], [-84, -76, -4, -108, 820, -32, -36, 560, 440], [-80, -40, -64, 140, -36, -72, 20, 3340, 820], [-16, 2440, -40, 440, -88, -96, 0, 920, 5040], [420, 2820, 1920, -88, -60, -100, 840, 2760, 2500], [480, 460, -12, 660, -20, -44, -44, 460, 2140], [-8, -36, 800, 2240, 360, -132, -20, 1360, 1840]]
INFO:root:Count MDP: 5
INFO:root:Ship 4 command: e actual position: Position(18, 27) new position: Position(19, 27)
INFO:root:Time: 0.0527646541595459
INFO:root:=============== TURN 021 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 1), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[4600, 1660, 2440, 1800, 700, 1900, 5900, 6160, 3200], [920, 420, 180, 920, -12, 860, 4340, 4820, 4660], [320, 400, -36, 240, 1520, 1600, 2080, 2400, 4600], [-160, -36, -36, 420, 780, 1380, 1760, 6240, 6380], [-52, -12, -4, -24, 340, 2980, 2140, 2740, 8260], [-24, 360, -12, 20, 400, 780, 660, 2580, 7040], [-32, -36, 560, 440, 1500, 940, 1880, 2400, 3040], [-72, 20, 3340, 820, 880, 2520, 6740, 2700, 2160], [-96, 0, 920, 5040, 3580, 2420, 4620, 6060, 3540]]
INFO:root:Count MDP: 3
INFO:root:Ship 0 command: o actual position: Position(15, 32) new position: Position(15, 32)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 5), (1, 6), (1, 8), (2, 0), (2, 8), (3, 0), (3, 2), (3, 3), (4, 4), (4, 6), (4, 8), (5, 4), (5, 7), (5, 8), (6, 3), (6, 6), (6, 7), (6, 8), (7, 1), (7, 3), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[700, 320, 380, 140, 320, 920, 420, 180, 920], [1200, -40000, 20, -28, -16, 320, 400, -36, 240], [320, -8, -8000, -88, -44, -160, -36, -36, 420], [1160, -84, 620, 160, -52, -52, -12, -4, -24], [0, -160, -156, -148, 280, -24, 360, -12, 20], [-84, -76, -4, -108, 820, -32, -36, 560, 440], [-80, -40, -64, 140, -36, -72, 20, 3340, 820], [-16, 2440, -40, 440, -8000, -96, 0, 920, 5040], [420, 2820, 1920, -88, -60, -100, 840, 2760, 2500]]
INFO:root:Count MDP: 5
INFO:root:Ship 8 command: o actual position: Position(16, 27) new position: Position(16, 27)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 2), (4, 3), (4, 4), (4, 5), (4, 8), (5, 1), (5, 2), (5, 3), (6, 0), (6, 2), (6, 3), (6, 5), (6, 6), (7, 2), (7, 7), (8, 1), (8, 2), (8, 7)]
INFO:root:Rewards:
[[2760, 3300, 5700, 5400, 10060, 9180, 3360, 3600, 2900], [1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960, 6700], [1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580, 4600], [1060, 140, -12, 700, 320, 380, 140, 320, 920], [860, -4, 2140, 1200, 1040, 20, -28, -16, 320], [-120, 1600, 1860, 320, -8, -8000, -88, -44, -160], [40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, -40000, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32]]
INFO:root:Count MDP: 4
INFO:root:Ship 6 command: o actual position: Position(13, 24) new position: Position(13, 24)
INFO:root:Terminais: [(0, 0), (0, 2), (0, 3), (1, 4), (1, 6), (1, 8), (2, 4), (2, 7), (2, 8), (3, 3), (3, 6), (3, 7), (3, 8), (4, 1), (4, 3), (4, 7), (4, 8), (5, 0), (5, 1), (5, 2), (5, 6), (5, 7), (5, 8), (6, 0), (6, 1), (6, 3), (6, 7), (6, 8), (7, 2), (7, 3), (7, 4), (7, 7), (7, 8), (8, 2), (8, 3), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1160, -84, 620, 160, -52, -52, -12, -4, -24], [0, -160, -156, -148, -40000, -24, 360, -12, 20], [-84, -76, -4, -108, 820, -32, -36, 560, 440], [-80, -40, -64, 140, -36, -72, 20, 3340, 820], [-16, 2440, -40, 440, -88, -96, 0, 920, 5040], [420, 2820, 1920, -88, -60, -100, 840, 2760, 2500], [480, 460, -12, 660, -20, -44, -44, 460, 2140], [-8, -36, 800, 2240, 360, -132, -20, 1360, 1840], [-4, -4, 1220, 280, -16, -128, -88, 1280, 300]]
INFO:root:Count MDP: 6
INFO:root:Ship 4 command: e actual position: Position(19, 27) new position: Position(20, 27)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 1), (3, 2), (3, 3), (3, 4), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (5, 1), (5, 2), (5, 4), (5, 5), (6, 1), (6, 6), (6, 8), (7, 0), (7, 1), (7, 6), (8, 1), (8, 5), (8, 8)]
INFO:root:Rewards:
[[1880, 5560, 3600, 5340, 2780, 2520, 2960, 6700, 4560], [3840, 3880, 1460, 1700, 2000, 2140, 1580, 4600, 1660], [140, -12, 700, 320, 380, 140, 320, 920, 420], [-4, 2140, 1200, -40000, 20, -28, -16, 320, 400], [1600, 1860, 320, -8, -12, -88, -44, -160, -36], [-84, 900, 1160, -84, 620, 160, -52, -52, -12], [-32, 980, 0, -160, -156, -148, -40000, -24, 360], [280, 360, -84, -76, -4, -108, 820, -32, -36], [-52, 180, -80, -40, -64, 140, -36, -72, 20]]
INFO:root:Count MDP: 5
INFO:root:Ship 2 command: n actual position: Position(14, 25) new position: Position(14, 24)
INFO:root:Time: 0.0508122444152832
INFO:root:=============== TURN 022 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 1), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[4600, 1660, 2440, 1800, 700, 1900, 5900, 6160, 3200], [920, 420, 180, 920, -12, 860, 4340, 4820, 4660], [320, 400, -36, 240, 1520, 1600, 2080, 2400, 4600], [-160, -36, -36, 420, 780, 1380, 1760, 6240, 6380], [-52, -12, -4, -24, 40, 2980, 2140, 2740, 8260], [-24, 360, -12, 20, 400, 780, 660, 2580, 7040], [-32, -36, 560, 440, 1500, 940, 1880, 2400, 3040], [-72, 20, 3340, 820, 880, 2520, 6740, 2700, 2160], [-96, 0, 920, 5040, 3580, 2420, 4620, 6060, 3540]]
INFO:root:Count MDP: 3
INFO:root:Ship 0 command: o actual position: Position(15, 32) new position: Position(15, 32)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 5), (1, 6), (1, 8), (2, 0), (2, 8), (3, 0), (3, 2), (3, 3), (4, 6), (4, 8), (5, 4), (5, 7), (5, 8), (6, 3), (6, 6), (6, 7), (6, 8), (7, 1), (7, 3), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[700, 320, 380, 140, 320, 920, 420, 180, 920], [1200, -40000, 20, -28, -16, 320, 400, -36, 240], [320, -8000, -12, -88, -44, -160, -36, -36, 420], [1160, -84, 620, 160, -52, -52, -12, -4, -24], [0, -160, -156, -148, 0, -24, 360, -12, 20], [-84, -76, -4, -108, 820, -32, -36, 560, 440], [-80, -40, -64, 140, -36, -72, 20, 3340, 820], [-16, 2440, -40, 440, -88, -96, 0, 920, 5040], [420, 2820, 1920, -88, -8000, -100, 840, 2760, 2500]]
INFO:root:Count MDP: 6
INFO:root:Ship 8 command: n actual position: Position(16, 27) new position: Position(16, 26)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 2), (4, 3), (4, 4), (4, 5), (4, 8), (5, 1), (5, 2), (5, 3), (6, 0), (6, 2), (6, 3), (6, 5), (6, 6), (7, 2), (8, 1), (8, 2), (8, 7)]
INFO:root:Rewards:
[[2760, 3300, 5700, 5400, 10060, 9180, 3360, 3600, 2900], [1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960, 6700], [1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580, 4600], [1060, 140, -12, 700, 320, 380, 140, 320, 920], [860, -4, 2140, 1200, 580, 20, -28, -16, 320], [-120, 1600, 1860, 320, -8000, -12, -88, -44, -160], [40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -8000, 0, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32]]
INFO:root:Count MDP: 5
INFO:root:Ship 6 command: o actual position: Position(13, 24) new position: Position(13, 24)
INFO:root:Terminais: [(0, 6), (0, 8), (1, 4), (1, 7), (1, 8), (2, 3), (2, 6), (2, 7), (2, 8), (3, 1), (3, 3), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 3), (5, 7), (5, 8), (6, 2), (6, 3), (6, 4), (6, 7), (6, 8), (7, 2), (7, 3), (7, 7), (7, 8), (8, 3), (8, 4), (8, 7)]
INFO:root:Rewards:
[[0, -160, -156, -8000, 0, -24, 360, -12, 20], [-84, -76, -4, -108, 820, -32, -36, 560, 440], [-80, -40, -64, 140, -36, -72, 20, 3340, 820], [-16, 2440, -40, 440, -88, -96, 0, 920, 5040], [420, 2820, 1920, -88, -60, -100, 840, 2760, 2500], [480, 460, -12, 660, -20, -44, -44, 460, 2140], [-8, -36, 800, 2240, 360, -132, -20, 1360, 1840], [-4, -4, 1220, 280, -16, -128, -88, 1280, 300], [-36, -160, -60, 1760, 280, -156, -120, 1220, -68]]
INFO:root:Count MDP: 7
INFO:root:Ship 4 command: n actual position: Position(20, 27) new position: Position(20, 26)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 2), (3, 3), (3, 4), (3, 5), (3, 8), (4, 1), (4, 2), (4, 3), (5, 0), (5, 2), (5, 3), (5, 5), (5, 6), (6, 2), (7, 1), (7, 2), (7, 7), (8, 2), (8, 6)]
INFO:root:Rewards:
[[1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960, 6700], [1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580, 4600], [1060, 140, -12, 700, 320, 380, 140, 320, 920], [860, -4, 2140, 1200, -40000, 20, -28, -16, 320], [-120, 1600, 1860, 320, -8, -12, -88, -44, -160], [40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -8000, 0, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72]]
INFO:root:Count MDP: 4
INFO:root:Ship 2 command: e actual position: Position(14, 24) new position: Position(15, 24)
INFO:root:Time: 0.056664466857910156
INFO:root:=============== TURN 023 ================
INFO:root:Terminais: [(0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 6), (1, 7), (2, 0), (2, 1), (3, 0), (3, 1), (3, 3), (3, 4), (4, 0), (4, 7), (5, 0), (5, 5), (5, 8), (6, 0), (6, 4), (6, 7), (6, 8), (7, 0), (7, 2), (7, 4), (7, 8), (8, 1), (8, 2), (8, 3), (8, 7), (8, 8)]
INFO:root:Rewards:
[[-12, 700, 320, 380, 140, 320, 920, 420, 180], [2140, 1200, -40000, 20, -28, -16, 320, 400, -36], [1860, 320, -8, -12, -88, -44, -160, -36, -36], [900, 1160, -8000, 620, 160, -52, -52, -12, -4], [980, 0, -160, -156, -148, 0, -24, 360, -12], [360, -84, -76, -4, -108, 820, -32, -36, 560], [180, -80, -40, -64, 140, -36, -72, 20, 3340], [60, -16, 2440, -40, 440, -88, -96, 0, 920], [-4, 420, 2820, 1920, -8000, -60, -100, 840, 2760]]
INFO:root:Count MDP: 6
INFO:root:Ship 8 command: e actual position: Position(16, 26) new position: Position(17, 26)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 5), (4, 6), (4, 7), (4, 8), (5, 1), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[4600, 1660, 2440, 1800, 700, 1900, 5900, 6160, 3200], [920, 420, 180, 920, -12, 860, 4340, 4820, 4660], [320, 400, -36, 240, 1520, 1600, 2080, 2400, 4600], [-160, -36, -36, 420, 780, 1380, 1760, 6240, 6380], [-52, -12, -4, -24, -36, 2980, 2140, 2740, 8260], [-24, 360, -12, 20, 400, 780, 660, 2580, 7040], [-32, -36, 560, 440, 1500, 940, 1880, 2400, 3040], [-72, 20, 3340, 820, 880, 2520, 6740, 2700, 2160], [-96, 0, 920, 5040, 3580, 2420, 4620, 6060, 3540]]
INFO:root:Count MDP: 7
INFO:root:Ship 0 command: s actual position: Position(15, 32) new position: Position(15, 33)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 2), (4, 3), (4, 4), (4, 5), (4, 8), (5, 1), (5, 2), (5, 3), (6, 0), (6, 2), (6, 3), (6, 5), (6, 6), (7, 2), (8, 1), (8, 2), (8, 7)]
INFO:root:Rewards:
[[2760, 3300, 5700, 5400, 10060, 9180, 3360, 3600, 2900], [1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960, 6700], [1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580, 4600], [1060, 140, -12, 700, 320, 380, 140, 320, 920], [860, -4, 2140, 1200, 220, 20, -28, -16, 320], [-120, 1600, 1860, 320, -8, -12, -88, -44, -160], [40, -84, 900, 1160, -8000, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, 0, -24], [-120, 280, 360, -84, -76, -4, -8000, 820, -32]]
INFO:root:Count MDP: 3
INFO:root:Ship 6 command: o actual position: Position(13, 24) new position: Position(13, 24)
INFO:root:Terminais: [(0, 0), (0, 7), (1, 0), (1, 5), (1, 8), (2, 0), (2, 4), (2, 7), (2, 8), (3, 0), (3, 2), (3, 4), (3, 8), (4, 1), (4, 2), (4, 3), (4, 7), (4, 8), (5, 0), (5, 1), (5, 2), (5, 4), (5, 8), (6, 0), (6, 3), (6, 4), (6, 5), (6, 8), (7, 0), (7, 3), (7, 4), (7, 8), (8, 0), (8, 4), (8, 5), (8, 8)]
INFO:root:Rewards:
[[980, 0, -160, -156, -148, 0, -24, 360, -12], [360, -84, -76, -4, -8000, 820, -32, -36, 560], [180, -80, -40, -64, 140, -36, -72, 20, 3340], [60, -16, 2440, -40, 440, -88, -96, 0, 920], [-4, 420, 2820, 1920, -88, -60, -100, 840, 2760], [580, 480, 460, -12, 660, -20, -44, -44, 460], [660, -8, -36, 800, 2240, 360, -132, -20, 1360], [3840, -4, -4, 1220, 280, -16, -128, -88, 1280], [5140, -36, -160, -60, 1760, 280, -156, -120, 1220]]
INFO:root:Count MDP: 4
INFO:root:Ship 4 command: n actual position: Position(20, 26) new position: Position(20, 25)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 2), (2, 3), (2, 4), (2, 5), (2, 8), (3, 1), (3, 2), (3, 3), (4, 0), (4, 2), (4, 3), (4, 5), (4, 6), (5, 2), (6, 1), (6, 2), (6, 7), (7, 2), (7, 6), (8, 0), (8, 2), (8, 4), (8, 6)]
INFO:root:Rewards:
[[1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580, 4600], [1060, 140, -12, 700, 320, 380, 140, 320, 920], [860, -4, 2140, 1200, -40000, 20, -28, -16, 320], [-120, 1600, 1860, 320, -8, -12, -88, -44, -160], [40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, 0, -24], [-120, 280, 360, -84, -76, -4, -8000, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72], [2180, -36, 60, -16, 2440, -40, 440, -88, -96]]
INFO:root:Count MDP: 6
INFO:root:Ship 2 command: e actual position: Position(15, 24) new position: Position(16, 24)
INFO:root:Time: 0.05667400360107422
INFO:root:=============== TURN 024 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 2), (4, 3), (4, 5), (4, 8), (5, 1), (5, 2), (5, 3), (6, 0), (6, 2), (6, 3), (6, 5), (6, 6), (7, 2), (8, 1), (8, 2), (8, 7)]
INFO:root:Rewards:
[[2760, 3300, 5700, 5400, 10060, 9180, 3360, 3600, 2900], [1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960, 6700], [1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580, 4600], [1060, 140, -12, 700, 320, 380, 140, 320, 920], [860, -4, 2140, 1200, -8, 20, -28, -16, 320], [-120, 1600, 1860, 320, -8, -12, -88, -44, -160], [40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -8000, -156, -148, 0, -24], [-120, 280, 360, -84, -76, -4, -8000, 820, -32]]
INFO:root:Count MDP: 4
INFO:root:Ship 6 command: n actual position: Position(13, 24) new position: Position(13, 23)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 2), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 1), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1660, 2440, 1800, 700, 1900, 5900, 6160, 3200, 3860], [420, 180, 920, -12, 860, 4340, 4820, 4660, 3980], [400, -36, 240, 1520, 1600, 2080, 2400, 4600, 3160], [-36, -36, 420, 780, 1380, 1760, 6240, 6380, 3220], [-12, -4, -24, -36, 2980, 2140, 2740, 8260, 4200], [360, -12, 20, 400, 780, 660, 2580, 7040, 4220], [-36, 560, 440, 1500, 940, 1880, 2400, 3040, 4160], [20, 3340, 820, 880, 2520, 6740, 2700, 2160, 7280], [0, 920, 5040, 3580, 2420, 4620, 6060, 3540, 8900]]
INFO:root:Count MDP: 3
INFO:root:Ship 0 command: o actual position: Position(15, 33) new position: Position(15, 33)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 3), (0, 6), (0, 7), (1, 0), (1, 1), (2, 0), (2, 1), (2, 3), (2, 4), (3, 0), (3, 7), (4, 0), (4, 5), (4, 8), (5, 0), (5, 4), (5, 7), (5, 8), (6, 0), (6, 2), (6, 4), (6, 8), (7, 1), (7, 2), (7, 3), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 4), (8, 8)]
INFO:root:Rewards:
[[2140, -40000, -8, 20, -28, -16, 320, 400, -36], [1860, 320, -8, -12, -88, -44, -160, -36, -36], [900, 1160, -84, 620, 160, -52, -52, -12, -4], [980, 0, -8000, -156, -148, 0, -24, 360, -12], [360, -84, -76, -4, -108, 820, -32, -36, 560], [180, -80, -40, -64, 140, -36, -72, 20, 3340], [60, -16, 2440, -40, 440, -88, -96, 0, 920], [-4, 420, 2820, -40000, -88, -60, -100, 840, 2760], [580, 480, 460, -12, 660, -20, -44, -44, 460]]
INFO:root:Count MDP: 8
INFO:root:Ship 8 command: n actual position: Position(17, 26) new position: Position(17, 25)
INFO:root:Terminais: [(0, 1), (0, 8), (1, 0), (1, 1), (1, 6), (2, 1), (2, 5), (2, 8), (3, 1), (3, 3), (3, 5), (4, 0), (4, 2), (4, 3), (4, 4), (4, 8), (5, 0), (5, 1), (5, 2), (5, 3), (5, 5), (6, 0), (6, 1), (6, 4), (6, 5), (6, 6), (7, 0), (7, 1), (7, 4), (7, 5), (8, 0), (8, 1), (8, 5), (8, 6)]
INFO:root:Rewards:
[[-32, 980, 0, -8000, -156, -148, 0, -24, 360], [280, 360, -84, -76, -8000, -108, 820, -32, -36], [-52, 180, -80, -40, -64, 140, -36, -72, 20], [-36, 60, -16, 2440, -40, 440, -88, -96, 0], [400, -4, 420, 2820, 1920, -88, -60, -100, 840], [2000, 580, 480, 460, -12, 660, -20, -44, -44], [1480, 660, -8, -36, 800, 2240, 360, -132, -20], [3220, 3840, -4, -4, 1220, 280, -16, -128, -88], [1880, 5140, -36, -160, -60, 1760, 280, -156, -120]]
INFO:root:Count MDP: 5
INFO:root:Ship 4 command: o actual position: Position(20, 25) new position: Position(20, 25)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 2), (1, 3), (1, 5), (1, 8), (2, 1), (2, 2), (2, 3), (3, 0), (3, 2), (3, 3), (3, 5), (3, 6), (4, 2), (5, 1), (5, 2), (5, 7), (6, 2), (6, 6), (7, 0), (7, 2), (7, 4), (7, 6), (8, 0), (8, 1), (8, 3), (8, 4), (8, 5)]
INFO:root:Rewards:
[[1060, 140, -12, 700, 320, 380, 140, 320, 920], [860, -4, 2140, -40000, -8, 20, -28, -16, 320], [-120, 1600, 1860, 320, -8, -12, -88, -44, -160], [40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, 0, -24], [-120, 280, 360, -84, -76, -8000, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72], [2180, -36, 60, -16, 2440, -40, 440, -88, -96], [1660, 400, -4, 420, 2820, -40000, -88, -60, -100]]
INFO:root:Count MDP: 6
INFO:root:Ship 2 command: e actual position: Position(16, 24) new position: Position(17, 24)
INFO:root:Time: 0.06162452697753906
INFO:root:=============== TURN 025 ================
INFO:root:Terminais: [(0, 1), (0, 2), (0, 4), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (2, 1), (2, 2), (2, 4), (2, 5), (3, 1), (3, 8), (4, 0), (4, 1), (4, 6), (5, 1), (5, 5), (5, 8), (6, 1), (6, 3), (6, 5), (7, 0), (7, 2), (7, 3), (7, 4), (7, 8), (8, 0), (8, 1), (8, 2), (8, 3), (8, 5)]
INFO:root:Rewards:
[[-4, 2140, -40000, -8, 20, -28, -16, 320, 400], [1600, 1860, 320, -8, -12, -88, -44, -160, -36], [-84, 900, 1160, -84, 620, 160, -52, -52, -12], [-32, 980, 0, -160, -156, -148, 0, -24, 360], [280, 360, -84, -8000, -4, -108, 820, -32, -36], [-52, 180, -80, -40, -64, 140, -36, -72, 20], [-36, 60, -16, 2440, -40, 440, -88, -96, 0], [400, -4, 420, 2820, -40000, -88, -60, -100, 840], [2000, 580, 480, 460, -12, 660, -20, -44, -44]]
INFO:root:Count MDP: 7
INFO:root:Ship 8 command: e actual position: Position(17, 25) new position: Position(18, 25)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 2), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 1), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1660, 2440, 1800, 700, 1900, 5900, 6160, 3200, 3860], [420, 180, 920, -12, 860, 4340, 4820, 4660, 3980], [400, -36, 240, 1520, 1600, 2080, 2400, 4600, 3160], [-36, -36, 420, 780, 1380, 1760, 6240, 6380, 3220], [-12, -4, -24, -36, 2020, 2140, 2740, 8260, 4200], [360, -12, 20, 400, 780, 660, 2580, 7040, 4220], [-36, 560, 440, 1500, 940, 1880, 2400, 3040, 4160], [20, 3340, 820, 880, 2520, 6740, 2700, 2160, 7280], [0, 920, 5040, 3580, 2420, 4620, 6060, 3540, 8900]]
INFO:root:Count MDP: 3
INFO:root:Ship 0 command: o actual position: Position(15, 33) new position: Position(15, 33)
INFO:root:Terminais: [(0, 1), (0, 8), (1, 0), (1, 1), (1, 6), (2, 1), (2, 5), (2, 8), (3, 1), (3, 3), (3, 5), (4, 0), (4, 2), (4, 3), (4, 4), (4, 8), (5, 0), (5, 1), (5, 2), (5, 3), (5, 5), (6, 0), (6, 1), (6, 4), (6, 5), (6, 6), (7, 0), (7, 1), (7, 4), (7, 5), (8, 0), (8, 1), (8, 5), (8, 6)]
INFO:root:Rewards:
[[-32, 980, 0, -160, -156, -148, 0, -24, 360], [280, 360, -84, -8000, -4, -108, 820, -32, -36], [-52, 180, -80, -40, -8000, 140, -36, -72, 20], [-36, 60, -16, 2440, -40, 440, -88, -96, 0], [400, -4, 420, 2820, 1240, -88, -60, -100, 840], [2000, 580, 480, 460, -12, 660, -20, -44, -44], [1480, 660, -8, -36, 800, 2240, 360, -132, -20], [3220, 3840, -4, -4, 1220, 280, -16, -128, -88], [1880, 5140, -36, -160, -60, 1760, 280, -156, -120]]
INFO:root:Count MDP: 5
INFO:root:Ship 4 command: o actual position: Position(20, 25) new position: Position(20, 25)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 1), (4, 3), (4, 4), (4, 6), (5, 2), (5, 3), (5, 4), (6, 1), (6, 3), (6, 4), (6, 6), (6, 7), (7, 3), (8, 2), (8, 3), (8, 8)]
INFO:root:Rewards:
[[1660, 2760, 3300, 5700, 5400, 10060, 9180, 3360, 3600], [2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960], [540, 1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580], [60, 1060, 140, -12, 700, 320, 380, 140, 320], [-12, 860, -4, 2140, 1200, -8, 20, -28, -16], [-108, -120, 1600, 1860, 320, -8, -12, -88, -44], [-120, 40, -84, 900, 1160, -84, 620, 160, -52], [-156, -160, -32, 980, 0, -160, -156, -148, 0], [-80, -120, 280, 360, -84, -8000, -4, -108, 820]]
INFO:root:Count MDP: 4
INFO:root:Ship 6 command: o actual position: Position(13, 23) new position: Position(13, 23)
INFO:root:Terminais: [(0, 0), (0, 2), (0, 3), (0, 5), (0, 8), (1, 1), (1, 2), (1, 3), (2, 0), (2, 2), (2, 3), (2, 5), (2, 6), (3, 2), (4, 1), (4, 2), (4, 7), (5, 2), (5, 6), (6, 0), (6, 2), (6, 4), (6, 6), (7, 0), (7, 1), (7, 3), (7, 4), (7, 5), (8, 0), (8, 1), (8, 2), (8, 3), (8, 4), (8, 6)]
INFO:root:Rewards:
[[860, -4, 2140, -40000, -8, 20, -28, -16, 320], [-120, 1600, 1860, 320, -8, -12, -88, -44, -160], [40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, 0, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -8000, 140, -36, -72], [2180, -36, 60, -16, 2440, -40, 440, -88, -96], [1660, 400, -4, 420, 2820, -40000, -88, -60, -100], [800, 2000, 580, 480, 460, -12, 660, -20, -44]]
INFO:root:Count MDP: 7
INFO:root:Ship 2 command: e actual position: Position(17, 24) new position: Position(18, 24)
INFO:root:Time: 0.06058049201965332
INFO:root:=============== TURN 026 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (1, 1), (1, 2), (1, 4), (1, 5), (2, 1), (2, 8), (3, 0), (3, 1), (3, 6), (4, 1), (4, 5), (4, 8), (5, 1), (5, 3), (5, 5), (6, 0), (6, 2), (6, 3), (6, 4), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 5), (8, 0), (8, 1), (8, 4), (8, 5), (8, 6)]
INFO:root:Rewards:
[[1600, 1860, 320, -8, -12, -88, -44, -160, -36], [-84, 900, 1160, -84, 620, 160, -52, -52, -12], [-32, 980, 0, -160, -156, -148, 0, -24, 360], [280, 360, -84, -76, -4, -108, 820, -32, -36], [-52, 180, -80, -8000, -64, 140, -36, -72, 20], [-36, 60, -16, 2440, -40, 440, -88, -96, 0], [400, -4, 420, 2820, -40000, -88, -60, -100, 840], [2000, 580, 480, 460, -12, 660, -20, -44, -44], [1480, 660, -8, -36, 800, 2240, 360, -132, -20]]
INFO:root:Count MDP: 6
INFO:root:Ship 8 command: e actual position: Position(18, 25) new position: Position(19, 25)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 2), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 1), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1660, 2440, 1800, 700, 1900, 5900, 6160, 3200, 3860], [420, 180, 920, -12, 860, 4340, 4820, 4660, 3980], [400, -36, 240, 1520, 1600, 2080, 2400, 4600, 3160], [-36, -36, 420, 780, 1380, 1760, 6240, 6380, 3220], [-12, -4, -24, -36, 1300, 2140, 2740, 8260, 4200], [360, -12, 20, 400, 780, 660, 2580, 7040, 4220], [-36, 560, 440, 1500, 940, 1880, 2400, 3040, 4160], [20, 3340, 820, 880, 2520, 6740, 2700, 2160, 7280], [0, 920, 5040, 3580, 2420, 4620, 6060, 3540, 8900]]
INFO:root:Count MDP: 4
INFO:root:Ship 0 command: o actual position: Position(15, 33) new position: Position(15, 33)
INFO:root:Terminais: [(0, 1), (0, 8), (1, 0), (1, 1), (1, 6), (2, 1), (2, 5), (2, 8), (3, 1), (3, 3), (3, 5), (4, 0), (4, 2), (4, 3), (4, 4), (4, 8), (5, 0), (5, 1), (5, 2), (5, 3), (5, 5), (6, 0), (6, 1), (6, 4), (6, 5), (6, 6), (7, 0), (7, 1), (7, 4), (7, 5), (8, 0), (8, 1), (8, 5), (8, 6)]
INFO:root:Rewards:
[[-32, 980, 0, -160, -156, -148, 0, -24, 360], [280, 360, -84, -76, -4, -108, 820, -32, -36], [-52, 180, -80, -8000, -64, 140, -36, -72, 20], [-36, 60, -16, 2440, -8000, 440, -88, -96, 0], [400, -4, 420, 2820, 720, -88, -60, -100, 840], [2000, 580, 480, 460, -12, 660, -20, -44, -44], [1480, 660, -8, -36, 800, 2240, 360, -132, -20], [3220, 3840, -4, -4, 1220, 280, -16, -128, -88], [1880, 5140, -36, -160, -60, 1760, 280, -156, -120]]
INFO:root:Count MDP: 6
INFO:root:Ship 4 command: o actual position: Position(20, 25) new position: Position(20, 25)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 1), (4, 3), (4, 4), (4, 6), (5, 2), (5, 3), (5, 4), (6, 1), (6, 3), (6, 4), (6, 6), (6, 7), (7, 3), (8, 2), (8, 3), (8, 8)]
INFO:root:Rewards:
[[1660, 2760, 3300, 5700, 5400, 10060, 9180, 3360, 3600], [2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960], [540, 1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580], [60, 1060, 140, -12, 700, 320, 380, 140, 320], [-12, 860, -4, 2140, 700, -8, 20, -28, -16], [-108, -120, 1600, 1860, 320, -8, -12, -88, -44], [-120, 40, -84, 900, 1160, -84, 620, 160, -52], [-156, -160, -32, 980, 0, -160, -156, -148, 0], [-80, -120, 280, 360, -84, -76, -4, -108, 820]]
INFO:root:Count MDP: 3
INFO:root:Ship 6 command: o actual position: Position(13, 23) new position: Position(13, 23)
INFO:root:Terminais: [(0, 1), (0, 2), (0, 3), (1, 0), (1, 2), (1, 3), (1, 5), (1, 6), (2, 2), (3, 1), (3, 2), (3, 7), (4, 2), (4, 6), (5, 0), (5, 2), (5, 4), (5, 6), (6, 0), (6, 1), (6, 3), (6, 4), (6, 5), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 6), (8, 0), (8, 1), (8, 2), (8, 5), (8, 6), (8, 7)]
INFO:root:Rewards:
[[-120, 1600, 1860, 320, -8, -12, -88, -44, -160], [40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, 0, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72], [2180, -36, 60, -16, 2440, -8000, 440, -88, -96], [1660, 400, -4, 420, 2820, -40000, -88, -60, -100], [800, 2000, 580, 480, 460, -12, 660, -20, -44], [1100, 1480, 660, -8, -36, 800, 2240, 360, -132]]
INFO:root:Count MDP: 6
INFO:root:Ship 2 command: e actual position: Position(18, 24) new position: Position(19, 24)
INFO:root:Time: 0.05765199661254883
INFO:root:=============== TURN 027 ================
INFO:root:Terminais: [(0, 1), (0, 2), (0, 4), (0, 5), (1, 1), (1, 8), (2, 0), (2, 1), (2, 6), (3, 1), (3, 5), (3, 8), (4, 1), (4, 3), (4, 5), (5, 0), (5, 2), (5, 3), (5, 4), (5, 8), (6, 0), (6, 1), (6, 2), (6, 3), (6, 5), (7, 0), (7, 1), (7, 4), (7, 5), (7, 6), (8, 0), (8, 1), (8, 4), (8, 5)]
INFO:root:Rewards:
[[-84, 900, 1160, -84, 620, 160, -52, -52, -12], [-32, 980, 0, -160, -156, -148, 0, -24, 360], [280, 360, -84, -76, -4, -108, 820, -32, -36], [-52, 180, -80, -40, -64, 140, -36, -72, 20], [-36, 60, -16, -40000, -40, 440, -88, -96, 0], [400, -4, 420, 2820, -40000, -88, -60, -100, 840], [2000, 580, 480, 460, -12, 660, -20, -44, -44], [1480, 660, -8, -36, 800, 2240, 360, -132, -20], [3220, 3840, -4, -4, 1220, 280, -16, -128, -88]]
INFO:root:Count MDP: 4
INFO:root:Ship 8 command: w actual position: Position(19, 25) new position: Position(18, 25)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 2), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 1), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1660, 2440, 1800, 700, 1900, 5900, 6160, 3200, 3860], [420, 180, 920, -12, 860, 4340, 4820, 4660, 3980], [400, -36, 240, 1520, 1600, 2080, 2400, 4600, 3160], [-36, -36, 420, 780, 1380, 1760, 6240, 6380, 3220], [-12, -4, -24, -36, 760, 2140, 2740, 8260, 4200], [360, -12, 20, 400, 780, 660, 2580, 7040, 4220], [-36, 560, 440, 1500, 940, 1880, 2400, 3040, 4160], [20, 3340, 820, 880, 2520, 6740, 2700, 2160, 7280], [0, 920, 5040, 3580, 2420, 4620, 6060, 3540, 8900]]
INFO:root:Count MDP: 3
INFO:root:Ship 0 command: o actual position: Position(15, 33) new position: Position(15, 33)
INFO:root:Terminais: [(0, 1), (0, 8), (1, 0), (1, 1), (1, 6), (2, 1), (2, 5), (2, 8), (3, 1), (3, 3), (3, 5), (4, 0), (4, 2), (4, 3), (4, 4), (4, 8), (5, 0), (5, 1), (5, 2), (5, 3), (5, 5), (6, 0), (6, 1), (6, 4), (6, 5), (6, 6), (7, 0), (7, 1), (7, 4), (7, 5), (8, 0), (8, 1), (8, 5), (8, 6)]
INFO:root:Rewards:
[[-32, 980, 0, -160, -156, -148, 0, -24, 360], [280, 360, -84, -76, -4, -108, 820, -32, -36], [-52, 180, -80, -40, -8000, 140, -36, -72, 20], [-36, 60, -16, -40000, -40, 440, -88, -96, 0], [400, -4, 420, 2820, 340, -88, -60, -100, 840], [2000, 580, 480, 460, -12, 660, -20, -44, -44], [1480, 660, -8, -36, 800, 2240, 360, -132, -20], [3220, 3840, -4, -4, 1220, 280, -16, -128, -88], [1880, 5140, -36, -160, -60, 1760, 280, -156, -120]]
INFO:root:Count MDP: 4
INFO:root:Ship 4 command: o actual position: Position(20, 25) new position: Position(20, 25)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 1), (4, 3), (4, 4), (4, 6), (5, 2), (5, 3), (5, 4), (6, 1), (6, 3), (6, 4), (6, 6), (6, 7), (7, 3), (8, 2), (8, 3), (8, 8)]
INFO:root:Rewards:
[[1660, 2760, 3300, 5700, 5400, 10060, 9180, 3360, 3600], [2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960], [540, 1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580], [60, 1060, 140, -12, 700, 320, 380, 140, 320], [-12, 860, -4, 2140, 320, -8, 20, -28, -16], [-108, -120, 1600, 1860, 320, -8, -12, -88, -44], [-120, 40, -84, 900, 1160, -84, 620, 160, -52], [-156, -160, -32, 980, 0, -160, -156, -148, 0], [-80, -120, 280, 360, -84, -76, -4, -108, 820]]
INFO:root:Count MDP: 4
INFO:root:Ship 6 command: o actual position: Position(13, 23) new position: Position(13, 23)
INFO:root:Terminais: [(0, 0), (0, 2), (0, 3), (0, 5), (0, 6), (1, 2), (2, 1), (2, 2), (2, 7), (3, 2), (3, 6), (4, 0), (4, 2), (4, 4), (4, 6), (5, 0), (5, 1), (5, 3), (5, 4), (5, 5), (6, 0), (6, 1), (6, 2), (6, 3), (6, 4), (6, 6), (7, 0), (7, 1), (7, 2), (7, 5), (7, 6), (7, 7), (8, 0), (8, 1), (8, 2), (8, 5), (8, 6)]
INFO:root:Rewards:
[[40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, 0, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -8000, 140, -36, -72], [2180, -36, 60, -16, 2440, -40, 440, -88, -96], [1660, 400, -4, 420, 2820, -40000, -88, -60, -100], [800, 2000, 580, 480, 460, -12, 660, -20, -44], [1100, 1480, 660, -8, -36, 800, 2240, 360, -132], [2400, 3220, 3840, -4, -4, 1220, 280, -16, -128]]
INFO:root:Count MDP: 6
INFO:root:Ship 2 command: o actual position: Position(19, 24) new position: Position(19, 24)
INFO:root:Time: 0.050810813903808594
INFO:root:=============== TURN 028 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (1, 1), (1, 2), (1, 4), (1, 5), (2, 1), (2, 8), (3, 0), (3, 1), (3, 6), (4, 1), (4, 5), (4, 8), (5, 1), (5, 3), (5, 5), (6, 0), (6, 2), (6, 3), (6, 4), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 5), (8, 0), (8, 1), (8, 4), (8, 5), (8, 6)]
INFO:root:Rewards:
[[1600, 1860, 320, -8, -12, -88, -44, -160, -36], [-84, 900, 1160, -84, 620, 160, -52, -52, -12], [-32, 980, 0, -160, -156, -148, 0, -24, 360], [280, 360, -84, -76, -4, -108, 820, -32, -36], [-52, 180, -80, -40, -64, 140, -36, -72, 20], [-36, 60, -16, -40000, -40, 440, -88, -96, 0], [400, -4, 420, 2820, -40000, -88, -60, -100, 840], [2000, 580, 480, 460, -12, 660, -20, -44, -44], [1480, 660, -8, -36, 800, 2240, 360, -132, -20]]
INFO:root:Count MDP: 5
INFO:root:Ship 8 command: w actual position: Position(18, 25) new position: Position(17, 25)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 2), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 1), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1660, 2440, 1800, 700, 1900, 5900, 6160, 3200, 3860], [420, 180, 920, -12, 860, 4340, 4820, 4660, 3980], [400, -36, 240, 1520, 1600, 2080, 2400, 4600, 3160], [-36, -36, 420, 780, 1380, 1760, 6240, 6380, 3220], [-12, -4, -24, -36, 360, 2140, 2740, 8260, 4200], [360, -12, 20, 400, 780, 660, 2580, 7040, 4220], [-36, 560, 440, 1500, 940, 1880, 2400, 3040, 4160], [20, 3340, 820, 880, 2520, 6740, 2700, 2160, 7280], [0, 920, 5040, 3580, 2420, 4620, 6060, 3540, 8900]]
INFO:root:Count MDP: 4
INFO:root:Ship 0 command: o actual position: Position(15, 33) new position: Position(15, 33)
INFO:root:Terminais: [(0, 1), (0, 8), (1, 0), (1, 1), (1, 6), (2, 1), (2, 5), (2, 8), (3, 1), (3, 3), (3, 5), (4, 0), (4, 2), (4, 3), (4, 4), (4, 8), (5, 0), (5, 1), (5, 2), (5, 3), (5, 5), (6, 0), (6, 1), (6, 4), (6, 5), (6, 6), (7, 0), (7, 1), (7, 4), (7, 5), (8, 0), (8, 1), (8, 5), (8, 6)]
INFO:root:Rewards:
[[-32, 980, 0, -160, -156, -148, 0, -24, 360], [280, 360, -84, -76, -8000, -108, 820, -32, -36], [-52, 180, -80, -40, -64, 140, -36, -72, 20], [-36, 60, -16, -40000, -40, 440, -88, -96, 0], [400, -4, 420, 2820, 40, -88, -60, -100, 840], [2000, 580, 480, 460, -12, 660, -20, -44, -44], [1480, 660, -8, -36, 800, 2240, 360, -132, -20], [3220, 3840, -4, -4, 1220, 280, -16, -128, -88], [1880, 5140, -36, -160, -60, 1760, 280, -156, -120]]
INFO:root:Count MDP: 4
INFO:root:Ship 4 command: o actual position: Position(20, 25) new position: Position(20, 25)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 1), (4, 3), (4, 4), (4, 6), (5, 2), (5, 3), (5, 4), (6, 1), (6, 3), (6, 4), (6, 6), (6, 7), (7, 3), (8, 2), (8, 3), (8, 8)]
INFO:root:Rewards:
[[1660, 2760, 3300, 5700, 5400, 10060, 9180, 3360, 3600], [2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960], [540, 1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580], [60, 1060, 140, -12, 700, 320, 380, 140, 320], [-12, 860, -4, 2140, 40, -8, 20, -28, -16], [-108, -120, 1600, 1860, 320, -8, -12, -88, -44], [-120, 40, -84, 900, 1160, -84, 620, 160, -52], [-156, -160, -32, 980, 0, -160, -156, -148, 0], [-80, -120, 280, 360, -84, -76, -8000, -108, 820]]
INFO:root:Count MDP: 4
INFO:root:Ship 6 command: o actual position: Position(13, 23) new position: Position(13, 23)
INFO:root:Terminais: [(0, 0), (0, 2), (0, 3), (0, 5), (0, 6), (1, 2), (2, 1), (2, 2), (2, 7), (3, 2), (3, 6), (4, 0), (4, 2), (4, 4), (4, 6), (5, 0), (5, 1), (5, 3), (5, 4), (5, 5), (6, 0), (6, 1), (6, 2), (6, 3), (6, 4), (6, 6), (7, 0), (7, 1), (7, 2), (7, 5), (7, 6), (7, 7), (8, 0), (8, 1), (8, 2), (8, 5), (8, 6)]
INFO:root:Rewards:
[[40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, 0, -24], [-120, 280, 360, -84, -76, -8000, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72], [2180, -36, 60, -16, 1620, -40, 440, -88, -96], [1660, 400, -4, 420, 2820, -40000, -88, -60, -100], [800, 2000, 580, 480, 460, -12, 660, -20, -44], [1100, 1480, 660, -8, -36, 800, 2240, 360, -132], [2400, 3220, 3840, -4, -4, 1220, 280, -16, -128]]
INFO:root:Count MDP: 5
INFO:root:Ship 2 command: o actual position: Position(19, 24) new position: Position(19, 24)
INFO:root:Time: 0.05903220176696777
INFO:root:=============== TURN 029 ================
INFO:root:Terminais: [(0, 1), (0, 4), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (2, 1), (2, 2), (2, 4), (2, 5), (3, 1), (3, 8), (4, 0), (4, 1), (4, 6), (5, 1), (5, 5), (5, 8), (6, 1), (6, 3), (6, 5), (7, 0), (7, 2), (7, 3), (7, 8), (8, 0), (8, 1), (8, 2), (8, 3), (8, 5)]
INFO:root:Rewards:
[[-4, 2140, -8000, -8, 20, -28, -16, 320, 400], [1600, 1860, 320, -8, -12, -88, -44, -160, -36], [-84, 900, 1160, -84, 620, 160, -52, -52, -12], [-32, 980, 0, -160, -156, -148, 0, -24, 360], [280, 360, -84, -76, -4, -108, 820, -32, -36], [-52, 180, -80, -40, -64, 140, -36, -72, 20], [-36, 60, -16, -40000, -40, 440, -88, -96, 0], [400, -4, 420, 2820, -8000, -88, -60, -100, 840], [2000, 580, 480, 460, -12, 660, -20, -44, -44]]
INFO:root:Count MDP: 5
INFO:root:Ship 8 command: n actual position: Position(17, 25) new position: Position(17, 24)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 2), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 1), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1660, 2440, 1800, 700, 1900, 5900, 6160, 3200, 3860], [420, 180, 920, -12, 860, 4340, 4820, 4660, 3980], [400, -36, 240, 1520, 1600, 2080, 2400, 4600, 3160], [-36, -36, 420, 780, 1380, 1760, 6240, 6380, 3220], [-12, -4, -24, -36, 60, 2140, 2740, 8260, 4200], [360, -12, 20, 400, 780, 660, 2580, 7040, 4220], [-36, 560, 440, 1500, 940, 1880, 2400, 3040, 4160], [20, 3340, 820, 880, 2520, 6740, 2700, 2160, 7280], [0, 920, 5040, 3580, 2420, 4620, 6060, 3540, 8900]]
INFO:root:Count MDP: 3
INFO:root:Ship 0 command: o actual position: Position(15, 33) new position: Position(15, 33)
INFO:root:Terminais: [(0, 1), (0, 8), (1, 0), (1, 1), (1, 6), (2, 1), (2, 5), (2, 8), (3, 1), (3, 3), (3, 5), (4, 0), (4, 2), (4, 3), (4, 8), (5, 0), (5, 1), (5, 2), (5, 3), (5, 5), (6, 0), (6, 1), (6, 4), (6, 5), (6, 6), (7, 0), (7, 1), (7, 4), (7, 5), (8, 0), (8, 1), (8, 5), (8, 6)]
INFO:root:Rewards:
[[-32, 980, 0, -160, -156, -148, 0, -24, 360], [280, 360, -84, -8000, -4, -108, 820, -32, -36], [-52, 180, -80, -40, -64, 140, -36, -72, 20], [-36, 60, -16, -40000, -40, 440, -88, -96, 0], [400, -4, 420, 2820, -36, -88, -60, -100, 840], [2000, 580, 480, 460, -12, 660, -20, -44, -44], [1480, 660, -8, -36, 800, 2240, 360, -132, -20], [3220, 3840, -4, -4, 1220, 280, -16, -128, -88], [1880, 5140, -36, -160, -60, 1760, 280, -156, -120]]
INFO:root:Count MDP: 8
INFO:root:Ship 4 command: n actual position: Position(20, 25) new position: Position(20, 24)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 1), (4, 3), (4, 6), (5, 2), (5, 3), (5, 4), (6, 1), (6, 3), (6, 4), (6, 6), (6, 7), (7, 3), (8, 2), (8, 3), (8, 8)]
INFO:root:Rewards:
[[1660, 2760, 3300, 5700, 5400, 10060, 9180, 3360, 3600], [2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960], [540, 1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580], [60, 1060, 140, -12, 700, 320, 380, 140, 320], [-12, 860, -4, 2140, -36, -8, 20, -28, -16], [-108, -120, 1600, 1860, 320, -8, -12, -88, -44], [-120, 40, -84, 900, 1160, -84, 620, 160, -52], [-156, -160, -32, 980, 0, -160, -156, -148, 0], [-80, -120, 280, 360, -84, -8000, -4, -108, 820]]
INFO:root:Count MDP: 6
INFO:root:Ship 6 command: n actual position: Position(13, 23) new position: Position(13, 22)
INFO:root:Terminais: [(0, 0), (0, 2), (0, 3), (0, 5), (0, 6), (1, 2), (2, 1), (2, 2), (2, 7), (3, 2), (3, 6), (4, 0), (4, 2), (4, 4), (4, 6), (5, 0), (5, 1), (5, 3), (5, 4), (6, 0), (6, 1), (6, 2), (6, 3), (6, 4), (6, 6), (7, 0), (7, 1), (7, 2), (7, 5), (7, 6), (7, 7), (8, 0), (8, 1), (8, 2), (8, 5), (8, 6)]
INFO:root:Rewards:
[[40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, 0, -24], [-120, 280, 360, -84, -8000, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72], [2180, -36, 60, -16, 1000, -40, 440, -88, -96], [1660, 400, -4, 420, -40000, -36, -88, -60, -100], [800, 2000, 580, 480, 460, -12, 660, -20, -44], [1100, 1480, 660, -8, -36, 800, 2240, 360, -132], [2400, 3220, 3840, -4, -4, 1220, 280, -16, -128]]
INFO:root:Count MDP: 5
INFO:root:Ship 2 command: o actual position: Position(19, 24) new position: Position(19, 24)
INFO:root:Time: 0.07185196876525879
INFO:root:=============== TURN 030 ================
INFO:root:Terminais: [(0, 0), (0, 2), (0, 5), (0, 8), (1, 1), (1, 2), (1, 3), (2, 0), (2, 2), (2, 3), (2, 5), (2, 6), (3, 2), (4, 1), (4, 2), (4, 7), (5, 2), (5, 6), (6, 0), (6, 2), (6, 4), (6, 6), (7, 0), (7, 1), (7, 3), (7, 4), (8, 0), (8, 1), (8, 2), (8, 3), (8, 4), (8, 6)]
INFO:root:Rewards:
[[860, -4, -40000, -36, -8, 20, -28, -16, 320], [-120, 1600, 1860, 320, -8, -12, -88, -44, -160], [40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, 0, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72], [2180, -36, 60, -16, -40000, -40, 440, -88, -96], [1660, 400, -4, 420, -40000, -36, -88, -60, -100], [800, 2000, 580, 480, 460, -12, 660, -20, -44]]
INFO:root:Count MDP: 4
INFO:root:Ship 8 command: n actual position: Position(17, 24) new position: Position(17, 23)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 2), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 1), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 1), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1660, 2440, 1800, 700, 1900, 5900, 6160, 3200, 3860], [420, 180, 920, -12, 860, 4340, 4820, 4660, 3980], [400, -36, 240, 1520, 1600, 2080, 2400, 4600, 3160], [-36, -36, 420, 780, 1380, 1760, 6240, 6380, 3220], [-12, -4, -24, -36, -32, 2140, 2740, 8260, 4200], [360, -12, 20, 400, 780, 660, 2580, 7040, 4220], [-36, 560, 440, 1500, 940, 1880, 2400, 3040, 4160], [20, 3340, 820, 880, 2520, 6740, 2700, 2160, 7280], [0, 920, 5040, 3580, 2420, 4620, 6060, 3540, 8900]]
INFO:root:Count MDP: 4
INFO:root:Ship 0 command: s actual position: Position(15, 33) new position: Position(15, 34)
INFO:root:Terminais: [(0, 0), (0, 2), (0, 3), (0, 5), (0, 6), (1, 2), (2, 1), (2, 2), (2, 7), (3, 2), (3, 6), (4, 0), (4, 2), (4, 4), (4, 6), (5, 0), (5, 1), (5, 3), (5, 4), (6, 0), (6, 1), (6, 2), (6, 3), (6, 4), (6, 6), (7, 0), (7, 1), (7, 2), (7, 5), (7, 6), (7, 7), (8, 0), (8, 1), (8, 2), (8, 5), (8, 6)]
INFO:root:Rewards:
[[40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, 0, -24], [-120, 280, 360, -8000, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72], [2180, -36, 60, -16, 540, -40, 440, -88, -96], [1660, 400, -4, 420, -40000, -36, -88, -60, -100], [800, 2000, 580, 480, 460, -12, 660, -20, -44], [1100, 1480, 660, -8, -36, 800, 2240, 360, -132], [2400, 3220, 3840, -4, -4, 1220, 280, -16, -128]]
INFO:root:Count MDP: 4
INFO:root:Ship 2 command: o actual position: Position(19, 24) new position: Position(19, 24)
INFO:root:Terminais: [(0, 2), (1, 1), (1, 2), (1, 7), (2, 2), (2, 6), (3, 0), (3, 2), (3, 4), (3, 6), (4, 0), (4, 1), (4, 3), (4, 4), (5, 0), (5, 1), (5, 2), (5, 3), (5, 4), (5, 6), (6, 0), (6, 1), (6, 2), (6, 5), (6, 6), (6, 7), (7, 0), (7, 1), (7, 2), (7, 5), (7, 6), (8, 0), (8, 1), (8, 2), (8, 6), (8, 7)]
INFO:root:Rewards:
[[-160, -32, 980, 0, -160, -156, -148, 0, -24], [-120, 280, 360, -8000, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72], [2180, -36, 60, -16, -40000, -40, 440, -88, -96], [1660, 400, -4, 420, 2820, -36, -88, -60, -100], [800, 2000, 580, 480, 460, -12, 660, -20, -44], [1100, 1480, 660, -8, -36, 800, 2240, 360, -132], [2400, 3220, 3840, -4, -4, 1220, 280, -16, -128], [4160, 1880, 5140, -36, -160, -60, 1760, 280, -156]]
INFO:root:Count MDP: 6
INFO:root:Ship 4 command: o actual position: Position(20, 24) new position: Position(20, 24)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 5), (3, 6), (3, 7), (3, 8), (4, 2), (4, 4), (4, 7), (5, 3), (5, 4), (5, 5), (6, 2), (6, 4), (6, 5), (6, 7), (6, 8), (7, 4), (8, 3), (8, 4)]
INFO:root:Rewards:
[[1080, 1660, 2760, 3300, 5700, 5400, 10060, 9180, 3360], [-84, 2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520], [820, 540, 1120, 3840, 3880, 1460, 1700, 2000, 2140], [740, 60, 1060, 140, -12, 700, 320, 380, 140], [-76, -12, 860, -4, 2140, -36, -8, 20, -28], [-148, -108, -120, 1600, 1860, 320, -8, -12, -88], [-120, -120, 40, -84, 900, 1160, -84, 620, 160], [-160, -156, -160, -32, 980, 0, -160, -156, -148], [-4, -80, -120, 280, 360, -8000, -76, -4, -108]]
INFO:root:Count MDP: 5
INFO:root:Ship 6 command: o actual position: Position(13, 22) new position: Position(13, 22)
INFO:root:Time: 0.06449079513549805
INFO:root:=============== TURN 031 ================
INFO:root:Terminais: [(0, 0), (0, 2), (0, 3), (0, 5), (0, 6), (1, 2), (2, 1), (2, 2), (2, 7), (3, 2), (3, 6), (4, 0), (4, 2), (4, 4), (4, 6), (5, 0), (5, 1), (5, 3), (5, 4), (6, 0), (6, 1), (6, 2), (6, 3), (6, 4), (6, 6), (7, 0), (7, 1), (7, 2), (7, 5), (7, 6), (7, 7), (8, 0), (8, 1), (8, 2), (8, 5), (8, 6)]
INFO:root:Rewards:
[[40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, 0, -24], [-120, 280, 360, -8000, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72], [2180, -36, 60, -16, 200, -40, 440, -88, -96], [1660, 400, -4, 420, -40000, -36, -88, -60, -100], [800, 2000, 580, 480, 460, -12, 660, -20, -44], [1100, 1480, 660, -8, -36, 800, 2240, 360, -132], [2400, 3220, 3840, -4, -4, 1220, 280, -16, -128]]
INFO:root:Count MDP: 4
INFO:root:Ship 2 command: o actual position: Position(19, 24) new position: Position(19, 24)
INFO:root:Terminais: [(0, 2), (1, 1), (1, 2), (1, 7), (2, 2), (2, 6), (3, 0), (3, 2), (3, 4), (3, 6), (4, 0), (4, 1), (4, 3), (4, 4), (5, 0), (5, 1), (5, 2), (5, 3), (5, 4), (5, 6), (6, 0), (6, 1), (6, 2), (6, 5), (6, 6), (6, 7), (7, 0), (7, 1), (7, 2), (7, 5), (7, 6), (8, 0), (8, 1), (8, 2), (8, 6), (8, 7)]
INFO:root:Rewards:
[[-160, -32, 980, 0, -160, -156, -148, 0, -24], [-120, 280, 360, -8000, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72], [2180, -36, 60, -16, -40000, -40, 440, -88, -96], [1660, 400, -4, 420, 1900, -36, -88, -60, -100], [800, 2000, 580, 480, 460, -12, 660, -20, -44], [1100, 1480, 660, -8, -36, 800, 2240, 360, -132], [2400, 3220, 3840, -4, -4, 1220, 280, -16, -128], [4160, 1880, 5140, -36, -160, -60, 1760, 280, -156]]
INFO:root:Count MDP: 5
INFO:root:Ship 4 command: o actual position: Position(20, 24) new position: Position(20, 24)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 5), (3, 6), (3, 7), (3, 8), (4, 2), (4, 4), (4, 7), (5, 3), (5, 4), (5, 5), (6, 2), (6, 4), (6, 5), (6, 7), (6, 8), (7, 4), (8, 3), (8, 4)]
INFO:root:Rewards:
[[1080, 1660, 2760, 3300, 5700, 5400, 10060, 9180, 3360], [-84, 2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520], [820, 540, 1120, 3840, 3880, 1460, 1700, 2000, 2140], [740, 60, 1060, 140, -12, 700, 320, 380, 140], [-76, -12, 860, -4, 1400, -36, -8, 20, -28], [-148, -108, -120, 1600, 1860, 320, -8, -12, -88], [-120, -120, 40, -84, 900, 1160, -84, 620, 160], [-160, -156, -160, -32, 980, 0, -160, -156, -148], [-4, -80, -120, 280, 360, -8000, -76, -4, -108]]
INFO:root:Count MDP: 4
INFO:root:Ship 6 command: o actual position: Position(13, 22) new position: Position(13, 22)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 1), (5, 2), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 1), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2440, 1800, 700, 1900, 5900, 6160, 3200, 3860, 4820], [180, 920, -12, 860, 4340, 4820, 4660, 3980, 2320], [-36, 240, 1520, 1600, 2080, 2400, 4600, 3160, 5600], [-36, 420, 780, 1380, 1760, 6240, 6380, 3220, 2720], [-4, -24, -36, -32, 2140, 2740, 8260, 4200, 3480], [-12, 20, 400, 780, 660, 2580, 7040, 4220, 3940], [560, 440, 1500, 940, 1880, 2400, 3040, 4160, 6460], [3340, 820, 880, 2520, 6740, 2700, 2160, 7280, 10360], [920, 5040, 3580, 2420, 4620, 6060, 3540, 8900, 7600]]
INFO:root:Count MDP: 4
INFO:root:Ship 0 command: o actual position: Position(15, 34) new position: Position(15, 34)
INFO:root:Terminais: [(0, 1), (0, 3), (0, 6), (1, 2), (1, 3), (1, 4), (2, 1), (2, 3), (2, 4), (2, 6), (2, 7), (3, 3), (4, 2), (4, 3), (4, 8), (5, 0), (5, 3), (5, 7), (6, 0), (6, 1), (6, 3), (6, 5), (6, 7), (7, 0), (7, 1), (7, 2), (7, 4), (7, 5), (8, 0), (8, 1), (8, 2), (8, 3), (8, 4), (8, 5), (8, 7)]
INFO:root:Rewards:
[[-12, 860, -4, -40000, -36, -8, 20, -28, -16], [-108, -120, 1600, 1860, 320, -8, -12, -88, -44], [-120, 40, -84, 900, 1160, -84, 620, 160, -52], [-156, -160, -32, 980, 0, -160, -156, -148, 0], [-80, -120, 280, 360, -84, -76, -4, -108, 820], [640, -120, -52, 180, -80, -40, -64, 140, -36], [280, 2180, -36, 60, -16, -40000, -40, 440, -88], [1120, 1660, 400, -4, 420, -40000, -36, -88, -60], [2980, 800, 2000, 580, 480, 460, -12, 660, -20]]
INFO:root:Count MDP: 5
INFO:root:Ship 8 command: w actual position: Position(17, 23) new position: Position(16, 23)
INFO:root:Time: 0.06253719329833984
INFO:root:=============== TURN 032 ================
INFO:root:Terminais: [(0, 0), (0, 2), (0, 3), (0, 5), (0, 6), (1, 2), (2, 1), (2, 2), (2, 7), (3, 2), (3, 6), (4, 0), (4, 2), (4, 6), (5, 0), (5, 1), (5, 3), (5, 4), (6, 0), (6, 1), (6, 2), (6, 3), (6, 4), (6, 6), (7, 0), (7, 1), (7, 2), (7, 5), (7, 6), (7, 7), (8, 0), (8, 1), (8, 2), (8, 5), (8, 6)]
INFO:root:Rewards:
[[40, -84, 900, 1160, -84, 620, 160, -52, -52], [-160, -32, 980, -8000, -160, -156, -148, 0, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72], [2180, -36, 60, -16, -12, -40, 440, -88, -96], [1660, 400, -4, 420, -40000, -36, -88, -60, -100], [800, 2000, 580, 480, 460, -12, 660, -20, -44], [1100, 1480, 660, -8, -36, 800, 2240, 360, -132], [2400, 3220, 3840, -4, -4, 1220, 280, -16, -128]]
INFO:root:Count MDP: 5
INFO:root:Ship 2 command: s actual position: Position(19, 24) new position: Position(19, 25)
INFO:root:Terminais: [(0, 2), (1, 1), (1, 2), (1, 7), (2, 2), (2, 6), (3, 0), (3, 2), (3, 6), (4, 0), (4, 1), (4, 3), (4, 4), (5, 0), (5, 1), (5, 2), (5, 3), (5, 4), (5, 6), (6, 0), (6, 1), (6, 2), (6, 5), (6, 6), (6, 7), (7, 0), (7, 1), (7, 2), (7, 5), (7, 6), (8, 0), (8, 1), (8, 2), (8, 6), (8, 7)]
INFO:root:Rewards:
[[-160, -32, 980, -8000, -160, -156, -148, 0, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72], [2180, -36, 60, -16, -12, -8000, 440, -88, -96], [1660, 400, -4, 420, 1220, -36, -88, -60, -100], [800, 2000, 580, 480, 460, -12, 660, -20, -44], [1100, 1480, 660, -8, -36, 800, 2240, 360, -132], [2400, 3220, 3840, -4, -4, 1220, 280, -16, -128], [4160, 1880, 5140, -36, -160, -60, 1760, 280, -156]]
INFO:root:Count MDP: 5
INFO:root:Ship 4 command: o actual position: Position(20, 24) new position: Position(20, 24)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 5), (3, 6), (3, 7), (3, 8), (4, 2), (4, 4), (4, 7), (5, 3), (5, 4), (5, 5), (6, 2), (6, 4), (6, 5), (6, 7), (6, 8), (7, 4), (8, 3), (8, 4)]
INFO:root:Rewards:
[[1080, 1660, 2760, 3300, 5700, 5400, 10060, 9180, 3360], [-84, 2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520], [820, 540, 1120, 3840, 3880, 1460, 1700, 2000, 2140], [740, 60, 1060, 140, -12, 700, 320, 380, 140], [-76, -12, 860, -4, 840, -36, -8, 20, -28], [-148, -108, -120, 1600, 1860, 320, -8, -12, -88], [-120, -120, 40, -84, 900, 1160, -84, 620, 160], [-160, -156, -160, -32, 980, -8000, -160, -156, -148], [-4, -80, -120, 280, 360, -84, -76, -4, -108]]
INFO:root:Count MDP: 4
INFO:root:Ship 6 command: o actual position: Position(13, 22) new position: Position(13, 22)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 1), (1, 3), (1, 6), (2, 2), (2, 3), (2, 4), (3, 1), (3, 3), (3, 4), (3, 6), (3, 7), (4, 3), (5, 2), (5, 3), (5, 8), (6, 0), (6, 3), (6, 7), (7, 0), (7, 1), (7, 3), (7, 7), (8, 0), (8, 1), (8, 2), (8, 4), (8, 5)]
INFO:root:Rewards:
[[60, 1060, 140, -12, 700, 320, 380, 140, 320], [-12, 860, -4, -40000, -36, -8, 20, -28, -16], [-108, -120, 1600, 1860, 320, -8, -12, -88, -44], [-120, 40, -84, 900, 1160, -84, 620, 160, -52], [-156, -160, -32, 980, 0, -160, -156, -148, 0], [-80, -120, 280, 360, -84, -76, -4, -108, 820], [640, -120, -52, 180, -80, -40, -64, 140, -36], [280, 2180, -36, 60, -16, -12, -8000, 440, -88], [1120, 1660, 400, -4, 420, -40000, -36, -88, -60]]
INFO:root:Count MDP: 5
INFO:root:Ship 8 command: w actual position: Position(16, 23) new position: Position(15, 23)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 1), (5, 2), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 1), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2440, 1800, 700, 1900, 5900, 6160, 3200, 3860, 4820], [180, 920, -12, 860, 4340, 4820, 4660, 3980, 2320], [-36, 240, 1520, 1600, 2080, 2400, 4600, 3160, 5600], [-36, 420, 780, 1380, 1760, 6240, 6380, 3220, 2720], [-4, -24, -36, -32, 1400, 2740, 8260, 4200, 3480], [-12, 20, 400, 780, 660, 2580, 7040, 4220, 3940], [560, 440, 1500, 940, 1880, 2400, 3040, 4160, 6460], [3340, 820, 880, 2520, 6740, 2700, 2160, 7280, 10360], [920, 5040, 3580, 2420, 4620, 6060, 3540, 8900, 7600]]
INFO:root:Count MDP: 4
INFO:root:Ship 0 command: o actual position: Position(15, 34) new position: Position(15, 34)
INFO:root:Time: 0.06547260284423828
INFO:root:=============== TURN 033 ================
INFO:root:Terminais: [(0, 2), (1, 1), (1, 2), (1, 7), (2, 2), (2, 6), (3, 0), (3, 2), (3, 6), (4, 0), (4, 1), (4, 3), (4, 4), (5, 0), (5, 1), (5, 2), (5, 3), (5, 4), (5, 6), (6, 0), (6, 1), (6, 2), (6, 5), (6, 6), (6, 7), (7, 0), (7, 1), (7, 2), (7, 5), (7, 6), (8, 0), (8, 1), (8, 2), (8, 6), (8, 7)]
INFO:root:Rewards:
[[-160, -32, 980, 0, -160, -156, -148, 0, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72], [2180, -36, 60, -16, -12, -8000, 440, -88, -96], [1660, 400, -4, 420, 700, -36, -88, -60, -100], [800, 2000, 580, 480, 460, -12, 660, -20, -44], [1100, 1480, 660, -8, -36, 800, 2240, 360, -132], [2400, 3220, 3840, -4, -4, 1220, 280, -16, -128], [4160, 1880, 5140, -36, -160, -60, 1760, 280, -156]]
INFO:root:Count MDP: 4
INFO:root:Ship 4 command: o actual position: Position(20, 24) new position: Position(20, 24)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 5), (3, 6), (3, 7), (3, 8), (4, 2), (4, 4), (4, 7), (5, 3), (5, 4), (5, 5), (6, 2), (6, 4), (6, 5), (6, 7), (6, 8), (7, 4), (8, 3), (8, 4)]
INFO:root:Rewards:
[[1080, 1660, 2760, 3300, 5700, 5400, 10060, 9180, 3360], [-84, 2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520], [820, 540, 1120, 3840, 3880, 1460, 1700, 2000, 2140], [740, 60, 1060, 140, -12, 700, 320, 380, 140], [-76, -12, 860, -4, 420, -36, -8, 20, -28], [-148, -108, -120, 1600, 1860, 320, -8, -12, -88], [-120, -120, 40, -84, 900, -40000, -84, 620, 160], [-160, -156, -160, -32, 980, 0, -160, -156, -148], [-4, -80, -120, 280, 360, -84, -76, -4, -108]]
INFO:root:Count MDP: 4
INFO:root:Ship 6 command: o actual position: Position(13, 22) new position: Position(13, 22)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 1), (2, 3), (2, 6), (3, 2), (3, 3), (3, 4), (4, 1), (4, 3), (4, 4), (4, 6), (4, 7), (5, 3), (6, 2), (6, 3), (6, 8), (7, 0), (7, 3), (7, 7), (8, 0), (8, 1), (8, 3), (8, 7)]
INFO:root:Rewards:
[[540, 1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580], [60, 1060, 140, -12, 700, 320, 380, 140, 320], [-12, 860, -4, -40000, -36, -8, 20, -28, -16], [-108, -120, 1600, 1860, 320, -8, -12, -88, -44], [-120, 40, -84, 900, 1160, -84, 620, 160, -52], [-156, -160, -32, 980, 0, -160, -156, -148, 0], [-80, -120, 280, 360, -84, -76, -4, -108, 820], [640, -120, -52, 180, -80, -40, -64, 140, -36], [280, 2180, -36, 60, -16, -12, -8000, 440, -88]]
INFO:root:Count MDP: 5
INFO:root:Ship 8 command: o actual position: Position(15, 23) new position: Position(15, 23)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 1), (5, 2), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 1), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2440, 1800, 700, 1900, 5900, 6160, 3200, 3860, 4820], [180, 920, -12, 860, 4340, 4820, 4660, 3980, 2320], [-36, 240, 1520, 1600, 2080, 2400, 4600, 3160, 5600], [-36, 420, 780, 1380, 1760, 6240, 6380, 3220, 2720], [-4, -24, -36, -32, 840, 2740, 8260, 4200, 3480], [-12, 20, 400, 780, 660, 2580, 7040, 4220, 3940], [560, 440, 1500, 940, 1880, 2400, 3040, 4160, 6460], [3340, 820, 880, 2520, 6740, 2700, 2160, 7280, 10360], [920, 5040, 3580, 2420, 4620, 6060, 3540, 8900, 7600]]
INFO:root:Count MDP: 4
INFO:root:Ship 0 command: o actual position: Position(15, 34) new position: Position(15, 34)
INFO:root:Terminais: [(0, 1), (0, 2), (0, 4), (0, 5), (1, 1), (1, 8), (2, 0), (2, 1), (2, 6), (3, 1), (3, 5), (3, 8), (4, 1), (4, 5), (5, 0), (5, 2), (5, 3), (5, 8), (6, 0), (6, 1), (6, 2), (6, 3), (6, 5), (7, 0), (7, 1), (7, 4), (7, 5), (7, 6), (8, 0), (8, 1), (8, 4), (8, 5)]
INFO:root:Rewards:
[[-84, 900, -40000, -84, 620, 160, -52, -52, -12], [-32, 980, 0, -160, -156, -148, 0, -24, 360], [280, 360, -84, -76, -4, -108, 820, -32, -36], [-52, 180, -80, -40, -64, 140, -36, -72, 20], [-36, 60, -16, -12, -40, 440, -88, -96, 0], [400, -4, 420, -40000, -36, -88, -60, -100, 840], [2000, 580, 480, 460, -12, 660, -20, -44, -44], [1480, 660, -8, -36, 800, 2240, 360, -132, -20], [3220, 3840, -4, -4, 1220, 280, -16, -128, -88]]
INFO:root:Count MDP: 4
INFO:root:Ship 2 command: e actual position: Position(19, 25) new position: Position(20, 25)
INFO:root:Time: 0.050810813903808594
INFO:root:=============== TURN 034 ================
INFO:root:Terminais: [(0, 2), (1, 1), (1, 2), (1, 7), (2, 2), (2, 6), (3, 0), (3, 2), (3, 6), (4, 0), (4, 1), (4, 3), (4, 4), (5, 0), (5, 1), (5, 2), (5, 3), (5, 4), (5, 6), (6, 0), (6, 1), (6, 2), (6, 5), (6, 6), (6, 7), (7, 0), (7, 1), (7, 2), (7, 5), (7, 6), (8, 0), (8, 1), (8, 2), (8, 6), (8, 7)]
INFO:root:Rewards:
[[-160, -32, 980, 0, -160, -156, -148, 0, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72], [2180, -36, 60, -16, -12, -40, 440, -88, -96], [1660, 400, -4, 420, 320, -8000, -88, -60, -100], [800, 2000, 580, 480, 460, -12, 660, -20, -44], [1100, 1480, 660, -8, -36, 800, 2240, 360, -132], [2400, 3220, 3840, -4, -4, 1220, 280, -16, -128], [4160, 1880, 5140, -36, -160, -60, 1760, 280, -156]]
INFO:root:Count MDP: 5
INFO:root:Ship 4 command: o actual position: Position(20, 24) new position: Position(20, 24)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 5), (3, 6), (3, 7), (3, 8), (4, 2), (4, 4), (4, 7), (5, 3), (5, 4), (5, 5), (6, 2), (6, 4), (6, 5), (6, 7), (6, 8), (7, 4), (8, 3), (8, 4)]
INFO:root:Rewards:
[[1080, 1660, 2760, 3300, 5700, 5400, 10060, 9180, 3360], [-84, 2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520], [820, 540, 1120, 3840, 3880, 1460, 1700, 2000, 2140], [740, 60, 1060, 140, -12, 700, 320, 380, 140], [-76, -12, 860, -4, 100, -36, -8, 20, -28], [-148, -108, -120, 1600, 1860, 320, -8, -12, -88], [-120, -120, 40, -84, 900, -40000, -84, 620, 160], [-160, -156, -160, -32, 980, 0, -160, -156, -148], [-4, -80, -120, 280, 360, -84, -76, -4, -108]]
INFO:root:Count MDP: 4
INFO:root:Ship 6 command: o actual position: Position(13, 22) new position: Position(13, 22)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 1), (2, 3), (2, 6), (3, 2), (3, 3), (3, 4), (4, 1), (4, 3), (4, 4), (4, 6), (4, 7), (5, 3), (6, 2), (6, 3), (6, 8), (7, 0), (7, 3), (7, 7), (8, 0), (8, 1), (8, 3), (8, 7)]
INFO:root:Rewards:
[[540, 1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580], [60, 1060, 140, -12, 700, 320, 380, 140, 320], [-12, 860, -4, -40000, -36, -8, 20, -28, -16], [-108, -120, 1600, 1860, 320, -8, -12, -88, -44], [-120, 40, -84, 900, 660, -84, 620, 160, -52], [-156, -160, -32, 980, 0, -160, -156, -148, 0], [-80, -120, 280, 360, -84, -76, -4, -108, 820], [640, -120, -52, 180, -80, -40, -64, 140, -36], [280, 2180, -36, 60, -16, -12, -40, 440, -88]]
INFO:root:Count MDP: 5
INFO:root:Ship 8 command: o actual position: Position(15, 23) new position: Position(15, 23)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 1), (5, 2), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 1), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2440, 1800, 700, 1900, 5900, 6160, 3200, 3860, 4820], [180, 920, -12, 860, 4340, 4820, 4660, 3980, 2320], [-36, 240, 1520, 1600, 2080, 2400, 4600, 3160, 5600], [-36, 420, 780, 1380, 1760, 6240, 6380, 3220, 2720], [-4, -24, -36, -32, 420, 2740, 8260, 4200, 3480], [-12, 20, 400, 780, 660, 2580, 7040, 4220, 3940], [560, 440, 1500, 940, 1880, 2400, 3040, 4160, 6460], [3340, 820, 880, 2520, 6740, 2700, 2160, 7280, 10360], [920, 5040, 3580, 2420, 4620, 6060, 3540, 8900, 7600]]
INFO:root:Count MDP: 4
INFO:root:Ship 0 command: o actual position: Position(15, 34) new position: Position(15, 34)
INFO:root:Terminais: [(0, 1), (0, 8), (1, 0), (1, 1), (1, 6), (2, 1), (2, 5), (2, 8), (3, 1), (3, 5), (4, 0), (4, 2), (4, 3), (4, 8), (5, 0), (5, 1), (5, 2), (5, 3), (5, 5), (6, 0), (6, 1), (6, 4), (6, 5), (6, 6), (7, 0), (7, 1), (7, 4), (7, 5), (8, 0), (8, 1), (8, 5), (8, 6)]
INFO:root:Rewards:
[[-32, 980, 0, -160, -156, -148, 0, -24, 360], [280, 360, -84, -76, -4, -108, 820, -32, -36], [-52, 180, -80, -40, -64, 140, -36, -72, 20], [-36, 60, -16, -12, -40, 440, -88, -96, 0], [400, -4, 420, -40000, -36, -88, -60, -100, 840], [2000, 580, 480, 460, -12, 660, -20, -44, -44], [1480, 660, -8, -36, 800, 2240, 360, -132, -20], [3220, 3840, -4, -4, 1220, 280, -16, -128, -88], [1880, 5140, -36, -160, -60, 1760, 280, -156, -120]]
INFO:root:Count MDP: 4
INFO:root:Ship 2 command: e actual position: Position(20, 25) new position: Position(21, 25)
INFO:root:Time: 0.05766129493713379
INFO:root:=============== TURN 035 ================
INFO:root:Terminais: [(0, 2), (1, 1), (1, 2), (1, 7), (2, 2), (2, 6), (3, 0), (3, 2), (3, 6), (4, 0), (4, 1), (4, 3), (4, 4), (5, 0), (5, 1), (5, 2), (5, 3), (5, 4), (5, 6), (6, 0), (6, 1), (6, 2), (6, 5), (6, 6), (6, 7), (7, 0), (7, 1), (7, 2), (7, 5), (7, 6), (8, 0), (8, 1), (8, 2), (8, 6), (8, 7)]
INFO:root:Rewards:
[[-160, -32, 980, 0, -160, -156, -148, 0, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72], [2180, -36, 60, -16, -12, -40, 440, -88, -96], [1660, 400, -4, 420, 40, -36, -88, -60, -100], [800, 2000, 580, 480, 460, -8000, 660, -20, -44], [1100, 1480, 660, -8, -36, 800, 2240, 360, -132], [2400, 3220, 3840, -4, -4, 1220, 280, -16, -128], [4160, 1880, 5140, -36, -160, -60, 1760, 280, -156]]
INFO:root:Count MDP: 4
INFO:root:Ship 4 command: o actual position: Position(20, 24) new position: Position(20, 24)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 5), (3, 6), (3, 7), (3, 8), (4, 2), (4, 7), (5, 3), (5, 4), (5, 5), (6, 2), (6, 4), (6, 5), (6, 7), (6, 8), (7, 4), (8, 3), (8, 4)]
INFO:root:Rewards:
[[1080, 1660, 2760, 3300, 5700, 5400, 10060, 9180, 3360], [-84, 2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520], [820, 540, 1120, 3840, 3880, 1460, 1700, 2000, 2140], [740, 60, 1060, 140, -12, 700, 320, 380, 140], [-76, -12, 860, -4, -28, -36, -8, 20, -28], [-148, -108, -120, 1600, 1860, 320, -8, -12, -88], [-120, -120, 40, -84, 900, -40000, -84, 620, 160], [-160, -156, -160, -32, 980, 0, -160, -156, -148], [-4, -80, -120, 280, 360, -84, -76, -4, -108]]
INFO:root:Count MDP: 6
INFO:root:Ship 6 command: w actual position: Position(13, 22) new position: Position(12, 22)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 1), (2, 6), (3, 2), (3, 3), (3, 4), (4, 1), (4, 3), (4, 4), (4, 6), (4, 7), (5, 3), (6, 2), (6, 3), (6, 8), (7, 0), (7, 3), (7, 7), (8, 0), (8, 1), (8, 3), (8, 7)]
INFO:root:Rewards:
[[540, 1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580], [60, 1060, 140, -8000, 700, 320, 380, 140, 320], [-12, 860, -4, -28, -36, -8, 20, -28, -16], [-108, -120, 1600, 1860, 320, -8, -12, -88, -44], [-120, 40, -84, 900, 280, -84, 620, 160, -52], [-156, -160, -32, 980, 0, -160, -156, -148, 0], [-80, -120, 280, 360, -84, -76, -4, -108, 820], [640, -120, -52, 180, -80, -40, -64, 140, -36], [280, 2180, -36, 60, -16, -12, -40, 440, -88]]
INFO:root:Count MDP: 5
INFO:root:Ship 8 command: o actual position: Position(15, 23) new position: Position(15, 23)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 1), (5, 2), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 1), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2440, 1800, 700, 1900, 5900, 6160, 3200, 3860, 4820], [180, 920, -12, 860, 4340, 4820, 4660, 3980, 2320], [-36, 240, 1520, 1600, 2080, 2400, 4600, 3160, 5600], [-36, 420, 780, 1380, 1760, 6240, 6380, 3220, 2720], [-4, -24, -36, -32, 100, 2740, 8260, 4200, 3480], [-12, 20, 400, 780, 660, 2580, 7040, 4220, 3940], [560, 440, 1500, 940, 1880, 2400, 3040, 4160, 6460], [3340, 820, 880, 2520, 6740, 2700, 2160, 7280, 10360], [920, 5040, 3580, 2420, 4620, 6060, 3540, 8900, 7600]]
INFO:root:Count MDP: 3
INFO:root:Ship 0 command: o actual position: Position(15, 34) new position: Position(15, 34)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 6), (1, 1), (1, 5), (1, 8), (2, 1), (2, 5), (3, 0), (3, 2), (3, 3), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 5), (5, 0), (5, 1), (5, 4), (5, 5), (5, 6), (6, 0), (6, 1), (6, 4), (6, 5), (7, 0), (7, 1), (7, 5), (7, 6), (8, 0), (8, 1), (8, 2), (8, 5), (8, 7), (8, 8)]
INFO:root:Rewards:
[[280, 360, -84, -76, -4, -108, 820, -32, -36], [-52, 180, -80, -40, -64, 140, -36, -72, 20], [-36, 60, -16, -12, -40, 440, -88, -96, 0], [400, -4, 420, -40000, -36, -88, -60, -100, 840], [2000, 580, 480, 460, -12, 660, -20, -44, -44], [1480, 660, -8, -36, 800, 2240, 360, -132, -20], [3220, 3840, -4, -4, 1220, 280, -16, -128, -88], [1880, 5140, -36, -160, -60, 1760, 280, -156, -120], [1460, 2600, 560, -144, -112, 200, -60, 440, 20]]
INFO:root:Count MDP: 4
INFO:root:Ship 2 command: e actual position: Position(21, 25) new position: Position(22, 25)
INFO:root:Time: 0.05471968650817871
INFO:root:=============== TURN 036 ================
INFO:root:Terminais: [(0, 2), (1, 1), (1, 2), (1, 7), (2, 2), (2, 6), (3, 0), (3, 2), (3, 6), (4, 0), (4, 1), (4, 3), (5, 0), (5, 1), (5, 2), (5, 3), (5, 4), (5, 6), (6, 0), (6, 1), (6, 2), (6, 5), (6, 6), (6, 7), (7, 0), (7, 1), (7, 2), (7, 5), (7, 6), (8, 0), (8, 1), (8, 2), (8, 6), (8, 7)]
INFO:root:Rewards:
[[-160, -32, 980, 0, -160, -156, -148, 0, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72], [2180, -36, 60, -16, -12, -40, 440, -88, -96], [1660, 400, -4, 420, -36, -36, -88, -60, -100], [800, 2000, 580, 480, 460, -12, 660, -20, -44], [1100, 1480, 660, -8, -36, -40000, 2240, 360, -132], [2400, 3220, 3840, -4, -4, 1220, 280, -16, -128], [4160, 1880, 5140, -36, -160, -60, 1760, 280, -156]]
INFO:root:Count MDP: 5
INFO:root:Ship 4 command: s actual position: Position(20, 24) new position: Position(20, 25)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 1), (2, 6), (3, 2), (3, 3), (3, 4), (4, 1), (4, 3), (4, 6), (4, 7), (5, 3), (6, 2), (6, 3), (6, 8), (7, 0), (7, 3), (7, 7), (8, 0), (8, 1), (8, 3), (8, 7)]
INFO:root:Rewards:
[[540, 1120, 3840, 3880, 1460, 1700, 2000, 2140, 1580], [60, 1060, 140, -8000, 700, 320, 380, 140, 320], [-12, 860, -4, -28, -36, -8, 20, -28, -16], [-108, -120, 1600, 1860, 320, -8, -12, -88, -44], [-120, 40, -84, 900, 0, -84, 620, 160, -52], [-156, -160, -32, 980, 0, -160, -156, -148, 0], [-80, -120, 280, 360, -84, -76, -4, -108, 820], [640, -120, -52, 180, -80, -40, -64, 140, -36], [280, 2180, -36, 60, -16, -12, -40, 440, -88]]
INFO:root:Count MDP: 5
INFO:root:Ship 8 command: s actual position: Position(15, 23) new position: Position(15, 24)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 5), (4, 6), (4, 7), (4, 8), (5, 1), (5, 2), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 1), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2440, 1800, 700, 1900, 5900, 6160, 3200, 3860, 4820], [180, 920, -12, 860, 4340, 4820, 4660, 3980, 2320], [-36, 240, 1520, 1600, 2080, 2400, 4600, 3160, 5600], [-36, 420, 780, 1380, 1760, 6240, 6380, 3220, 2720], [-4, -24, -36, -32, -28, 2740, 8260, 4200, 3480], [-12, 20, 400, 780, 660, 2580, 7040, 4220, 3940], [560, 440, 1500, 940, 1880, 2400, 3040, 4160, 6460], [3340, 820, 880, 2520, 6740, 2700, 2160, 7280, 10360], [920, 5040, 3580, 2420, 4620, 6060, 3540, 8900, 7600]]
INFO:root:Count MDP: 4
INFO:root:Ship 0 command: s actual position: Position(15, 34) new position: Position(15, 35)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 5), (4, 6), (4, 7), (4, 8), (5, 2), (5, 7), (6, 3), (6, 4), (6, 5), (7, 2), (7, 4), (7, 7), (7, 8), (8, 4)]
INFO:root:Rewards:
[[3600, 3660, 5500, 3520, 3920, 10100, 18960, 10200, 5760], [1080, 1660, 2760, 3300, 5700, 5400, 10060, 9180, 3360], [-84, 2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520], [820, 540, 1120, 3840, 3880, 1460, 1700, 2000, 2140], [740, 60, 1060, 140, -12, 700, 320, 380, 140], [-76, -12, 860, -4, -28, -36, -8, 20, -28], [-148, -108, -120, 1600, 1860, 320, -8, -12, -88], [-120, -120, 40, -84, 900, 0, -8000, 620, 160], [-160, -156, -160, -32, 980, 0, -160, -156, -148]]
INFO:root:Count MDP: 4
INFO:root:Ship 6 command: w actual position: Position(12, 22) new position: Position(11, 22)
INFO:root:Terminais: [(0, 1), (0, 5), (0, 8), (1, 1), (1, 5), (2, 0), (2, 2), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 5), (4, 0), (4, 1), (4, 4), (4, 5), (4, 6), (5, 0), (5, 1), (5, 4), (5, 5), (6, 0), (6, 1), (6, 5), (6, 6), (7, 0), (7, 1), (7, 2), (7, 5), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 5)]
INFO:root:Rewards:
[[-52, 180, -80, -40, -64, 140, -36, -72, 20], [-36, 60, -16, -12, -40, 440, -88, -96, 0], [400, -4, 420, -36, -8000, -88, -60, -100, 840], [2000, 580, 480, 460, -12, 660, -20, -44, -44], [1480, 660, -8, -36, 800, 2240, 360, -132, -20], [3220, 3840, -4, -4, 1220, 280, -16, -128, -88], [1880, 5140, -36, -160, -60, 1760, 280, -156, -120], [1460, 2600, 560, -144, -112, 200, -60, 440, 20], [1700, 60, 240, -132, -52, 140, -80, -84, -28]]
INFO:root:Count MDP: 4
INFO:root:Ship 2 command: o actual position: Position(22, 25) new position: Position(22, 25)
INFO:root:Time: 0.049834489822387695
INFO:root:=============== TURN 037 ================
INFO:root:Terminais: [(0, 1), (0, 5), (0, 8), (1, 1), (1, 5), (2, 0), (2, 2), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 5), (4, 0), (4, 1), (4, 4), (4, 5), (4, 6), (5, 0), (5, 1), (5, 4), (5, 5), (6, 0), (6, 1), (6, 5), (6, 6), (7, 0), (7, 1), (7, 2), (7, 5), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 5)]
INFO:root:Rewards:
[[-52, 180, -80, -40, -64, 140, -36, -72, 20], [-36, 60, -16, -12, -40, 440, -88, -96, 0], [400, -4, 420, -36, -8000, -88, -60, -100, 840], [2000, 580, 480, 460, -12, 660, -20, -44, -44], [1480, 660, -8, -36, 400, 2240, 360, -132, -20], [3220, 3840, -4, -4, 1220, 280, -16, -128, -88], [1880, 5140, -36, -160, -60, 1760, 280, -156, -120], [1460, 2600, 560, -144, -112, 200, -60, 440, 20], [1700, 60, 240, -132, -52, 140, -80, -84, -28]]
INFO:root:Count MDP: 4
INFO:root:Ship 2 command: o actual position: Position(22, 25) new position: Position(22, 25)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 2), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 1), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1800, 700, 1900, 5900, 6160, 3200, 3860, 4820, 3100], [920, -12, 860, 4340, 4820, 4660, 3980, 2320, 2140], [240, 1520, 1600, 2080, 2400, 4600, 3160, 5600, 4620], [420, 780, 1380, 1760, 6240, 6380, 3220, 2720, 8480], [-24, -36, -32, -28, 2740, 8260, 4200, 3480, 10760], [20, 400, 780, 660, 2580, 7040, 4220, 3940, 8060], [440, 1500, 940, 1880, 2400, 3040, 4160, 6460, 8280], [820, 880, 2520, 6740, 2700, 2160, 7280, 10360, 7880], [5040, 3580, 2420, 4620, 6060, 3540, 8900, 7600, 8220]]
INFO:root:Count MDP: 2
INFO:root:Ship 0 command: o actual position: Position(15, 35) new position: Position(15, 35)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 5), (2, 8), (3, 1), (3, 2), (3, 3), (4, 0), (4, 2), (4, 5), (4, 6), (5, 2), (6, 1), (6, 2), (6, 7), (7, 2), (7, 6), (8, 0), (8, 2), (8, 6)]
INFO:root:Rewards:
[[1120, 3840, -40000, 1460, 1700, 2000, 2140, 1580, 4600], [1060, 140, -12, 700, 320, 380, 140, 320, 920], [860, -4, -28, -36, -8, 20, -28, -16, 320], [-120, 1600, 1860, 320, -8, -12, -88, -44, -160], [40, -84, 900, 0, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, 0, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72], [2180, -36, 60, -16, -12, -40, 440, -88, -96]]
INFO:root:Count MDP: 6
INFO:root:Ship 8 command: w actual position: Position(15, 24) new position: Position(14, 24)
INFO:root:Terminais: [(0, 1), (0, 8), (1, 0), (1, 1), (1, 6), (2, 1), (2, 5), (2, 8), (3, 1), (3, 5), (4, 0), (4, 2), (4, 8), (5, 0), (5, 1), (5, 2), (5, 3), (5, 5), (6, 0), (6, 1), (6, 4), (6, 5), (6, 6), (7, 0), (7, 1), (7, 4), (7, 5), (8, 0), (8, 1), (8, 5), (8, 6)]
INFO:root:Rewards:
[[-32, 980, 0, -160, -156, -148, 0, -24, 360], [280, 360, -84, -76, -4, -108, 820, -32, -36], [-52, 180, -80, -40, -64, 140, -36, -72, 20], [-36, 60, -16, -12, -40, 440, -88, -96, 0], [400, -4, 420, -36, -36, -88, -60, -100, 840], [2000, 580, 480, 460, -12, 660, -20, -44, -44], [1480, 660, -8, -36, -40000, 2240, 360, -132, -20], [3220, 3840, -4, -4, 1220, 280, -16, -128, -88], [1880, 5140, -36, -160, -60, 1760, 280, -156, -120]]
INFO:root:Count MDP: 5
INFO:root:Ship 4 command: e actual position: Position(20, 25) new position: Position(21, 25)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 2), (5, 3), (5, 5), (5, 6), (5, 7), (5, 8), (6, 2), (6, 7), (7, 3), (7, 4), (7, 5), (8, 2), (8, 4), (8, 7), (8, 8)]
INFO:root:Rewards:
[[3260, 2280, 1800, 3040, 4180, 9380, 9300, 7220, 5480], [3600, 3660, 5500, 3520, 3920, 10100, 18960, 10200, 5760], [1080, 1660, 2760, 3300, 5700, 5400, 10060, 9180, 3360], [-84, 2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520], [820, 540, 1120, 3840, 3880, 1460, 1700, 2000, 2140], [740, 60, 1060, 140, -12, 700, 320, 380, 140], [-76, -12, 860, -4, -28, -36, -8, 20, -28], [-148, -108, -120, 1600, 1860, 320, -8000, -12, -88], [-120, -120, 40, -84, 900, 0, -84, 620, 160]]
INFO:root:Count MDP: 3
INFO:root:Ship 6 command: o actual position: Position(11, 22) new position: Position(11, 22)
INFO:root:Time: 0.047879934310913086
INFO:root:=============== TURN 038 ================
INFO:root:Terminais: [(0, 1), (0, 5), (0, 8), (1, 1), (1, 5), (2, 0), (2, 2), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 5), (4, 0), (4, 1), (4, 4), (4, 5), (4, 6), (5, 0), (5, 1), (5, 4), (5, 5), (6, 0), (6, 1), (6, 5), (6, 6), (7, 0), (7, 1), (7, 2), (7, 5), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 5)]
INFO:root:Rewards:
[[-52, 180, -80, -40, -64, 140, -36, -72, 20], [-36, 60, -16, -12, -40, 440, -88, -96, 0], [400, -4, 420, -36, -36, -88, -60, -100, 840], [2000, 580, 480, 460, -8000, 660, -20, -44, -44], [1480, 660, -8, -36, 100, 2240, 360, -132, -20], [3220, 3840, -4, -4, 1220, 280, -16, -128, -88], [1880, 5140, -36, -160, -60, 1760, 280, -156, -120], [1460, 2600, 560, -144, -112, 200, -60, 440, 20], [1700, 60, 240, -132, -52, 140, -80, -84, -28]]
INFO:root:Count MDP: 4
INFO:root:Ship 2 command: o actual position: Position(22, 25) new position: Position(22, 25)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 5), (3, 8), (4, 1), (4, 2), (4, 3), (5, 0), (5, 2), (5, 5), (5, 6), (6, 2), (7, 1), (7, 2), (7, 7), (8, 2), (8, 6)]
INFO:root:Rewards:
[[1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960, 6700], [1120, 3840, -40000, 1460, 1700, 2000, 2140, 1580, 4600], [1060, 140, -12, 700, 320, 380, 140, 320, 920], [860, -4, -28, -36, -8, 20, -28, -16, 320], [-120, 1600, 1860, 320, -8, -12, -88, -44, -160], [40, -84, 900, 0, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, 0, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32], [-120, -52, 180, -80, -40, -64, 140, -36, -72]]
INFO:root:Count MDP: 6
INFO:root:Ship 8 command: w actual position: Position(14, 24) new position: Position(13, 24)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 2), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 1), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1800, 700, 1900, 5900, 6160, 3200, 3860, 4820, 3100], [920, -12, 860, 4340, 4820, 4660, 3980, 2320, 2140], [240, 1520, 1600, 2080, 2400, 4600, 3160, 5600, 4620], [420, 780, 1380, 1760, 6240, 6380, 3220, 2720, 8480], [-24, -36, -32, -28, 1840, 8260, 4200, 3480, 10760], [20, 400, 780, 660, 2580, 7040, 4220, 3940, 8060], [440, 1500, 940, 1880, 2400, 3040, 4160, 6460, 8280], [820, 880, 2520, 6740, 2700, 2160, 7280, 10360, 7880], [5040, 3580, 2420, 4620, 6060, 3540, 8900, 7600, 8220]]
INFO:root:Count MDP: 1
INFO:root:Ship 0 command: o actual position: Position(15, 35) new position: Position(15, 35)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 2), (5, 3), (5, 5), (5, 6), (5, 7), (5, 8), (6, 2), (6, 7), (7, 3), (7, 4), (7, 5), (8, 2), (8, 4), (8, 7), (8, 8)]
INFO:root:Rewards:
[[3260, 2280, 1800, 3040, 4180, 9380, 9300, 7220, 5480], [3600, 3660, 5500, 3520, 3920, 10100, 18960, 10200, 5760], [1080, 1660, 2760, 3300, 5700, 5400, 10060, 9180, 3360], [-84, 2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520], [820, 540, 1120, 3840, 2700, 1460, 1700, 2000, 2140], [740, 60, 1060, 140, -12, 700, 320, 380, 140], [-76, -12, 860, -4, -28, -36, -8000, 20, -28], [-148, -108, -120, 1600, 1860, 320, -8, -12, -88], [-120, -120, 40, -84, 900, 0, -84, 620, 160]]
INFO:root:Count MDP: 3
INFO:root:Ship 6 command: o actual position: Position(11, 22) new position: Position(11, 22)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 6), (1, 1), (1, 5), (1, 8), (2, 1), (2, 5), (3, 0), (3, 2), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 5), (5, 0), (5, 1), (5, 4), (5, 5), (5, 6), (6, 0), (6, 1), (6, 4), (6, 5), (7, 0), (7, 1), (7, 5), (7, 6), (8, 0), (8, 1), (8, 2), (8, 5), (8, 7), (8, 8)]
INFO:root:Rewards:
[[280, 360, -84, -76, -4, -108, 820, -32, -36], [-52, 180, -80, -40, -64, 140, -36, -72, 20], [-36, 60, -16, -12, -40, 440, -88, -96, 0], [400, -4, 420, -36, -36, -88, -60, -100, 840], [2000, 580, 480, 460, -12, 660, -20, -44, -44], [1480, 660, -8, -36, -40000, 2240, 360, -132, -20], [3220, 3840, -4, -4, 1220, 280, -16, -128, -88], [1880, 5140, -36, -160, -60, 1760, 280, -156, -120], [1460, 2600, 560, -144, -112, 200, -60, 440, 20]]
INFO:root:Count MDP: 4
INFO:root:Ship 4 command: s actual position: Position(21, 25) new position: Position(21, 26)
INFO:root:Time: 0.0429844856262207
INFO:root:=============== TURN 039 ================
INFO:root:Terminais: [(0, 1), (0, 5), (0, 8), (1, 1), (1, 5), (2, 0), (2, 2), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 5), (4, 0), (4, 1), (4, 5), (4, 6), (5, 0), (5, 1), (5, 4), (5, 5), (6, 0), (6, 1), (6, 5), (6, 6), (7, 0), (7, 1), (7, 2), (7, 5), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 5)]
INFO:root:Rewards:
[[-52, 180, -80, -40, -64, 140, -36, -72, 20], [-36, 60, -16, -12, -40, 440, -88, -96, 0], [400, -4, 420, -36, -36, -88, -60, -100, 840], [2000, 580, 480, 460, -12, -40000, -20, -44, -44], [1480, 660, -8, -36, -28, 2240, 360, -132, -20], [3220, 3840, -4, -4, 1220, 280, -16, -128, -88], [1880, 5140, -36, -160, -60, 1760, 280, -156, -120], [1460, 2600, 560, -144, -112, 200, -60, 440, 20], [1700, 60, 240, -132, -52, 140, -80, -84, -28]]
INFO:root:Count MDP: 8
INFO:root:Ship 2 command: n actual position: Position(22, 25) new position: Position(22, 24)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 5), (4, 8), (5, 1), (5, 2), (5, 3), (6, 0), (6, 2), (6, 5), (6, 6), (7, 2), (8, 1), (8, 2), (8, 7)]
INFO:root:Rewards:
[[2760, 3300, 5700, 5400, 10060, 9180, 3360, 3600, 2900], [1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960, 6700], [1120, 3840, -40000, 1460, 1700, 2000, 2140, 1580, 4600], [1060, 140, -12, 700, 320, 380, 140, 320, 920], [860, -4, -28, -36, -8, 20, -28, -16, 320], [-120, 1600, 1860, 320, -8, -12, -88, -44, -160], [40, -84, 900, 0, -84, 620, 160, -52, -52], [-160, -32, 980, 0, -160, -156, -148, 0, -24], [-120, 280, 360, -84, -76, -4, -108, 820, -32]]
INFO:root:Count MDP: 6
INFO:root:Ship 8 command: n actual position: Position(13, 24) new position: Position(13, 23)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 2), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 1), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1800, 700, 1900, 5900, 6160, 3200, 3860, 4820, 3100], [920, -12, 860, 4340, 4820, 4660, 3980, 2320, 2140], [240, 1520, 1600, 2080, 2400, 4600, 3160, 5600, 4620], [420, 780, 1380, 1760, 6240, 6380, 3220, 2720, 8480], [-24, -36, -32, -28, 1180, 8260, 4200, 3480, 10760], [20, 400, 780, 660, 2580, 7040, 4220, 3940, 8060], [440, 1500, 940, 1880, 2400, 3040, 4160, 6460, 8280], [820, 880, 2520, 6740, 2700, 2160, 7280, 10360, 7880], [5040, 3580, 2420, 4620, 6060, 3540, 8900, 7600, 8220]]
INFO:root:Count MDP: 2
INFO:root:Ship 0 command: o actual position: Position(15, 35) new position: Position(15, 35)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 2), (5, 3), (5, 5), (5, 6), (5, 7), (5, 8), (6, 2), (6, 7), (7, 3), (7, 4), (7, 5), (8, 2), (8, 4), (8, 7), (8, 8)]
INFO:root:Rewards:
[[3260, 2280, 1800, 3040, 4180, 9380, 9300, 7220, 5480], [3600, 3660, 5500, 3520, 3920, 10100, 18960, 10200, 5760], [1080, 1660, 2760, 3300, 5700, 5400, 10060, 9180, 3360], [-84, 2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520], [820, 540, 1120, 3840, 1820, 1460, 1700, 2000, 2140], [740, 60, 1060, 140, -12, 700, 320, 380, 140], [-76, -12, 860, -4, -28, -8000, -8, 20, -28], [-148, -108, -120, 1600, 1860, 320, -8, -12, -88], [-120, -120, 40, -84, 900, 0, -84, 620, 160]]
INFO:root:Count MDP: 3
INFO:root:Ship 6 command: o actual position: Position(11, 22) new position: Position(11, 22)
INFO:root:Terminais: [(0, 0), (0, 5), (0, 8), (1, 0), (1, 4), (1, 7), (1, 8), (2, 0), (2, 4), (2, 8), (3, 1), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 4), (4, 8), (5, 0), (5, 4), (5, 5), (5, 8), (6, 0), (6, 3), (6, 4), (6, 8), (7, 0), (7, 4), (7, 5), (7, 8), (8, 0), (8, 1), (8, 4), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[360, -84, -76, -4, -108, 820, -32, -36, 560], [180, -80, -40, -64, 140, -36, -72, 20, 3340], [60, -16, -12, -40, 440, -88, -96, 0, 920], [-4, 420, -36, -36, -88, -60, -100, 840, 2760], [580, 480, 460, -12, 660, -20, -44, -44, 460], [660, -8, -8000, -28, 2240, 360, -132, -20, 1360], [3840, -4, -4, 1220, 280, -16, -128, -88, 1280], [5140, -36, -160, -60, 1760, 280, -156, -120, 1220], [2600, 560, -144, -112, 200, -60, 440, 20, 220]]
INFO:root:Count MDP: 6
INFO:root:Ship 4 command: o actual position: Position(21, 26) new position: Position(21, 26)
INFO:root:Time: 0.05522871017456055
INFO:root:=============== TURN 040 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 1), (4, 6), (5, 2), (5, 3), (5, 4), (6, 1), (6, 3), (6, 6), (6, 7), (7, 3), (8, 2), (8, 3), (8, 8)]
INFO:root:Rewards:
[[1660, 2760, 3300, 5700, 5400, 10060, 9180, 3360, 3600], [2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520, 2960], [540, 1120, 3840, -40000, 1460, 1700, 2000, 2140, 1580], [60, 1060, 140, -12, 700, 320, 380, 140, 320], [-12, 860, -4, -28, -36, -8, 20, -28, -16], [-108, -120, 1600, 1860, 320, -8, -12, -88, -44], [-120, 40, -84, 900, 0, -84, 620, 160, -52], [-156, -160, -32, 980, 0, -160, -156, -148, 0], [-80, -120, 280, 360, -84, -76, -4, -108, 820]]
INFO:root:Count MDP: 5
INFO:root:Ship 8 command: n actual position: Position(13, 23) new position: Position(13, 22)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 2), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 1), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1800, 700, 1900, 5900, 6160, 3200, 3860, 4820, 3100], [920, -12, 860, 4340, 4820, 4660, 3980, 2320, 2140], [240, 1520, 1600, 2080, 2400, 4600, 3160, 5600, 4620], [420, 780, 1380, 1760, 6240, 6380, 3220, 2720, 8480], [-24, -36, -32, -28, 680, 8260, 4200, 3480, 10760], [20, 400, 780, 660, 2580, 7040, 4220, 3940, 8060], [440, 1500, 940, 1880, 2400, 3040, 4160, 6460, 8280], [820, 880, 2520, 6740, 2700, 2160, 7280, 10360, 7880], [5040, 3580, 2420, 4620, 6060, 3540, 8900, 7600, 8220]]
INFO:root:Count MDP: 2
INFO:root:Ship 0 command: o actual position: Position(15, 35) new position: Position(15, 35)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 2), (5, 3), (5, 5), (5, 6), (5, 7), (5, 8), (6, 2), (6, 7), (7, 3), (7, 4), (7, 5), (8, 2), (8, 4), (8, 7), (8, 8)]
INFO:root:Rewards:
[[3260, 2280, 1800, 3040, 4180, 9380, 9300, 7220, 5480], [3600, 3660, 5500, 3520, 3920, 10100, 18960, 10200, 5760], [1080, 1660, 2760, 3300, 5700, 5400, 10060, 9180, 3360], [-84, 2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520], [820, 540, 1120, 3840, 1160, 1460, 1700, 2000, 2140], [740, 60, 1060, 140, -12, 700, 320, 380, 140], [-76, -12, 860, -4, -8000, -36, -8, 20, -28], [-148, -108, -120, 1600, 1860, 320, -8, -12, -88], [-120, -120, 40, -84, 900, 0, -84, 620, 160]]
INFO:root:Count MDP: 3
INFO:root:Ship 6 command: o actual position: Position(11, 22) new position: Position(11, 22)
INFO:root:Terminais: [(0, 0), (0, 5), (0, 8), (1, 0), (1, 4), (1, 7), (1, 8), (2, 0), (2, 4), (2, 8), (3, 1), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 4), (4, 8), (5, 0), (5, 4), (5, 5), (5, 8), (6, 0), (6, 3), (6, 4), (6, 8), (7, 0), (7, 4), (7, 5), (7, 8), (8, 0), (8, 1), (8, 4), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[360, -84, -76, -4, -108, 820, -32, -36, 560], [180, -80, -40, -64, 140, -36, -72, 20, 3340], [60, -16, -12, -40, 440, -88, -96, 0, 920], [-4, 420, -36, -36, -88, -60, -100, 840, 2760], [580, 480, 460, -12, 280, -20, -44, -44, 460], [660, -8, -8000, -28, 2240, 360, -132, -20, 1360], [3840, -4, -4, 1220, 280, -16, -128, -88, 1280], [5140, -36, -160, -60, 1760, 280, -156, -120, 1220], [2600, 560, -144, -112, 200, -60, 440, 20, 220]]
INFO:root:Count MDP: 7
INFO:root:Ship 4 command: o actual position: Position(21, 26) new position: Position(21, 26)
INFO:root:Terminais: [(0, 2), (0, 6), (1, 0), (1, 2), (1, 6), (2, 0), (2, 1), (2, 3), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 6), (4, 0), (4, 1), (4, 2), (4, 6), (4, 7), (5, 0), (5, 1), (5, 2), (5, 5), (5, 6), (6, 0), (6, 1), (6, 2), (6, 6), (6, 7), (7, 0), (7, 1), (7, 2), (7, 3), (7, 6), (7, 8), (8, 0), (8, 1), (8, 2), (8, 3), (8, 6)]
INFO:root:Rewards:
[[-120, -52, 180, -80, -40, -64, 140, -36, -72], [2180, -36, 60, -16, -12, -40, 440, -88, -96], [1660, 400, -4, 420, -36, -36, -88, -60, -100], [800, 2000, 580, 480, 460, -12, -40000, -20, -44], [1100, 1480, 660, -8, -36, -28, 2240, 360, -132], [2400, 3220, 3840, -4, -4, 1220, 280, -16, -128], [4160, 1880, 5140, -36, -160, -60, 1760, 280, -156], [2120, 1460, 2600, 560, -144, -112, 200, -60, 440], [860, 1700, 60, 240, -132, -52, 140, -80, -84]]
INFO:root:Count MDP: 7
INFO:root:Ship 2 command: e actual position: Position(22, 24) new position: Position(23, 24)
INFO:root:Time: 0.05569720268249512
INFO:root:=============== TURN 041 ================
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 5), (3, 6), (3, 7), (3, 8), (4, 2), (4, 7), (5, 3), (5, 4), (5, 5), (6, 2), (6, 4), (6, 7), (6, 8), (7, 4), (8, 3), (8, 4)]
INFO:root:Rewards:
[[1080, 1660, 2760, 3300, 5700, 5400, 10060, 9180, 3360], [-84, 2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520], [820, 540, 1120, 3840, -40000, 1460, 1700, 2000, 2140], [740, 60, 1060, 140, -12, 700, 320, 380, 140], [-76, -12, 860, -4, -28, -36, -8, 20, -28], [-148, -108, -120, 1600, 1860, 320, -8, -12, -88], [-120, -120, 40, -84, 900, 0, -84, 620, 160], [-160, -156, -160, -32, 980, 0, -160, -156, -148], [-4, -80, -120, 280, 360, -84, -76, -4, -108]]
INFO:root:Count MDP: 5
INFO:root:Ship 8 command: e actual position: Position(13, 22) new position: Position(14, 22)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 2), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 1), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1800, 700, 1900, 5900, 6160, 3200, 3860, 4820, 3100], [920, -12, 860, 4340, 4820, 4660, 3980, 2320, 2140], [240, 1520, 1600, 2080, 2400, 4600, 3160, 5600, 4620], [420, 780, 1380, 1760, 6240, 6380, 3220, 2720, 8480], [-24, -36, -32, -28, 300, 8260, 4200, 3480, 10760], [20, 400, 780, 660, 2580, 7040, 4220, 3940, 8060], [440, 1500, 940, 1880, 2400, 3040, 4160, 6460, 8280], [820, 880, 2520, 6740, 2700, 2160, 7280, 10360, 7880], [5040, 3580, 2420, 4620, 6060, 3540, 8900, 7600, 8220]]
INFO:root:Count MDP: 2
INFO:root:Ship 0 command: o actual position: Position(15, 35) new position: Position(15, 35)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 2), (5, 3), (5, 5), (5, 6), (5, 7), (5, 8), (6, 2), (6, 7), (7, 3), (7, 4), (7, 5), (8, 2), (8, 4), (8, 7), (8, 8)]
INFO:root:Rewards:
[[3260, 2280, 1800, 3040, 4180, 9380, 9300, 7220, 5480], [3600, 3660, 5500, 3520, 3920, 10100, 18960, 10200, 5760], [1080, 1660, 2760, 3300, 5700, 5400, 10060, 9180, 3360], [-84, 2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520], [820, 540, 1120, 3840, 660, 1460, 1700, 2000, 2140], [740, 60, 1060, 140, -12, 700, 320, 380, 140], [-76, -12, 860, -4, -28, -36, -8, 20, -28], [-148, -108, -120, 1600, -40000, 320, -8, -12, -88], [-120, -120, 40, -84, 900, 0, -84, 620, 160]]
INFO:root:Count MDP: 4
INFO:root:Ship 6 command: o actual position: Position(11, 22) new position: Position(11, 22)
INFO:root:Terminais: [(0, 0), (0, 5), (0, 8), (1, 0), (1, 4), (1, 7), (1, 8), (2, 0), (2, 4), (2, 8), (3, 1), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 8), (5, 0), (5, 4), (5, 5), (5, 8), (6, 0), (6, 3), (6, 4), (6, 8), (7, 0), (7, 4), (7, 5), (7, 8), (8, 0), (8, 1), (8, 4), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[360, -84, -76, -4, -108, 820, -32, -36, 560], [180, -80, -40, -64, 140, -36, -72, 20, 3340], [60, -16, -12, -40, 440, -88, -96, 0, 920], [-4, 420, -36, -36, -88, -60, -100, 840, 2760], [580, 480, 460, -12, 0, -20, -44, -44, 460], [660, -8, -36, -28, 2240, 360, -132, -20, 1360], [3840, -4, -8000, 1220, 280, -16, -128, -88, 1280], [5140, -36, -160, -60, 1760, 280, -156, -120, 1220], [2600, 560, -144, -112, 200, -60, 440, 20, 220]]
INFO:root:Count MDP: 7
INFO:root:Ship 4 command: n actual position: Position(21, 26) new position: Position(21, 25)
INFO:root:Terminais: [(0, 0), (0, 2), (0, 6), (1, 0), (1, 1), (1, 3), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (3, 0), (3, 1), (3, 2), (3, 6), (3, 7), (4, 0), (4, 1), (4, 2), (4, 5), (4, 6), (5, 0), (5, 1), (5, 2), (5, 6), (5, 7), (6, 0), (6, 1), (6, 2), (6, 3), (6, 6), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 6), (8, 0), (8, 2), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[2180, -36, 60, -16, -12, -40, 440, -88, -96], [1660, 400, -4, 420, -36, -36, -88, -60, -100], [800, 2000, 580, 480, 460, -8000, 0, -20, -44], [1100, 1480, 660, -8, -36, -28, 2240, 360, -132], [2400, 3220, 3840, -4, -4, 1220, 280, -16, -128], [4160, 1880, 5140, -36, -160, -60, 1760, 280, -156], [2120, 1460, 2600, 560, -144, -112, 200, -60, 440], [860, 1700, 60, 240, -132, -52, 140, -80, -84], [140, -8, 1480, -124, -156, -104, 1860, 2100, 340]]
INFO:root:Count MDP: 5
INFO:root:Ship 2 command: n actual position: Position(23, 24) new position: Position(23, 23)
INFO:root:Time: 0.051788330078125
INFO:root:=============== TURN 042 ================
INFO:root:Terminais: [(0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 5), (2, 6), (2, 7), (2, 8), (3, 2), (3, 7), (4, 3), (4, 4), (4, 5), (5, 2), (5, 4), (5, 7), (5, 8), (6, 4), (7, 3), (7, 4), (8, 1), (8, 4), (8, 8)]
INFO:root:Rewards:
[[-84, 2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520], [820, 540, 1120, 3840, -40000, 1460, 1700, 2000, 2140], [740, 60, 1060, 140, -12, 700, 320, 380, 140], [-76, -12, 860, -4, -28, -36, -8, 20, -28], [-148, -108, -120, 1600, 1860, 320, -8, -12, -88], [-120, -120, 40, -84, 900, 0, -84, 620, 160], [-160, -156, -160, -32, 980, 0, -160, -156, -148], [-4, -80, -120, 280, 360, -84, -76, -4, -108], [-100, 640, -120, -52, 180, -80, -40, -64, 140]]
INFO:root:Count MDP: 5
INFO:root:Ship 8 command: o actual position: Position(14, 22) new position: Position(14, 22)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 0), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 2), (5, 3), (5, 4), (5, 5), (5, 6), (5, 7), (5, 8), (6, 0), (6, 1), (6, 2), (6, 3), (6, 4), (6, 5), (6, 6), (6, 7), (6, 8), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 5), (7, 6), (7, 7), (7, 8), (8, 0), (8, 1), (8, 2), (8, 3), (8, 4), (8, 5), (8, 6), (8, 7), (8, 8)]
INFO:root:Rewards:
[[1800, 700, 1900, 5900, 6160, 3200, 3860, 4820, 3100], [920, -12, 860, 4340, 4820, 4660, 3980, 2320, 2140], [240, 1520, 1600, 2080, 2400, 4600, 3160, 5600, 4620], [420, 780, 1380, 1760, 6240, 6380, 3220, 2720, 8480], [-24, -36, -32, -28, 20, 8260, 4200, 3480, 10760], [20, 400, 780, 660, 2580, 7040, 4220, 3940, 8060], [440, 1500, 940, 1880, 2400, 3040, 4160, 6460, 8280], [820, 880, 2520, 6740, 2700, 2160, 7280, 10360, 7880], [5040, 3580, 2420, 4620, 6060, 3540, 8900, 7600, 8220]]
INFO:root:Count MDP: 2
INFO:root:Ship 0 command: o actual position: Position(15, 35) new position: Position(15, 35)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 2), (0, 3), (0, 4), (0, 5), (0, 6), (0, 7), (0, 8), (1, 0), (1, 1), (1, 2), (1, 3), (1, 4), (1, 5), (1, 6), (1, 7), (1, 8), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (2, 6), (2, 7), (2, 8), (3, 1), (3, 2), (3, 3), (3, 4), (3, 5), (3, 6), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 4), (4, 5), (4, 6), (4, 7), (4, 8), (5, 0), (5, 1), (5, 2), (5, 3), (5, 5), (5, 6), (5, 7), (5, 8), (6, 2), (6, 7), (7, 3), (7, 4), (7, 5), (8, 2), (8, 4), (8, 7), (8, 8)]
INFO:root:Rewards:
[[3260, 2280, 1800, 3040, 4180, 9380, 9300, 7220, 5480], [3600, 3660, 5500, 3520, 3920, 10100, 18960, 10200, 5760], [1080, 1660, 2760, 3300, 5700, 5400, 10060, 9180, 3360], [-84, 2400, 1580, 1880, 5560, 3600, 5340, 2780, 2520], [820, 540, 1120, 3840, 280, 1460, 1700, 2000, 2140], [740, 60, 1060, 140, -12, 700, 320, 380, 140], [-76, -12, 860, -4, -28, -36, -8, 20, -28], [-148, -108, -120, 1600, -40000, 320, -8, -12, -88], [-120, -120, 40, -84, 900, 0, -84, 620, 160]]
INFO:root:Count MDP: 4
INFO:root:Ship 6 command: o actual position: Position(11, 22) new position: Position(11, 22)
INFO:root:Terminais: [(0, 0), (0, 1), (0, 3), (0, 7), (1, 0), (1, 1), (1, 2), (1, 4), (2, 0), (2, 1), (2, 2), (2, 3), (2, 4), (2, 5), (3, 0), (3, 1), (3, 2), (3, 3), (3, 7), (3, 8), (4, 0), (4, 1), (4, 2), (4, 3), (4, 6), (4, 7), (5, 0), (5, 1), (5, 2), (5, 3), (5, 7), (5, 8), (6, 0), (6, 1), (6, 2), (6, 3), (6, 4), (6, 7), (7, 0), (7, 1), (7, 2), (7, 3), (7, 4), (7, 7), (8, 0), (8, 1), (8, 3), (8, 7), (8, 8)]