`brtdp_example.py` calls `run_sample_trial(self, verbose=True)` in `BoundedRTDPClass.py`,
and the `while not state.is_terminal():` loop there appears to be stuck in an infinite loop; the same line is printed repeatedly:
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
`brtdp_example.py` calls `run_sample_trial(self, verbose=True)` in `BoundedRTDPClass.py`,
and the `while not state.is_terminal():` loop there appears to be stuck in an infinite loop; the same line is printed repeatedly:
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627
s: (1,1) Action: left Gap: 99.07540345871926 MaxDiff: 9.908648275251627