game: coop_box_pushing

GameType.chance_mode = ChanceMode.EXPLICIT_STOCHASTIC
GameType.dynamics = Dynamics.SIMULTANEOUS
GameType.information = Information.IMPERFECT_INFORMATION
GameType.long_name = "Cooperative Box Pushing"
GameType.max_num_players = 2
GameType.min_num_players = 2
GameType.parameter_specification = ["fully_observable", "horizon"]
GameType.provides_information_state_string = False
GameType.provides_information_state_tensor = False
GameType.provides_observation_string = True
GameType.provides_observation_tensor = True
GameType.provides_factored_observation_string = False
GameType.reward_model = RewardModel.REWARDS
GameType.short_name = "coop_box_pushing"
GameType.utility = Utility.IDENTICAL

NumDistinctActions() = 4
PolicyTensorShape() = [4]
MaxChanceOutcomes() = 4
GetParameters() = {fully_observable=False,horizon=100}
NumPlayers() = 2
MinUtility() = -1020.0
MaxUtility() = 1.998e+04
UtilitySum() = None
ObservationTensorShape() = [5]
ObservationTensorLayout() = TensorLayout.CHW
ObservationTensorSize() = 5
MaxGameLength() = 100
ToString() = "coop_box_pushing()"

# State 0
# Total moves: 0
# Most recent reward: 0
# Total rewards: 0
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>....<.
# ........
IsTerminal() = False
History() = []
HistoryString() = ""
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [0.0, 0.0]
Returns() = [0.0, 0.0]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "move forward"]
actions: [3, 2]

# State 1
# Total moves: 0
# Most recent reward: 0
# Total rewards: 0
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>....<.
# ........
IsTerminal() = False
History() = [3, 2]
HistoryString() = "3, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 2
# Total moves: 0
# Most recent reward: 0
# Total rewards: 0
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>....<.
# ........
IsTerminal() = False
History() = [3, 2, 1]
HistoryString() = "3, 2, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 3
# Total moves: 0
# Most recent reward: 0
# Total rewards: 0
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>....<.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0]
HistoryString() = "3, 2, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 4
# Total moves: 1
# Most recent reward: -0.1
# Total rewards: -0.1
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...<..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2]
HistoryString() = "3, 2, 1, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-0.1, -0.1]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "turn left"]
actions: [0, 0]

# State 5
# Total moves: 1
# Most recent reward: -0.1
# Total rewards: -0.1
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...<..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 6
# Total moves: 1
# Most recent reward: -0.1
# Total rewards: -0.1
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...<..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 7
# Total moves: 1
# Most recent reward: -0.1
# Total rewards: -0.1
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...<..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 8
# Total moves: 2
# Most recent reward: -0.1
# Total rewards: -0.2
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-0.2, -0.2]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "turn right"]
actions: [0, 1]

# State 9
# Total moves: 2
# Most recent reward: -0.1
# Total rewards: -0.2
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 10
# Total moves: 2
# Most recent reward: -0.1
# Total rewards: -0.2
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 11
# Total moves: 2
# Most recent reward: -0.1
# Total rewards: -0.2
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 12
# Total moves: 3
# Most recent reward: -0.1
# Total rewards: -0.3
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-0.30000000000000004, -0.30000000000000004]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "move forward"]
actions: [0, 2]

# State 13
# Total moves: 3
# Most recent reward: -0.1
# Total rewards: -0.3
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 14
# Total moves: 3
# Most recent reward: -0.1
# Total rewards: -0.3
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 15
# Total moves: 3
# Most recent reward: -0.1
# Total rewards: -0.3
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 16
# Total moves: 4
# Most recent reward: -0.1
# Total rewards: -0.4
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-0.4, -0.4]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "turn left"]
actions: [0, 0]

# State 17
# Total moves: 4
# Most recent reward: -0.1
# Total rewards: -0.4
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 18
# Total moves: 4
# Most recent reward: -0.1
# Total rewards: -0.4
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 19
# Total moves: 4
# Most recent reward: -0.1
# Total rewards: -0.4
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 20
# Total moves: 5
# Most recent reward: -0.1
# Total rewards: -0.5
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...>..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-0.5, -0.5]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "turn right"]
actions: [3, 1]

# State 21
# Total moves: 5
# Most recent reward: -0.1
# Total rewards: -0.5
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...>..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 22
# Total moves: 5
# Most recent reward: -0.1
# Total rewards: -0.5
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...>..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 23
# Total moves: 5
# Most recent reward: -0.1
# Total rewards: -0.5
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...>..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 24
# Total moves: 6
# Most recent reward: -0.1
# Total rewards: -0.6
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-0.6, -0.6]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "turn left"]
actions: [2, 0]

# State 25
# Total moves: 6
# Most recent reward: -0.1
# Total rewards: -0.6
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 26
# Total moves: 6
# Most recent reward: -0.1
# Total rewards: -0.6
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 27
# Total moves: 6
# Most recent reward: -0.1
# Total rewards: -0.6
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 28
# Total moves: 7
# Most recent reward: -0.1
# Total rewards: -0.7
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-0.7, -0.7]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "turn left"]
actions: [0, 0]

# State 29
# Total moves: 7
# Most recent reward: -0.1
# Total rewards: -0.7
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 30
# Total moves: 7
# Most recent reward: -0.1
# Total rewards: -0.7
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 31
# Total moves: 7
# Most recent reward: -0.1
# Total rewards: -0.7
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 32
# Total moves: 8
# Most recent reward: -0.1
# Total rewards: -0.8
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-0.7999999999999999, -0.7999999999999999]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "turn right"]
actions: [3, 1]

# State 33
# Total moves: 8
# Most recent reward: -0.1
# Total rewards: -0.8
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 34
# Total moves: 8
# Most recent reward: -0.1
# Total rewards: -0.8
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 35
# Total moves: 8
# Most recent reward: -0.1
# Total rewards: -0.8
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 36
# Total moves: 9
# Most recent reward: -0.1
# Total rewards: -0.9
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-0.8999999999999999, -0.8999999999999999]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "turn right"]
actions: [2, 1]

# State 37
# Total moves: 9
# Most recent reward: -0.1
# Total rewards: -0.9
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 38
# Total moves: 9
# Most recent reward: -0.1
# Total rewards: -0.9
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 39
# Total moves: 9
# Most recent reward: -0.1
# Total rewards: -0.9
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 40
# Total moves: 10
# Most recent reward: -0.1
# Total rewards: -1
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-0.9999999999999999, -0.9999999999999999]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "turn left"]
actions: [0, 0]

# State 41
# Total moves: 10
# Most recent reward: -0.1
# Total rewards: -1
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 42
# Total moves: 10
# Most recent reward: -0.1
# Total rewards: -1
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 43
# Total moves: 10
# Most recent reward: -0.1
# Total rewards: -1
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 44
# Total moves: 11
# Most recent reward: -0.1
# Total rewards: -1.1
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .^...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-1.0999999999999999, -1.0999999999999999]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn right", "move forward"]
actions: [1, 2]

# State 45
# Total moves: 11
# Most recent reward: -0.1
# Total rewards: -1.1
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .^...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 46
# Total moves: 11
# Most recent reward: -0.1
# Total rewards: -1.1
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .^...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 47
# Total moves: 11
# Most recent reward: -0.1
# Total rewards: -1.1
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .^...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 48
# Total moves: 12
# Most recent reward: -0.1
# Total rewards: -1.2
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-1.2, -1.2]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "move forward"]
actions: [3, 2]

# State 49
# Total moves: 12
# Most recent reward: -0.1
# Total rewards: -1.2
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 50
# Total moves: 12
# Most recent reward: -0.1
# Total rewards: -1.2
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 51
# Total moves: 12
# Most recent reward: -0.1
# Total rewards: -1.2
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>...v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 52
# Total moves: 13
# Most recent reward: -0.1
# Total rewards: -1.3
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>......
# .....v..
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-1.3, -1.3]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "stay"]
actions: [2, 3]

# State 53
# Total moves: 13
# Most recent reward: -0.1
# Total rewards: -1.3
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>......
# .....v..
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 54
# Total moves: 13
# Most recent reward: -0.1
# Total rewards: -1.3
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>......
# .....v..
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 55
# Total moves: 13
# Most recent reward: -0.1
# Total rewards: -1.3
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>......
# .....v..
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 56
# Total moves: 14
# Most recent reward: -0.1
# Total rewards: -1.4
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>......
# .....v..
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-1.4000000000000001, -1.4000000000000001]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "stay"]
actions: [2, 3]

# State 57
# Total moves: 14
# Most recent reward: -0.1
# Total rewards: -1.4
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>......
# .....v..
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 58
# Total moves: 14
# Most recent reward: -0.1
# Total rewards: -1.4
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>......
# .....v..
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 59
# Total moves: 14
# Most recent reward: -0.1
# Total rewards: -1.4
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .>......
# .....v..
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 60
# Total moves: 15
# Most recent reward: -0.1
# Total rewards: -1.5
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ..>.....
# .....v..
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-1.5000000000000002, -1.5000000000000002]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "move forward"]
actions: [2, 2]

# State 61
# Total moves: 15
# Most recent reward: -0.1
# Total rewards: -1.5
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ..>.....
# .....v..
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 62
# Total moves: 15
# Most recent reward: -0.1
# Total rewards: -1.5
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ..>.....
# .....v..
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 63
# Total moves: 15
# Most recent reward: -0.1
# Total rewards: -1.5
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ..>.....
# .....v..
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 64
# Total moves: 16
# Most recent reward: -0.1
# Total rewards: -1.6
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ...>....
# .....v..
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-1.6000000000000003, -1.6000000000000003]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "turn left"]
actions: [2, 0]

# State 65
# Total moves: 16
# Most recent reward: -0.1
# Total rewards: -1.6
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ...>....
# .....v..
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 66
# Total moves: 16
# Most recent reward: -0.1
# Total rewards: -1.6
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ...>....
# .....v..
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 67
# Total moves: 16
# Most recent reward: -0.1
# Total rewards: -1.6
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ...>....
# .....v..
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 68
# Total moves: 17
# Most recent reward: -0.1
# Total rewards: -1.7
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# .....>..
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-1.7000000000000004, -1.7000000000000004]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "move forward"]
actions: [0, 2]

# State 69
# Total moves: 17
# Most recent reward: -0.1
# Total rewards: -1.7
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# .....>..
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 70
# Total moves: 17
# Most recent reward: -0.1
# Total rewards: -1.7
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# .....>..
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 71
# Total moves: 17
# Most recent reward: -0.1
# Total rewards: -1.7
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# .....>..
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 72
# Total moves: 18
# Most recent reward: -0.1
# Total rewards: -1.8
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# ......>.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-1.8000000000000005, -1.8000000000000005]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn right", "turn right"]
actions: [1, 1]

# State 73
# Total moves: 18
# Most recent reward: -0.1
# Total rewards: -1.8
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# ......>.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 74
# Total moves: 18
# Most recent reward: -0.1
# Total rewards: -1.8
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# ......>.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 75
# Total moves: 18
# Most recent reward: -0.1
# Total rewards: -1.8
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# ......>.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 76
# Total moves: 19
# Most recent reward: -0.1
# Total rewards: -1.9
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# ......v.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-1.9000000000000006, -1.9000000000000006]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "turn left"]
actions: [3, 0]

# State 77
# Total moves: 19
# Most recent reward: -0.1
# Total rewards: -1.9
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# ......v.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 78
# Total moves: 19
# Most recent reward: -0.1
# Total rewards: -1.9
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# ......v.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 79
# Total moves: 19
# Most recent reward: -0.1
# Total rewards: -1.9
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# ......v.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 80
# Total moves: 20
# Most recent reward: -0.1
# Total rewards: -2
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# ......v.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-2.0000000000000004, -2.0000000000000004]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "turn left"]
actions: [0, 0]

# State 81
# Total moves: 20
# Most recent reward: -0.1
# Total rewards: -2
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# ......v.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 82
# Total moves: 20
# Most recent reward: -0.1
# Total rewards: -2
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# ......v.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 83
# Total moves: 20
# Most recent reward: -0.1
# Total rewards: -2
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# ......v.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 84
# Total moves: 21
# Most recent reward: -0.1
# Total rewards: -2.1
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....^...
# ......>.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-2.1000000000000005, -2.1000000000000005]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "turn left"]
actions: [3, 0]

# State 85
# Total moves: 21
# Most recent reward: -0.1
# Total rewards: -2.1
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....^...
# ......>.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 86
# Total moves: 21
# Most recent reward: -0.1
# Total rewards: -2.1
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....^...
# ......>.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 87
# Total moves: 21
# Most recent reward: -0.1
# Total rewards: -2.1
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....^...
# ......>.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 88
# Total moves: 22
# Most recent reward: -0.1
# Total rewards: -2.2
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....^...
# ......>.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-2.2000000000000006, -2.2000000000000006]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "turn left"]
actions: [3, 0]

# State 89
# Total moves: 22
# Most recent reward: -0.1
# Total rewards: -2.2
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....^...
# ......>.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 90
# Total moves: 22
# Most recent reward: -0.1
# Total rewards: -2.2
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....^...
# ......>.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 91
# Total moves: 22
# Most recent reward: -0.1
# Total rewards: -2.2
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....^...
# ......>.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 92
# Total moves: 23
# Most recent reward: -0.1
# Total rewards: -2.3
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....^...
# ......^.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-2.3000000000000007, -2.3000000000000007]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn right", "stay"]
actions: [1, 3]

# State 93
# Total moves: 23
# Most recent reward: -0.1
# Total rewards: -2.3
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....^...
# ......^.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 94
# Total moves: 23
# Most recent reward: -0.1
# Total rewards: -2.3
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....^...
# ......^.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 95
# Total moves: 23
# Most recent reward: -0.1
# Total rewards: -2.3
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....^...
# ......^.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 96
# Total moves: 24
# Most recent reward: -0.1
# Total rewards: -2.4
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# ......^.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-2.400000000000001, -2.400000000000001]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "turn left"]
actions: [0, 0]

# State 97
# Total moves: 24
# Most recent reward: -0.1
# Total rewards: -2.4
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# ......^.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 98
# Total moves: 24
# Most recent reward: -0.1
# Total rewards: -2.4
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# ......^.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 99
# Total moves: 24
# Most recent reward: -0.1
# Total rewards: -2.4
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# ......^.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 100
# Total moves: 25
# Most recent reward: -0.1
# Total rewards: -2.5
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# ......^.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-2.500000000000001, -2.500000000000001]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "move forward"]
actions: [3, 2]

# State 101
# Total moves: 25
# Most recent reward: -0.1
# Total rewards: -2.5
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# ......^.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 102
# Total moves: 25
# Most recent reward: -0.1
# Total rewards: -2.5
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# ......^.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 103
# Total moves: 25
# Most recent reward: -0.1
# Total rewards: -2.5
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>...
# ......^.
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 104
# Total moves: 26
# Most recent reward: -0.1
# Total rewards: -2.6
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>.^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-2.600000000000001, -2.600000000000001]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "turn right"]
actions: [2, 1]

# State 105
# Total moves: 26
# Most recent reward: -0.1
# Total rewards: -2.6
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>.^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 106
# Total moves: 26
# Most recent reward: -0.1
# Total rewards: -2.6
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>.^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 107
# Total moves: 26
# Most recent reward: -0.1
# Total rewards: -2.6
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# ....>.^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 108
# Total moves: 27
# Most recent reward: -0.1
# Total rewards: -2.7
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....>^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "other agent"
ObservationString(1) = "field"
ObservationTensor(0): ◯◯◉◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-2.700000000000001, -2.700000000000001]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "stay"]
actions: [0, 3]

# State 109
# Total moves: 27
# Most recent reward: -0.1
# Total rewards: -2.7
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....>^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "other agent"
ObservationString(1) = "field"
ObservationTensor(0): ◯◯◉◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 110
# Total moves: 27
# Most recent reward: -0.1
# Total rewards: -2.7
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....>^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "other agent"
ObservationString(1) = "field"
ObservationTensor(0): ◯◯◉◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 111
# Total moves: 27
# Most recent reward: -0.1
# Total rewards: -2.7
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....>^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "other agent"
ObservationString(1) = "field"
ObservationTensor(0): ◯◯◉◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 112
# Total moves: 28
# Most recent reward: -0.1
# Total rewards: -2.8
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....>^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "other agent"
ObservationString(1) = "field"
ObservationTensor(0): ◯◯◉◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-2.800000000000001, -2.800000000000001]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "turn left"]
actions: [3, 0]

# State 113
# Total moves: 28
# Most recent reward: -0.1
# Total rewards: -2.8
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....>^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "other agent"
ObservationString(1) = "field"
ObservationTensor(0): ◯◯◉◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 114
# Total moves: 28
# Most recent reward: -0.1
# Total rewards: -2.8
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....>^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "other agent"
ObservationString(1) = "field"
ObservationTensor(0): ◯◯◉◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 115
# Total moves: 28
# Most recent reward: -0.1
# Total rewards: -2.8
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....>^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "other agent"
ObservationString(1) = "field"
ObservationTensor(0): ◯◯◉◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 116
# Total moves: 29
# Most recent reward: -0.1
# Total rewards: -2.9
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....>^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "other agent"
ObservationString(1) = "field"
ObservationTensor(0): ◯◯◉◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-2.9000000000000012, -2.9000000000000012]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "stay"]
actions: [0, 3]

# State 117
# Total moves: 29
# Most recent reward: -0.1
# Total rewards: -2.9
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....>^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "other agent"
ObservationString(1) = "field"
ObservationTensor(0): ◯◯◉◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 118
# Total moves: 29
# Most recent reward: -0.1
# Total rewards: -2.9
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....>^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "other agent"
ObservationString(1) = "field"
ObservationTensor(0): ◯◯◉◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 119
# Total moves: 29
# Most recent reward: -0.1
# Total rewards: -2.9
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....>^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "other agent"
ObservationString(1) = "field"
ObservationTensor(0): ◯◯◉◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 120
# Total moves: 30
# Most recent reward: -0.1
# Total rewards: -3
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....^^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-3.0000000000000013, -3.0000000000000013]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "move forward"]
actions: [2, 2]

# State 121
# Total moves: 30
# Most recent reward: -0.1
# Total rewards: -3
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....^^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 122
# Total moves: 30
# Most recent reward: -0.1
# Total rewards: -3
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....^^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 123
# Total moves: 30
# Most recent reward: -0.1
# Total rewards: -3
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....^^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 124
# Total moves: 31
# Most recent reward: -0.1
# Total rewards: -3.1
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....^^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-3.1000000000000014, -3.1000000000000014]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "turn left"]
actions: [0, 0]

# State 125
# Total moves: 31
# Most recent reward: -0.1
# Total rewards: -3.1
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....^^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 126
# Total moves: 31
# Most recent reward: -0.1
# Total rewards: -3.1
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....^^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 127
# Total moves: 31
# Most recent reward: -0.1
# Total rewards: -3.1
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....^^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 128
# Total moves: 32
# Most recent reward: -0.1
# Total rewards: -3.2
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....<<.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "other agent"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◉◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-3.2000000000000015, -3.2000000000000015]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn right", "turn right"]
actions: [1, 1]

# State 129
# Total moves: 32
# Most recent reward: -0.1
# Total rewards: -3.2
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....<<.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "other agent"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◉◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 130
# Total moves: 32
# Most recent reward: -0.1
# Total rewards: -3.2
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....<<.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "other agent"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◉◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 131
# Total moves: 32
# Most recent reward: -0.1
# Total rewards: -3.2
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....<<.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "other agent"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◉◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 132
# Total moves: 33
# Most recent reward: -0.1
# Total rewards: -3.3
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....<^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-3.3000000000000016, -3.3000000000000016]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "turn right"]
actions: [3, 1]

# State 133
# Total moves: 33
# Most recent reward: -0.1
# Total rewards: -3.3
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....<^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 134
# Total moves: 33
# Most recent reward: -0.1
# Total rewards: -3.3
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....<^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 135
# Total moves: 33
# Most recent reward: -0.1
# Total rewards: -3.3
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....<^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 136
# Total moves: 34
# Most recent reward: -0.1
# Total rewards: -3.4
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....<>.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-3.4000000000000017, -3.4000000000000017]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn right", "turn left"]
actions: [1, 0]

# State 137
# Total moves: 34
# Most recent reward: -0.1
# Total rewards: -3.4
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....<>.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 138
# Total moves: 34
# Most recent reward: -0.1
# Total rewards: -3.4
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....<>.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 139
# Total moves: 34
# Most recent reward: -0.1
# Total rewards: -3.4
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....<>.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 140
# Total moves: 35
# Most recent reward: -0.1
# Total rewards: -3.5
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....<^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-3.5000000000000018, -3.5000000000000018]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn right", "move forward"]
actions: [1, 2]

# State 141
# Total moves: 35
# Most recent reward: -0.1
# Total rewards: -3.5
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....<^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 142
# Total moves: 35
# Most recent reward: -0.1
# Total rewards: -3.5
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....<^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 143
# Total moves: 35
# Most recent reward: -0.1
# Total rewards: -3.5
# ........
# ........
# ........
# .b.BB.b.
# ........
# ........
# .....<^.
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 144
# Total moves: 36
# Most recent reward: -0.1
# Total rewards: -3.6
# ........
# ........
# ........
# .b.BB.b.
# ........
# ......^.
# .....^..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-3.600000000000002, -3.600000000000002]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn right", "turn right"]
actions: [1, 1]

# State 145
# Total moves: 36
# Most recent reward: -0.1
# Total rewards: -3.6
# ........
# ........
# ........
# .b.BB.b.
# ........
# ......^.
# .....^..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 146
# Total moves: 36
# Most recent reward: -0.1
# Total rewards: -3.6
# ........
# ........
# ........
# .b.BB.b.
# ........
# ......^.
# .....^..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 147
# Total moves: 36
# Most recent reward: -0.1
# Total rewards: -3.6
# ........
# ........
# ........
# .b.BB.b.
# ........
# ......^.
# .....^..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 148
# Total moves: 37
# Most recent reward: -0.1
# Total rewards: -3.7
# ........
# ........
# ........
# .b.BB.b.
# ........
# ......>.
# .....>..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-3.700000000000002, -3.700000000000002]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "turn left"]
actions: [0, 0]

# State 149
# Total moves: 37
# Most recent reward: -0.1
# Total rewards: -3.7
# ........
# ........
# ........
# .b.BB.b.
# ........
# ......>.
# .....>..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 150
# Total moves: 37
# Most recent reward: -0.1
# Total rewards: -3.7
# ........
# ........
# ........
# .b.BB.b.
# ........
# ......>.
# .....>..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 151
# Total moves: 37
# Most recent reward: -0.1
# Total rewards: -3.7
# ........
# ........
# ........
# .b.BB.b.
# ........
# ......>.
# .....>..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 152
# Total moves: 38
# Most recent reward: -0.1
# Total rewards: -3.8
# ........
# ........
# ........
# .b.BB.b.
# ........
# ......^.
# .....>..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-3.800000000000002, -3.800000000000002]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "turn right"]
actions: [2, 1]

# State 153
# Total moves: 38
# Most recent reward: -0.1
# Total rewards: -3.8
# ........
# ........
# ........
# .b.BB.b.
# ........
# ......^.
# .....>..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 154
# Total moves: 38
# Most recent reward: -0.1
# Total rewards: -3.8
# ........
# ........
# ........
# .b.BB.b.
# ........
# ......^.
# .....>..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 155
# Total moves: 38
# Most recent reward: -0.1
# Total rewards: -3.8
# ........
# ........
# ........
# .b.BB.b.
# ........
# ......^.
# .....>..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 156
# Total moves: 39
# Most recent reward: -0.1
# Total rewards: -3.9
# ........
# ........
# ........
# .b.BB.b.
# ........
# ......^.
# .....>..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-3.900000000000002, -3.900000000000002]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn right", "move forward"]
actions: [1, 2]

# State 157
# Total moves: 39
# Most recent reward: -0.1
# Total rewards: -3.9
# ........
# ........
# ........
# .b.BB.b.
# ........
# ......^.
# .....>..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 158
# Total moves: 39
# Most recent reward: -0.1
# Total rewards: -3.9
# ........
# ........
# ........
# .b.BB.b.
# ........
# ......^.
# .....>..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 159
# Total moves: 39
# Most recent reward: -0.1
# Total rewards: -3.9
# ........
# ........
# ........
# .b.BB.b.
# ........
# ......^.
# .....>..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 160
# Total moves: 40
# Most recent reward: -0.1
# Total rewards: -4
# ........
# ........
# ........
# .b.BB.b.
# ......^.
# ........
# .....v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-4.000000000000002, -4.000000000000002]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn right", "move forward"]
actions: [1, 2]

# State 161
# Total moves: 40
# Most recent reward: -0.1
# Total rewards: -4
# ........
# ........
# ........
# .b.BB.b.
# ......^.
# ........
# .....v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 162
# Total moves: 40
# Most recent reward: -0.1
# Total rewards: -4
# ........
# ........
# ........
# .b.BB.b.
# ......^.
# ........
# .....v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 163
# Total moves: 40
# Most recent reward: -0.1
# Total rewards: -4
# ........
# ........
# ........
# .b.BB.b.
# ......^.
# ........
# .....v..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 164
# Total moves: 41
# Most recent reward: -0.1
# Total rewards: -4.1
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# .....<..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-4.100000000000001, -4.100000000000001]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "stay"]
actions: [2, 3]

# State 165
# Total moves: 41
# Most recent reward: -0.1
# Total rewards: -4.1
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# .....<..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 166
# Total moves: 41
# Most recent reward: -0.1
# Total rewards: -4.1
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# .....<..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 167
# Total moves: 41
# Most recent reward: -0.1
# Total rewards: -4.1
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# .....<..
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 168
# Total moves: 42
# Most recent reward: -0.1
# Total rewards: -4.2
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ....<...
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-4.200000000000001, -4.200000000000001]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "turn right"]
actions: [2, 1]

# State 169
# Total moves: 42
# Most recent reward: -0.1
# Total rewards: -4.2
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ....<...
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 170
# Total moves: 42
# Most recent reward: -0.1
# Total rewards: -4.2
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ....<...
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 171
# Total moves: 42
# Most recent reward: -0.1
# Total rewards: -4.2
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ....<...
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 172
# Total moves: 43
# Most recent reward: -0.1
# Total rewards: -4.3
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ....<...
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-4.300000000000001, -4.300000000000001]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn right", "turn left"]
actions: [1, 0]

# State 173
# Total moves: 43
# Most recent reward: -0.1
# Total rewards: -4.3
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ....<...
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 174
# Total moves: 43
# Most recent reward: -0.1
# Total rewards: -4.3
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ....<...
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 175
# Total moves: 43
# Most recent reward: -0.1
# Total rewards: -4.3
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ....<...
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 176
# Total moves: 44
# Most recent reward: -0.1
# Total rewards: -4.4
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ....<...
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-4.4, -4.4]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "stay"]
actions: [2, 3]

# State 177
# Total moves: 44
# Most recent reward: -0.1
# Total rewards: -4.4
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ....<...
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 178
# Total moves: 44
# Most recent reward: -0.1
# Total rewards: -4.4
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ....<...
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 179
# Total moves: 44
# Most recent reward: -0.1
# Total rewards: -4.4
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ....<...
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 180
# Total moves: 45
# Most recent reward: -0.1
# Total rewards: -4.5
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...<....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-4.5, -4.5]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn right", "stay"]
actions: [1, 3]

# State 181
# Total moves: 45
# Most recent reward: -0.1
# Total rewards: -4.5
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...<....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 182
# Total moves: 45
# Most recent reward: -0.1
# Total rewards: -4.5
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...<....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 183
# Total moves: 45
# Most recent reward: -0.1
# Total rewards: -4.5
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...<....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 184
# Total moves: 46
# Most recent reward: -0.1
# Total rewards: -4.6
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...^....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-4.6, -4.6]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "turn right"]
actions: [0, 1]

# State 185
# Total moves: 46
# Most recent reward: -0.1
# Total rewards: -4.6
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...^....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 186
# Total moves: 46
# Most recent reward: -0.1
# Total rewards: -4.6
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...^....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 187
# Total moves: 46
# Most recent reward: -0.1
# Total rewards: -4.6
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...^....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 188
# Total moves: 47
# Most recent reward: -0.1
# Total rewards: -4.7
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...^....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-4.699999999999999, -4.699999999999999]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "stay"]
actions: [0, 3]

# State 189
# Total moves: 47
# Most recent reward: -0.1
# Total rewards: -4.7
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...^....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 190
# Total moves: 47
# Most recent reward: -0.1
# Total rewards: -4.7
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...^....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 191
# Total moves: 47
# Most recent reward: -0.1
# Total rewards: -4.7
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...^....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 192
# Total moves: 48
# Most recent reward: -0.1
# Total rewards: -4.8
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...^....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-4.799999999999999, -4.799999999999999]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "stay"]
actions: [3, 3]

# State 193
# Total moves: 48
# Most recent reward: -0.1
# Total rewards: -4.8
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...^....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 194
# Total moves: 48
# Most recent reward: -0.1
# Total rewards: -4.8
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...^....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 195
# Total moves: 48
# Most recent reward: -0.1
# Total rewards: -4.8
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...^....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 196
# Total moves: 49
# Most recent reward: -0.1
# Total rewards: -4.9
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...^....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-4.899999999999999, -4.899999999999999]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "stay"]
actions: [0, 3]

# State 197
# Total moves: 49
# Most recent reward: -0.1
# Total rewards: -4.9
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...^....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 198
# Total moves: 49
# Most recent reward: -0.1
# Total rewards: -4.9
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...^....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 199
# Total moves: 49
# Most recent reward: -0.1
# Total rewards: -4.9
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...^....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 200
# Total moves: 50
# Most recent reward: -0.1
# Total rewards: -5
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...<....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-4.999999999999998, -4.999999999999998]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "stay"]
actions: [0, 3]

# State 201
# Total moves: 50
# Most recent reward: -0.1
# Total rewards: -5
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...<....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 202
# Total moves: 50
# Most recent reward: -0.1
# Total rewards: -5
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...<....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 203
# Total moves: 50
# Most recent reward: -0.1
# Total rewards: -5
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...<....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 204
# Total moves: 51
# Most recent reward: -0.1
# Total rewards: -5.1
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...<....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-5.099999999999998, -5.099999999999998]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn right", "turn left"]
actions: [1, 0]

# State 205
# Total moves: 51
# Most recent reward: -0.1
# Total rewards: -5.1
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...<....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 206
# Total moves: 51
# Most recent reward: -0.1
# Total rewards: -5.1
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...<....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 207
# Total moves: 51
# Most recent reward: -0.1
# Total rewards: -5.1
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ........
# ...<....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 208
# Total moves: 52
# Most recent reward: -0.1
# Total rewards: -5.2
# ........
# ........
# ......b.
# .b.BB.<.
# ........
# ........
# ...^....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-5.1999999999999975, -5.1999999999999975]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "stay"]
actions: [2, 3]

# State 209
# Total moves: 52
# Most recent reward: -0.1
# Total rewards: -5.2
# ........
# ........
# ......b.
# .b.BB.<.
# ........
# ........
# ...^....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 210
# Total moves: 52
# Most recent reward: -0.1
# Total rewards: -5.2
# ........
# ........
# ......b.
# .b.BB.<.
# ........
# ........
# ...^....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 211
# Total moves: 52
# Most recent reward: -0.1
# Total rewards: -5.2
# ........
# ........
# ......b.
# .b.BB.<.
# ........
# ........
# ...^....
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 212
# Total moves: 53
# Most recent reward: -0.1
# Total rewards: -5.3
# ........
# ........
# ......b.
# .b.BB.<.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-5.299999999999997, -5.299999999999997]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "turn left"]
actions: [3, 0]

# State 213
# Total moves: 53
# Most recent reward: -0.1
# Total rewards: -5.3
# ........
# ........
# ......b.
# .b.BB.<.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 214
# Total moves: 53
# Most recent reward: -0.1
# Total rewards: -5.3
# ........
# ........
# ......b.
# .b.BB.<.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 215
# Total moves: 53
# Most recent reward: -0.1
# Total rewards: -5.3
# ........
# ........
# ......b.
# .b.BB.<.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 216
# Total moves: 54
# Most recent reward: -0.1
# Total rewards: -5.4
# ........
# ........
# ......b.
# .b.BB.v.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-5.399999999999997, -5.399999999999997]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn right", "turn right"]
actions: [1, 1]

# State 217
# Total moves: 54
# Most recent reward: -0.1
# Total rewards: -5.4
# ........
# ........
# ......b.
# .b.BB.v.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 218
# Total moves: 54
# Most recent reward: -0.1
# Total rewards: -5.4
# ........
# ........
# ......b.
# .b.BB.v.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 219
# Total moves: 54
# Most recent reward: -0.1
# Total rewards: -5.4
# ........
# ........
# ......b.
# .b.BB.v.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 220
# Total moves: 55
# Most recent reward: -0.1
# Total rewards: -5.5
# ........
# ........
# ......b.
# .b.BB.<.
# ........
# ...>....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-5.4999999999999964, -5.4999999999999964]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "turn right"]
actions: [0, 1]

# State 221
# Total moves: 55
# Most recent reward: -0.1
# Total rewards: -5.5
# ........
# ........
# ......b.
# .b.BB.<.
# ........
# ...>....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 222
# Total moves: 55
# Most recent reward: -0.1
# Total rewards: -5.5
# ........
# ........
# ......b.
# .b.BB.<.
# ........
# ...>....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 223
# Total moves: 55
# Most recent reward: -0.1
# Total rewards: -5.5
# ........
# ........
# ......b.
# .b.BB.<.
# ........
# ...>....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 224
# Total moves: 56
# Most recent reward: -0.1
# Total rewards: -5.6
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-5.599999999999996, -5.599999999999996]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "turn left"]
actions: [3, 0]

# State 225
# Total moves: 56
# Most recent reward: -0.1
# Total rewards: -5.6
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 226
# Total moves: 56
# Most recent reward: -0.1
# Total rewards: -5.6
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 227
# Total moves: 56
# Most recent reward: -0.1
# Total rewards: -5.6
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 228
# Total moves: 57
# Most recent reward: -0.1
# Total rewards: -5.7
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-5.699999999999996, -5.699999999999996]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "move forward"]
actions: [2, 2]

# State 229
# Total moves: 57
# Most recent reward: -0.1
# Total rewards: -5.7
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 230
# Total moves: 57
# Most recent reward: -0.1
# Total rewards: -5.7
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 231
# Total moves: 57
# Most recent reward: -0.1
# Total rewards: -5.7
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 232
# Total moves: 58
# Most recent reward: -0.1
# Total rewards: -5.8
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-5.799999999999995, -5.799999999999995]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "turn left"]
actions: [0, 0]

# State 233
# Total moves: 58
# Most recent reward: -0.1
# Total rewards: -5.8
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 234
# Total moves: 58
# Most recent reward: -0.1
# Total rewards: -5.8
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 235
# Total moves: 58
# Most recent reward: -0.1
# Total rewards: -5.8
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 236
# Total moves: 59
# Most recent reward: -0.1
# Total rewards: -5.9
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-5.899999999999995, -5.899999999999995]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "turn left"]
actions: [2, 0]

# State 237
# Total moves: 59
# Most recent reward: -0.1
# Total rewards: -5.9
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 238
# Total moves: 59
# Most recent reward: -0.1
# Total rewards: -5.9
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 239
# Total moves: 59
# Most recent reward: -0.1
# Total rewards: -5.9
# ........
# ........
# ......b.
# .b.BB.^.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 240
# Total moves: 60
# Most recent reward: -0.1
# Total rewards: -6
# ........
# ........
# ......b.
# .b.BB.<.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-5.999999999999995, -5.999999999999995]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "stay"]
actions: [0, 3]

# State 241
# Total moves: 60
# Most recent reward: -0.1
# Total rewards: -6
# ........
# ........
# ......b.
# .b.BB.<.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 242
# Total moves: 60
# Most recent reward: -0.1
# Total rewards: -6
# ........
# ........
# ......b.
# .b.BB.<.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 243
# Total moves: 60
# Most recent reward: -0.1
# Total rewards: -6
# ........
# ........
# ......b.
# .b.BB.<.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 244
# Total moves: 61
# Most recent reward: -0.1
# Total rewards: -6.1
# ........
# ........
# ......b.
# .b.BB.<.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-6.099999999999994, -6.099999999999994]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "stay"]
actions: [2, 3]

# State 245
# Total moves: 61
# Most recent reward: -0.1
# Total rewards: -6.1
# ........
# ........
# ......b.
# .b.BB.<.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 246
# Total moves: 61
# Most recent reward: -0.1
# Total rewards: -6.1
# ........
# ........
# ......b.
# .b.BB.<.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 247
# Total moves: 61
# Most recent reward: -0.1
# Total rewards: -6.1
# ........
# ........
# ......b.
# .b.BB.<.
# ........
# ...^....
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 248
# Total moves: 62
# Most recent reward: -0.1
# Total rewards: -6.2
# ........
# ........
# ......b.
# .b.BB.<.
# ...^....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "big box"
ObservationString(1) = "field"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-6.199999999999994, -6.199999999999994]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "turn left"]
actions: [2, 0]

# State 249
# Total moves: 62
# Most recent reward: -0.1
# Total rewards: -6.2
# ........
# ........
# ......b.
# .b.BB.<.
# ...^....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "field"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 250
# Total moves: 62
# Most recent reward: -0.1
# Total rewards: -6.2
# ........
# ........
# ......b.
# .b.BB.<.
# ...^....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "field"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 251
# Total moves: 62
# Most recent reward: -0.1
# Total rewards: -6.2
# ........
# ........
# ......b.
# .b.BB.<.
# ...^....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "field"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 252
# Total moves: 63
# Most recent reward: -0.1
# Total rewards: -6.3
# ........
# ........
# ......b.
# .b.BB.v.
# ...^....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "big box"
ObservationString(1) = "field"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-6.299999999999994, -6.299999999999994]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "turn right"]
actions: [0, 1]

# State 253
# Total moves: 63
# Most recent reward: -0.1
# Total rewards: -6.3
# ........
# ........
# ......b.
# .b.BB.v.
# ...^....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "field"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 254
# Total moves: 63
# Most recent reward: -0.1
# Total rewards: -6.3
# ........
# ........
# ......b.
# .b.BB.v.
# ...^....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "field"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 255
# Total moves: 63
# Most recent reward: -0.1
# Total rewards: -6.3
# ........
# ........
# ......b.
# .b.BB.v.
# ...^....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "field"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 256
# Total moves: 64
# Most recent reward: -0.1
# Total rewards: -6.4
# ........
# ........
# ......b.
# .b.BB.<.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-6.399999999999993, -6.399999999999993]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "stay"]
actions: [3, 3]

# State 257
# Total moves: 64
# Most recent reward: -0.1
# Total rewards: -6.4
# ........
# ........
# ......b.
# .b.BB.<.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 258
# Total moves: 64
# Most recent reward: -0.1
# Total rewards: -6.4
# ........
# ........
# ......b.
# .b.BB.<.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 259
# Total moves: 64
# Most recent reward: -0.1
# Total rewards: -6.4
# ........
# ........
# ......b.
# .b.BB.<.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 260
# Total moves: 65
# Most recent reward: -0.1
# Total rewards: -6.5
# ........
# ........
# ......b.
# .b.BB.<.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-6.499999999999993, -6.499999999999993]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "turn left"]
actions: [3, 0]

# State 261
# Total moves: 65
# Most recent reward: -0.1
# Total rewards: -6.5
# ........
# ........
# ......b.
# .b.BB.<.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 262
# Total moves: 65
# Most recent reward: -0.1
# Total rewards: -6.5
# ........
# ........
# ......b.
# .b.BB.<.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 263
# Total moves: 65
# Most recent reward: -0.1
# Total rewards: -6.5
# ........
# ........
# ......b.
# .b.BB.<.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 264
# Total moves: 66
# Most recent reward: -0.1
# Total rewards: -6.6
# ........
# ........
# ......b.
# .b.BB.<.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-6.5999999999999925, -6.5999999999999925]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "turn right"]
actions: [0, 1]

# State 265
# Total moves: 66
# Most recent reward: -0.1
# Total rewards: -6.6
# ........
# ........
# ......b.
# .b.BB.<.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 266
# Total moves: 66
# Most recent reward: -0.1
# Total rewards: -6.6
# ........
# ........
# ......b.
# .b.BB.<.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 267
# Total moves: 66
# Most recent reward: -0.1
# Total rewards: -6.6
# ........
# ........
# ......b.
# .b.BB.<.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 268
# Total moves: 67
# Most recent reward: -0.1
# Total rewards: -6.7
# ........
# ........
# ......b.
# .b.BB.^.
# ...v....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-6.699999999999992, -6.699999999999992]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "move forward"]
actions: [0, 2]

# State 269
# Total moves: 67
# Most recent reward: -0.1
# Total rewards: -6.7
# ........
# ........
# ......b.
# .b.BB.^.
# ...v....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 270
# Total moves: 67
# Most recent reward: -0.1
# Total rewards: -6.7
# ........
# ........
# ......b.
# .b.BB.^.
# ...v....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 271
# Total moves: 67
# Most recent reward: -0.1
# Total rewards: -6.7
# ........
# ........
# ......b.
# .b.BB.^.
# ...v....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 272
# Total moves: 68
# Most recent reward: -0.1
# Total rewards: -6.8
# ........
# ........
# ......b.
# .b.BB.^.
# ...>....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-6.799999999999992, -6.799999999999992]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn right", "turn right"]
actions: [1, 1]

# State 273
# Total moves: 68
# Most recent reward: -0.1
# Total rewards: -6.8
# ........
# ........
# ......b.
# .b.BB.^.
# ...>....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 274
# Total moves: 68
# Most recent reward: -0.1
# Total rewards: -6.8
# ........
# ........
# ......b.
# .b.BB.^.
# ...>....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 275
# Total moves: 68
# Most recent reward: -0.1
# Total rewards: -6.8
# ........
# ........
# ......b.
# .b.BB.^.
# ...>....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 276
# Total moves: 69
# Most recent reward: -0.1
# Total rewards: -6.9
# ........
# ........
# ......b.
# .b.BB.^.
# ...v....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-6.8999999999999915, -6.8999999999999915]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "turn right"]
actions: [2, 1]

# State 277
# Total moves: 69
# Most recent reward: -0.1
# Total rewards: -6.9
# ........
# ........
# ......b.
# .b.BB.^.
# ...v....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 278
# Total moves: 69
# Most recent reward: -0.1
# Total rewards: -6.9
# ........
# ........
# ......b.
# .b.BB.^.
# ...v....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 279
# Total moves: 69
# Most recent reward: -0.1
# Total rewards: -6.9
# ........
# ........
# ......b.
# .b.BB.^.
# ...v....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 280
# Total moves: 70
# Most recent reward: -0.1
# Total rewards: -7
# ........
# ........
# ......b.
# .b.BB.^.
# ...v....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-6.999999999999991, -6.999999999999991]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn right", "turn right"]
actions: [1, 1]

# State 281
# Total moves: 70
# Most recent reward: -0.1
# Total rewards: -7
# ........
# ........
# ......b.
# .b.BB.^.
# ...v....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 282
# Total moves: 70
# Most recent reward: -0.1
# Total rewards: -7
# ........
# ........
# ......b.
# .b.BB.^.
# ...v....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 283
# Total moves: 70
# Most recent reward: -0.1
# Total rewards: -7
# ........
# ........
# ......b.
# .b.BB.^.
# ...v....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 284
# Total moves: 71
# Most recent reward: -0.1
# Total rewards: -7.1
# ........
# ........
# ......b.
# .b.BB.^.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-7.099999999999991, -7.099999999999991]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "stay"]
actions: [3, 3]

# State 285
# Total moves: 71
# Most recent reward: -0.1
# Total rewards: -7.1
# ........
# ........
# ......b.
# .b.BB.^.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 286
# Total moves: 71
# Most recent reward: -0.1
# Total rewards: -7.1
# ........
# ........
# ......b.
# .b.BB.^.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 287
# Total moves: 71
# Most recent reward: -0.1
# Total rewards: -7.1
# ........
# ........
# ......b.
# .b.BB.^.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 288
# Total moves: 72
# Most recent reward: -0.1
# Total rewards: -7.2
# ........
# ........
# ......b.
# .b.BB.^.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
Rewards() = [-0.1, -0.1]
Returns() = [-7.19999999999999, -7.19999999999999]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn right", "turn right"]
actions: [1, 1]

# State 289
# Total moves: 72
# Most recent reward: -0.1
# Total rewards: -7.2
# ........
# ........
# ......b.
# .b.BB.^.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 290
# Total moves: 72
# Most recent reward: -0.1
# Total rewards: -7.2
# ........
# ........
# ......b.
# .b.BB.^.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 291
# Total moves: 72
# Most recent reward: -0.1
# Total rewards: -7.2
# ........
# ........
# ......b.
# .b.BB.^.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "small box"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◯◯◉◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 292
# Total moves: 73
# Most recent reward: -0.1
# Total rewards: -7.3
# ........
# ........
# ......b.
# .b.BB.>.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-7.29999999999999, -7.29999999999999]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "turn right"]
actions: [2, 1]

# State 293
# Total moves: 73
# Most recent reward: -0.1
# Total rewards: -7.3
# ........
# ........
# ......b.
# .b.BB.>.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 294
# Total moves: 73
# Most recent reward: -0.1
# Total rewards: -7.3
# ........
# ........
# ......b.
# .b.BB.>.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 295
# Total moves: 73
# Most recent reward: -0.1
# Total rewards: -7.3
# ........
# ........
# ......b.
# .b.BB.>.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 296
# Total moves: 74
# Most recent reward: -0.1
# Total rewards: -7.4
# ........
# ........
# ......b.
# .b.BB.>.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-7.39999999999999, -7.39999999999999]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "move forward"]
actions: [0, 2]

# State 297
# Total moves: 74
# Most recent reward: -0.1
# Total rewards: -7.4
# ........
# ........
# ......b.
# .b.BB.>.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 298
# Total moves: 74
# Most recent reward: -0.1
# Total rewards: -7.4
# ........
# ........
# ......b.
# .b.BB.>.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 299
# Total moves: 74
# Most recent reward: -0.1
# Total rewards: -7.4
# ........
# ........
# ......b.
# .b.BB.>.
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 300
# Total moves: 75
# Most recent reward: -0.1
# Total rewards: -7.5
# ........
# ........
# ......b.
# .b.BB..>
# ...v....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-7.499999999999989, -7.499999999999989]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "turn right"]
actions: [0, 1]

# State 301
# Total moves: 75
# Most recent reward: -0.1
# Total rewards: -7.5
# ........
# ........
# ......b.
# .b.BB..>
# ...v....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 302
# Total moves: 75
# Most recent reward: -0.1
# Total rewards: -7.5
# ........
# ........
# ......b.
# .b.BB..>
# ...v....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 303
# Total moves: 75
# Most recent reward: -0.1
# Total rewards: -7.5
# ........
# ........
# ......b.
# .b.BB..>
# ...v....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 304
# Total moves: 76
# Most recent reward: -0.1
# Total rewards: -7.6
# ........
# ........
# ......b.
# .b.BB..>
# ...>....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-7.599999999999989, -7.599999999999989]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "turn left"]
actions: [3, 0]

# State 305
# Total moves: 76
# Most recent reward: -0.1
# Total rewards: -7.6
# ........
# ........
# ......b.
# .b.BB..>
# ...>....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 306
# Total moves: 76
# Most recent reward: -0.1
# Total rewards: -7.6
# ........
# ........
# ......b.
# .b.BB..>
# ...>....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 307
# Total moves: 76
# Most recent reward: -0.1
# Total rewards: -7.6
# ........
# ........
# ......b.
# .b.BB..>
# ...>....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 308
# Total moves: 77
# Most recent reward: -0.1
# Total rewards: -7.7
# ........
# ........
# ......b.
# .b.BB..^
# ...>....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-7.699999999999989, -7.699999999999989]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "move forward"]
actions: [2, 2]

# State 309
# Total moves: 77
# Most recent reward: -0.1
# Total rewards: -7.7
# ........
# ........
# ......b.
# .b.BB..^
# ...>....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 310
# Total moves: 77
# Most recent reward: -0.1
# Total rewards: -7.7
# ........
# ........
# ......b.
# .b.BB..^
# ...>....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 311
# Total moves: 77
# Most recent reward: -0.1
# Total rewards: -7.7
# ........
# ........
# ......b.
# .b.BB..^
# ...>....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 312
# Total moves: 78
# Most recent reward: -0.1
# Total rewards: -7.8
# ........
# ........
# ......b.
# .b.BB..^
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-7.799999999999988, -7.799999999999988]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "turn right"]
actions: [3, 1]

# State 313
# Total moves: 78
# Most recent reward: -0.1
# Total rewards: -7.8
# ........
# ........
# ......b.
# .b.BB..^
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 314
# Total moves: 78
# Most recent reward: -0.1
# Total rewards: -7.8
# ........
# ........
# ......b.
# .b.BB..^
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 315
# Total moves: 78
# Most recent reward: -0.1
# Total rewards: -7.8
# ........
# ........
# ......b.
# .b.BB..^
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "field"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◉◯◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 316
# Total moves: 79
# Most recent reward: -0.1
# Total rewards: -7.9
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-7.899999999999988, -7.899999999999988]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "stay"]
actions: [0, 3]

# State 317
# Total moves: 79
# Most recent reward: -0.1
# Total rewards: -7.9
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 318
# Total moves: 79
# Most recent reward: -0.1
# Total rewards: -7.9
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 319
# Total moves: 79
# Most recent reward: -0.1
# Total rewards: -7.9
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 320
# Total moves: 80
# Most recent reward: -0.1
# Total rewards: -8
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-7.999999999999988, -7.999999999999988]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "move forward"]
actions: [0, 2]

# State 321
# Total moves: 80
# Most recent reward: -0.1
# Total rewards: -8
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 322
# Total moves: 80
# Most recent reward: -0.1
# Total rewards: -8
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 323
# Total moves: 80
# Most recent reward: -0.1
# Total rewards: -8
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 324
# Total moves: 81
# Most recent reward: -5.1
# Total rewards: -13.1
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-5.1, -5.1]
Returns() = [-13.099999999999987, -13.099999999999987]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "move forward"]
actions: [0, 2]

# State 325
# Total moves: 81
# Most recent reward: -5.1
# Total rewards: -13.1
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 326
# Total moves: 81
# Most recent reward: -5.1
# Total rewards: -13.1
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 327
# Total moves: 81
# Most recent reward: -5.1
# Total rewards: -13.1
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 328
# Total moves: 82
# Most recent reward: -5.1
# Total rewards: -18.2
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-5.1, -5.1]
Returns() = [-18.19999999999999, -18.19999999999999]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn right", "move forward"]
actions: [1, 2]

# State 329
# Total moves: 82
# Most recent reward: -5.1
# Total rewards: -18.2
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 330
# Total moves: 82
# Most recent reward: -5.1
# Total rewards: -18.2
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 331
# Total moves: 82
# Most recent reward: -5.1
# Total rewards: -18.2
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 332
# Total moves: 83
# Most recent reward: -0.1
# Total rewards: -18.3
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-18.29999999999999, -18.29999999999999]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "turn right"]
actions: [2, 1]

# State 333
# Total moves: 83
# Most recent reward: -0.1
# Total rewards: -18.3
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 334
# Total moves: 83
# Most recent reward: -0.1
# Total rewards: -18.3
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 335
# Total moves: 83
# Most recent reward: -0.1
# Total rewards: -18.3
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 336
# Total moves: 84
# Most recent reward: -0.1
# Total rewards: -18.4
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-18.39999999999999, -18.39999999999999]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "stay"]
actions: [3, 3]

# State 337
# Total moves: 84
# Most recent reward: -0.1
# Total rewards: -18.4
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 338
# Total moves: 84
# Most recent reward: -0.1
# Total rewards: -18.4
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 339
# Total moves: 84
# Most recent reward: -0.1
# Total rewards: -18.4
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 340
# Total moves: 85
# Most recent reward: -0.1
# Total rewards: -18.5
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-18.499999999999993, -18.499999999999993]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "move forward"]
actions: [0, 2]

# State 341
# Total moves: 85
# Most recent reward: -0.1
# Total rewards: -18.5
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 342
# Total moves: 85
# Most recent reward: -0.1
# Total rewards: -18.5
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 343
# Total moves: 85
# Most recent reward: -0.1
# Total rewards: -18.5
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 344
# Total moves: 86
# Most recent reward: -5.1
# Total rewards: -23.6
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-5.1, -5.1]
Returns() = [-23.599999999999994, -23.599999999999994]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "turn left"]
actions: [0, 0]

# State 345
# Total moves: 86
# Most recent reward: -5.1
# Total rewards: -23.6
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 346
# Total moves: 86
# Most recent reward: -5.1
# Total rewards: -23.6
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 347
# Total moves: 86
# Most recent reward: -5.1
# Total rewards: -23.6
# ........
# ........
# ......b.
# .b.BB..>
# ....>...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 348
# Total moves: 87
# Most recent reward: -0.1
# Total rewards: -23.7
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-23.699999999999996, -23.699999999999996]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "stay"]
actions: [3, 3]

# State 349
# Total moves: 87
# Most recent reward: -0.1
# Total rewards: -23.7
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 350
# Total moves: 87
# Most recent reward: -0.1
# Total rewards: -23.7
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 351
# Total moves: 87
# Most recent reward: -0.1
# Total rewards: -23.7
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 352
# Total moves: 88
# Most recent reward: -0.1
# Total rewards: -23.8
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-23.799999999999997, -23.799999999999997]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["stay", "stay"]
actions: [3, 3]

# State 353
# Total moves: 88
# Most recent reward: -0.1
# Total rewards: -23.8
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 354
# Total moves: 88
# Most recent reward: -0.1
# Total rewards: -23.8
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 355
# Total moves: 88
# Most recent reward: -0.1
# Total rewards: -23.8
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 356
# Total moves: 89
# Most recent reward: -0.1
# Total rewards: -23.9
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-23.9, -23.9]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "move forward"]
actions: [2, 2]

# State 357
# Total moves: 89
# Most recent reward: -0.1
# Total rewards: -23.9
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 358
# Total moves: 89
# Most recent reward: -0.1
# Total rewards: -23.9
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 359
# Total moves: 89
# Most recent reward: -0.1
# Total rewards: -23.9
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 360
# Total moves: 90
# Most recent reward: -10.1
# Total rewards: -34
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-10.1, -10.1]
Returns() = [-34.0, -34.0]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "stay"]
actions: [0, 3]

# State 361
# Total moves: 90
# Most recent reward: -10.1
# Total rewards: -34
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 362
# Total moves: 90
# Most recent reward: -10.1
# Total rewards: -34
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 363
# Total moves: 90
# Most recent reward: -10.1
# Total rewards: -34
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 364
# Total moves: 91
# Most recent reward: -0.1
# Total rewards: -34.1
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-34.1, -34.1]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "move forward"]
actions: [2, 2]

# State 365
# Total moves: 91
# Most recent reward: -0.1
# Total rewards: -34.1
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 366
# Total moves: 91
# Most recent reward: -0.1
# Total rewards: -34.1
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 367
# Total moves: 91
# Most recent reward: -0.1
# Total rewards: -34.1
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 368
# Total moves: 92
# Most recent reward: -10.1
# Total rewards: -44.2
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-10.1, -10.1]
Returns() = [-44.2, -44.2]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "stay"]
actions: [0, 3]

# State 369
# Total moves: 92
# Most recent reward: -10.1
# Total rewards: -44.2
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 370
# Total moves: 92
# Most recent reward: -10.1
# Total rewards: -44.2
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 371
# Total moves: 92
# Most recent reward: -10.1
# Total rewards: -44.2
# ........
# ........
# ......b.
# .b.BB..>
# ....^...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 372
# Total moves: 93
# Most recent reward: -0.1
# Total rewards: -44.3
# ........
# ........
# ......b.
# .b.BB..>
# ....<...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-44.300000000000004, -44.300000000000004]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn right", "turn right"]
actions: [1, 1]

# State 373
# Total moves: 93
# Most recent reward: -0.1
# Total rewards: -44.3
# ........
# ........
# ......b.
# .b.BB..>
# ....<...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 374
# Total moves: 93
# Most recent reward: -0.1
# Total rewards: -44.3
# ........
# ........
# ......b.
# .b.BB..>
# ....<...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 375
# Total moves: 93
# Most recent reward: -0.1
# Total rewards: -44.3
# ........
# ........
# ......b.
# .b.BB..>
# ....<...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 376
# Total moves: 94
# Most recent reward: -0.1
# Total rewards: -44.4
# ........
# ........
# ......b.
# .b.BB..>
# ....<...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-44.400000000000006, -44.400000000000006]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "move forward"]
actions: [0, 2]

# State 377
# Total moves: 94
# Most recent reward: -0.1
# Total rewards: -44.4
# ........
# ........
# ......b.
# .b.BB..>
# ....<...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 378
# Total moves: 94
# Most recent reward: -0.1
# Total rewards: -44.4
# ........
# ........
# ......b.
# .b.BB..>
# ....<...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 379
# Total moves: 94
# Most recent reward: -0.1
# Total rewards: -44.4
# ........
# ........
# ......b.
# .b.BB..>
# ....<...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 380
# Total moves: 95
# Most recent reward: -5.1
# Total rewards: -49.5
# ........
# ........
# ......b.
# .b.BB..>
# ....<...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-5.1, -5.1]
Returns() = [-49.50000000000001, -49.50000000000001]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "stay"]
actions: [2, 3]

# State 381
# Total moves: 95
# Most recent reward: -5.1
# Total rewards: -49.5
# ........
# ........
# ......b.
# .b.BB..>
# ....<...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 382
# Total moves: 95
# Most recent reward: -5.1
# Total rewards: -49.5
# ........
# ........
# ......b.
# .b.BB..>
# ....<...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 383
# Total moves: 95
# Most recent reward: -5.1
# Total rewards: -49.5
# ........
# ........
# ......b.
# .b.BB..>
# ....<...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 384
# Total moves: 96
# Most recent reward: -0.1
# Total rewards: -49.6
# ........
# ........
# ......b.
# .b.BB..>
# ....<...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-49.60000000000001, -49.60000000000001]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["move forward", "stay"]
actions: [2, 3]

# State 385
# Total moves: 96
# Most recent reward: -0.1
# Total rewards: -49.6
# ........
# ........
# ......b.
# .b.BB..>
# ....<...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 386
# Total moves: 96
# Most recent reward: -0.1
# Total rewards: -49.6
# ........
# ........
# ......b.
# .b.BB..>
# ....<...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 387
# Total moves: 96
# Most recent reward: -0.1
# Total rewards: -49.6
# ........
# ........
# ......b.
# .b.BB..>
# ....<...
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 388
# Total moves: 97
# Most recent reward: -0.1
# Total rewards: -49.7
# ........
# ........
# ......b.
# .b.BB..>
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-49.70000000000001, -49.70000000000001]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn right", "move forward"]
actions: [1, 2]

# State 389
# Total moves: 97
# Most recent reward: -0.1
# Total rewards: -49.7
# ........
# ........
# ......b.
# .b.BB..>
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 390
# Total moves: 97
# Most recent reward: -0.1
# Total rewards: -49.7
# ........
# ........
# ......b.
# .b.BB..>
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 391
# Total moves: 97
# Most recent reward: -0.1
# Total rewards: -49.7
# ........
# ........
# ......b.
# .b.BB..>
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "move forward"
action: 2

# State 392
# Total moves: 98
# Most recent reward: -5.1
# Total rewards: -54.8
# ........
# ........
# ......b.
# .b.BB..>
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1, 0, 2]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1, 0, 2"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-5.1, -5.1]
Returns() = [-54.80000000000001, -54.80000000000001]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn left", "turn right"]
actions: [0, 1]

# State 393
# Total moves: 98
# Most recent reward: -5.1
# Total rewards: -54.8
# ........
# ........
# ......b.
# .b.BB..>
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1, 0, 2, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1, 0, 2, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 394
# Total moves: 98
# Most recent reward: -5.1
# Total rewards: -54.8
# ........
# ........
# ......b.
# .b.BB..>
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1, 0, 2, 0, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1, 0, 2, 0, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 395
# Total moves: 98
# Most recent reward: -5.1
# Total rewards: -54.8
# ........
# ........
# ......b.
# .b.BB..>
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1, 0, 2, 0, 1, 1, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1, 0, 2, 0, 1, 1, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 396
# Total moves: 99
# Most recent reward: -0.1
# Total rewards: -54.9
# ........
# ........
# ......b.
# .b.BB..>
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1, 0, 2, 0, 1, 1, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1, 0, 2, 0, 1, 1, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = True
CurrentPlayer() = -2
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-54.90000000000001, -54.90000000000001]
LegalActions(0) = [0, 1, 2, 3]
LegalActions(1) = [0, 1, 2, 3]
StringLegalActions(0) = ["turn left", "turn right", "move forward", "stay"]
StringLegalActions(1) = ["turn left", "turn right", "move forward", "stay"]

# Apply joint action ["turn right", "stay"]
actions: [1, 3]

# State 397
# Total moves: 99
# Most recent reward: -0.1
# Total rewards: -54.9
# ........
# ........
# ......b.
# .b.BB..>
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1, 0, 2, 0, 1, 1, 1, 3, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1, 0, 2, 0, 1, 1, 1, 3, 1, 3"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn left"
action: 0

# State 398
# Total moves: 99
# Most recent reward: -0.1
# Total rewards: -54.9
# ........
# ........
# ......b.
# .b.BB..>
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1, 0, 2, 0, 1, 1, 1, 3, 1, 3, 0]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1, 0, 2, 0, 1, 1, 1, 3, 1, 3, 0"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{0, 0.900000000000}, {1, 0.100000000000}]
LegalActions() = [0, 1]
StringLegalActions() = ["turn left", "turn right"]

# Apply action "turn right"
action: 1

# State 399
# Total moves: 99
# Most recent reward: -0.1
# Total rewards: -54.9
# ........
# ........
# ......b.
# .b.BB..>
# ...<....
# ........
# ........
# ........
IsTerminal() = False
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1, 0, 2, 0, 1, 1, 1, 3, 1, 3, 0, 1]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1, 0, 2, 0, 1, 1, 1, 3, 1, 3, 0, 1"
IsChanceNode() = True
IsSimultaneousNode() = False
CurrentPlayer() = -1
ObservationString(0) = "field"
ObservationString(1) = "wall"
ObservationTensor(0): ◉◯◯◯◯
ObservationTensor(1): ◯◉◯◯◯
ChanceOutcomes() = [{2, 0.500000000000}, {3, 0.500000000000}]
LegalActions() = [2, 3]
StringLegalActions() = ["move forward", "stay"]

# Apply action "stay"
action: 3

# State 400
# Total moves: 100
# Most recent reward: -0.1
# Total rewards: -55
# ........
# ........
# ......b.
# .b.BB..>
# ...^....
# ........
# ........
# ........
IsTerminal() = True
History() = [3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1, 0, 2, 0, 1, 1, 1, 3, 1, 3, 0, 1, 3]
HistoryString() = "3, 2, 1, 0, 2, 0, 0, 1, 0, 3, 0, 1, 1, 1, 2, 0, 2, 1, 1, 3, 0, 0, 1, 0, 3, 3, 1, 1, 0, 3, 2, 0, 1, 1, 2, 0, 0, 1, 1, 2, 3, 1, 0, 1, 3, 2, 1, 1, 1, 2, 0, 0, 0, 1, 2, 1, 2, 0, 1, 2, 3, 2, 1, 0, 2, 2, 3, 1, 0, 3, 2, 3, 0, 1, 3, 2, 2, 0, 1, 3, 2, 0, 0, 0, 2, 0, 2, 1, 0, 2, 1, 1, 1, 0, 2, 3, 0, 0, 1, 2, 0, 0, 0, 0, 2, 3, 0, 1, 1, 2, 3, 0, 1, 0, 2, 1, 3, 0, 0, 2, 0, 0, 1, 1, 3, 3, 2, 0, 0, 3, 2, 1, 0, 1, 3, 0, 3, 1, 0, 2, 3, 0, 0, 1, 3, 0, 3, 0, 0, 3, 2, 2, 1, 1, 3, 0, 0, 0, 0, 3, 1, 1, 1, 0, 3, 3, 1, 0, 0, 3, 1, 0, 1, 0, 3, 1, 2, 0, 0, 3, 1, 1, 0, 0, 3, 0, 0, 1, 0, 3, 2, 1, 1, 1, 3, 1, 2, 0, 0, 3, 1, 2, 0, 0, 2, 2, 3, 0, 1, 3, 2, 1, 1, 1, 2, 1, 0, 1, 1, 3, 2, 3, 0, 0, 2, 1, 3, 0, 1, 3, 0, 1, 1, 1, 3, 0, 3, 1, 1, 3, 3, 3, 0, 0, 3, 0, 3, 0, 0, 2, 0, 3, 1, 1, 2, 1, 0, 0, 0, 2, 2, 3, 0, 0, 2, 3, 0, 0, 0, 2, 1, 1, 0, 0, 3, 0, 1, 0, 0, 3, 3, 0, 1, 1, 3, 2, 2, 1, 1, 2, 0, 0, 1, 1, 3, 2, 0, 1, 0, 2, 0, 3, 1, 0, 2, 2, 3, 0, 0, 2, 2, 0, 1, 0, 2, 0, 1, 0, 0, 3, 3, 3, 0, 0, 2, 3, 0, 0, 1, 2, 0, 1, 0, 0, 3, 0, 2, 0, 1, 3, 1, 1, 0, 1, 3, 2, 1, 1, 1, 3, 1, 1, 0, 1, 2, 3, 3, 0, 0, 3, 1, 1, 1, 0, 3, 2, 1, 1, 1, 2, 0, 2, 0, 0, 2, 0, 1, 0, 1, 3, 3, 0, 1, 0, 3, 2, 2, 0, 1, 3, 3, 1, 1, 0, 2, 0, 3, 1, 1, 3, 0, 2, 1, 0, 2, 0, 2, 1, 0, 3, 1, 2, 1, 1, 2, 2, 1, 1, 1, 2, 3, 3, 1, 0, 2, 0, 2, 1, 0, 3, 0, 0, 0, 1, 3, 3, 3, 1, 1, 2, 3, 3, 1, 1, 3, 2, 2, 0, 0, 2, 0, 3, 1, 0, 2, 2, 2, 0, 0, 3, 0, 3, 0, 1, 3, 1, 1, 1, 1, 3, 0, 2, 1, 0, 2, 2, 3, 1, 1, 3, 2, 3, 0, 0, 2, 1, 2, 1, 0, 2, 0, 1, 1, 1, 3, 1, 3, 0, 1, 3"
IsChanceNode() = False
IsSimultaneousNode() = False
CurrentPlayer() = -4
ObservationString(0) = "big box"
ObservationString(1) = "wall"
ObservationTensor(0): ◯◯◯◯◉
ObservationTensor(1): ◯◉◯◯◯
Rewards() = [-0.1, -0.1]
Returns() = [-55.000000000000014, -55.000000000000014]
