gnn_jsp_env (Deepcopy Wrapper)
[1]:
from collections import namedtuple
from copy import deepcopy, copy
[2]:
from gymnasium.spaces import Box, Discrete
from jsp_instance_utils.instances import ft06, ft06_makespan
from jsp_vis.console import gantt_chart_console
[3]:
from gymcts.gymcts_agent import GymctsAgent
from gymcts.gymcts_action_history_wrapper import ActionHistoryMCTSGymEnvWrapper
from gymcts.gymcts_deepcopy_wrapper import DeepCopyMCTSGymEnvWrapper
from gymnasium.wrappers import TransformReward, NormalizeReward
from gymcts.logger import log
[4]:
import gymnasium as gym
[5]:
from gymnasium.core import ActType, ObsType
from typing import Any, SupportsFloat
[6]:
import random
[7]:
import pandas as pd
import numpy as np
[8]:
# Immutable record for a single operation: the job it belongs to, its position
# within that job, its index across all jobs, the machine it requires and its
# processing time.
Operation = namedtuple(
    "Operation",
    "job_id op_id unique_op_id machine_type duration",
)
[9]:
def get_legal_pos(op_dur, job_ready_time, possible_pos, mch_infos):
    """
    Returns the positions which fit the given operation duration,
    considering that the operation can only start when the required machine is free
    and the job is ready (the previous operations of the job are completed)

    :param op_dur: duration of the operation that should be placed
    :param job_ready_time: time at which the job of the operation is ready
    :param possible_pos: non-empty array of candidate slot indices on the machine
        (assumed ascending, as produced by np.where in the caller)
    :param mch_infos: dictionary of the machine holding the arrays 'start_times' and 'end_times'
    :returns: tuple (legal_pos_idx, legal_pos, possible_pos_end_times) where legal_pos_idx
        are the indices into possible_pos whose preceding gap is long enough, legal_pos
        are the corresponding slot indices and possible_pos_end_times holds, for every
        candidate slot, the time at which the gap in front of it opens
    """
    end_times = mch_infos['end_times']
    first_pos = possible_pos[0]
    if first_pos > 0:
        # The gap in front of the first candidate opens when its predecessor on the machine ends
        earliest_start_time = max(job_ready_time, end_times[first_pos - 1])
    else:
        # Slot 0 has no predecessor on the machine. Indexing with -1 here would wrap
        # around and read the end time of the LAST slot instead.
        earliest_start_time = job_ready_time
    # Every further gap opens when the previous candidate slot ends
    possible_pos_end_times = np.append(earliest_start_time, end_times[possible_pos])[:-1]
    possible_gaps = mch_infos['start_times'][possible_pos] - possible_pos_end_times
    legal_pos_idx = np.where(op_dur <= possible_gaps)[0]
    legal_pos = np.take(possible_pos, legal_pos_idx)
    return legal_pos_idx, legal_pos, possible_pos_end_times
[10]:
def put_in_the_end(op, job_ready_time, mch_ready_time, mch_infos):
    """
    Schedules an operation behind all operations already placed on the machine.

    The first slot whose start time is still -1 is filled in place.

    :param op: operation to schedule (its unique_op_id and duration are read)
    :param job_ready_time: time at which the job of the operation is ready
    :param mch_ready_time: time at which the machine is ready
    :param mch_infos: dictionary of the machine holding the arrays 'op_ids',
        'start_times' and 'end_times'; modified in place
    :returns: the start time assigned to the operation
    """
    # First slot that has not been used yet
    free_slot = np.flatnonzero(mch_infos['start_times'] == -1)[0]
    # The operation starts as soon as both the job and the machine are ready
    begin = mch_ready_time if mch_ready_time > job_ready_time else job_ready_time
    for key, value in (('op_ids', op.unique_op_id),
                       ('start_times', begin),
                       ('end_times', begin + op.duration)):
        mch_infos[key][free_slot] = value
    return begin
[11]:
def put_in_between(op, legal_pos_idx, legal_pos, possible_pos_end_times, mch_infos):
    """
    Schedules an operation into the earliest fitting gap between scheduled operations.

    :param op: operation to schedule (its unique_op_id and duration are read)
    :param legal_pos_idx: indices of the fitting gaps within possible_pos_end_times
    :param legal_pos: slot indices on the machine that belong to the fitting gaps
    :param possible_pos_end_times: times at which the candidate gaps open
    :param mch_infos: dictionary of the machine holding the arrays 'op_ids',
        'start_times' and 'end_times'; modified in place
    :returns: the start time assigned to the operation
    """
    # The first legal entry is the earliest gap
    gap_idx = legal_pos_idx[0]
    slot = legal_pos[0]
    begin = possible_pos_end_times[gap_idx]
    inserted = {
        'op_ids': op.unique_op_id,
        'start_times': begin,
        'end_times': begin + op.duration,
    }
    for key, value in inserted.items():
        column = mch_infos[key]
        # Insert at the slot and drop the last entry so the array keeps its length
        column[:] = np.insert(column, slot, value)[:-1]
    return begin
[12]:
def get_end_time_lbs(jobs, machine_infos):
    """
    Calculates the end time lower bounds for all operations

    A scheduled operation gets its actual end time. An unscheduled operation gets the
    lower bound of its predecessor in the job plus its own duration (or just its own
    duration if it is the first operation of the job).

    :param jobs: array of jobs, where each job is an array of operations
    :param machine_infos: dictionary where the keys are machine indices and the values contain
    the ids of the operations scheduled on the machine (in the scheduled order), and the
    corresponding start and end times
    :returns: np array of shape (number of jobs, length of the first job) containing the
    end time lower bounds of all operations
    """
    # Build the lookup "operation id -> end time" once instead of searching a flat
    # list for every operation. Unused slots carry the id -1 and are skipped.
    scheduled_end_times = {}
    for m in machine_infos.values():
        for op_id, end_time in zip(m['op_ids'], m['end_times']):
            if op_id >= 0:
                scheduled_end_times.setdefault(int(op_id), end_time)

    num_ops_per_job = len(jobs[0]) if len(jobs) > 0 else 0
    lbs = -1 * np.ones((len(jobs), num_ops_per_job))
    for i, job in enumerate(jobs):
        for j, op in enumerate(job):
            if op.unique_op_id in scheduled_end_times:
                lbs[i][j] = scheduled_end_times[op.unique_op_id]
            elif j > 0:
                lbs[i][j] = lbs[i][j - 1] + op.duration
            else:
                lbs[i][j] = op.duration
    return lbs
[13]:
def get_op_nbghs(op, machine_infos):
    """
    Finds a given operation's predecessor and successor on the machine where the operation is carried out

    :param op: operation whose unique_op_id is looked up
    :param machine_infos: dictionary where the keys are machine indices and the values contain
    the array 'op_ids' of the operations scheduled on the machine (in the scheduled order)
    :returns: tuple (pred, succ) of operation ids; the id of the operation itself is used
    for pred if it is the first operation on the machine and for succ if no operation
    is scheduled after it
    :raises ValueError: if the operation is not scheduled on any machine
    """
    for info in machine_infos.values():
        op_ids = np.asarray(info['op_ids'])
        hits = np.flatnonzero(op_ids == op.unique_op_id)
        if hits.size > 0:
            pos = int(hits[0])
            break
    else:
        # Previously an unbound local was hit before the (always true) assertion could fire
        raise ValueError("The operation's unique id was not found in the machine informations")

    # First operation on the machine: it is its own predecessor
    pred = op_ids[pos - 1] if pos > 0 else op_ids[pos]

    # Last slot of the machine, or the next slot is still unused (-1): it is its own successor
    if pos + 1 < op_ids.shape[-1]:
        succ_temp = op_ids[pos + 1]
    else:
        succ_temp = op_ids[pos]
    succ = op.unique_op_id if succ_temp < 0 else succ_temp
    return pred, succ
[14]:
def get_first_ops(state):
    """
    Collects the unique index of the first operation of every job.

    :param state: state dictionary; only the lengths of state['features'] (one entry
    per operation) and state['jobs'] (one entry per job) are used
    :returns: np array with one operation index per job
    """
    total_ops = len(state['features'])
    job_count = len(state['jobs'])
    # Lay the operation indices out as one row per job and keep the first column
    op_grid = np.arange(total_ops).reshape(job_count, -1)
    return op_grid[:, 0]
[15]:
class GNNJobShopModel():
def __init__(self, **kwargs):
pass
@staticmethod
def random_problem(num_jobs, num_ops_per_job, num_machines, max_duration=10):
remaining_operations = []
unique_op_id = 0
for i in range(num_jobs):
job = []
for j in range(num_ops_per_job):
job.append(Operation(i, j, unique_op_id, random.randint(0, num_machines - 1),
random.randint(0, max_duration - 1)))
unique_op_id += 1
remaining_operations.append(job)
schedule = [[] for _ in range(num_machines)]
num_ops = num_jobs * num_machines
# Number of operations scheduled on each machine
ops_per_machine = [len([op for job in remaining_operations for op in job if op.machine_type == m]) for m in
range(num_machines)]
# Information for each machine: the ids of the operations scheduled on it (in the scheduled order), and the
# corresponding start and end times
machine_infos = {m: {'op_ids': -1 * np.ones(ops_per_machine[m], dtype=np.int32),
'start_times': -1 * np.ones(ops_per_machine[m], dtype=np.int32),
'end_times': -1 * np.ones(ops_per_machine[m], dtype=np.int32)} for m in
range(num_machines)}
# Time at which the last scheduled operation ends for each job
last_job_ops = [-1 for _ in range(num_jobs)]
# Time at which the last scheduled operation ends on each machine
last_machine_ops = [-1 for _ in range(num_machines)]
jobs = deepcopy(remaining_operations)
adj_matrix = GNNJobShopModel.init_adj_matrix(num_ops, num_jobs)
features = GNNJobShopModel.init_features(jobs)
node_states = np.array([1 if i % num_ops_per_job == 0 else 0 for i in range(num_ops)],
dtype=np.single)
return {'remaining_ops': remaining_operations, 'schedule': schedule, 'machine_infos': machine_infos,
'last_job_ops': last_job_ops, 'last_mch_ops': last_machine_ops, 'adj_matrix': adj_matrix,
'features': features, 'node_states': node_states, 'jobs': jobs}
@staticmethod
def _schedule_op(job_id, state):
possible = False
if len(state['remaining_ops'][job_id]) > 0:
op = state['remaining_ops'][job_id].pop(0)
start_time, flag = GNNJobShopModel._determine_start_time(op, state['last_job_ops'],
state['last_mch_ops'], state['machine_infos'])
# Insert the operation at the correct position so that the entries remain sorted according to start_time
state['schedule'][op.machine_type].append((op, start_time, start_time + op.duration))
state['schedule'][op.machine_type] = sorted(state['schedule'][op.machine_type], key=lambda x: x[1])
# Update state
if state['last_job_ops'][op.job_id] < start_time + op.duration:
state['last_job_ops'][op.job_id] = start_time + op.duration
if state['last_mch_ops'][op.machine_type] < start_time + op.duration:
state['last_mch_ops'][op.machine_type] = start_time + op.duration
GNNJobShopModel._update_adj_matrix(state, op, flag)
GNNJobShopModel._update_features(state, op)
GNNJobShopModel._update_node_states(state, op)
possible = True
return state, possible
@staticmethod
def _update_adj_matrix(state, op, flag):
# Update the adjacency matrix after a new operation has been scheduled
pred, succ = get_op_nbghs(op, state['machine_infos'])
state['adj_matrix'][op.unique_op_id] = 0
state['adj_matrix'][op.unique_op_id, op.unique_op_id] = 1
state['adj_matrix'][op.unique_op_id, pred] = 1
state['adj_matrix'][succ, op.unique_op_id] = 1
if op.unique_op_id not in get_first_ops(state):
state['adj_matrix'][op.unique_op_id, op.unique_op_id - 1] = 1
# Remove the old arc when a new operation inserts between two operations
if flag and pred != op.unique_op_id and succ != op.unique_op_id:
state['adj_matrix'][succ, pred] = 0
@staticmethod
def _update_features(state, op):
# Update the operations' features after a new operation has been scheduled
lower_bounds = get_end_time_lbs(state['jobs'], state['machine_infos']) # recalculate lower bounds
finished = np.array([f[1] if i != op.unique_op_id
else 1 for i, f in enumerate(state['features'])]) # set op as finished
assert norm_coeff > 0, "The normalization coefficient has not been initialized"
state['features'] = np.concatenate((lower_bounds.reshape(-1, 1) / norm_coeff,
finished.reshape(-1, 1)), axis=1)
@staticmethod
def _update_node_states(state, op):
succ = op.unique_op_id + 1 if ((op.unique_op_id + 1) % len(state['jobs'][0]) != 0) else op.unique_op_id
if succ != op.unique_op_id:
state['node_states'][op.unique_op_id] = 0 # TODO node_states type changes -> fix
state['node_states'][succ] = 1 # TODO add -1 condition?
@staticmethod
def _determine_start_time(op: Operation, last_job_ops, last_mch_ops, machine_infos):
job_ready_time = last_job_ops[op.job_id] if last_job_ops[op.job_id] != -1 else 0
mch_ready_time = last_mch_ops[op.machine_type] if last_mch_ops[op.machine_type] != -1 else 0
# Whether the operation is scheduled between already scheduled operations (True) or in the end (False)
flag = False
# Positions between already scheduled operations on the machine required by the operation
possible_pos = np.where(job_ready_time < machine_infos[op.machine_type]['start_times'])[0]
if len(possible_pos) == 0:
# Not possible to schedule the operation between other operations -> put in the end
op_start_time = put_in_the_end(op, job_ready_time, mch_ready_time, machine_infos[op.machine_type])
else:
# Positions which fit the length of the operation (there is enough time before the next operation)
legal_pos_idx, legal_pos, possible_pos_end_times = get_legal_pos(op.duration, job_ready_time,
possible_pos,
machine_infos[op.machine_type])
if len(legal_pos) == 0:
# No position which can fit the operation -> put in the end
op_start_time = put_in_the_end(op, job_ready_time, mch_ready_time, machine_infos[op.machine_type])
else:
# Schedule the operation between other operations
op_start_time = put_in_between(op, legal_pos_idx, legal_pos, possible_pos_end_times,
machine_infos[op.machine_type])
flag = True
return op_start_time, flag
@staticmethod
def _is_done(remaining_ops):
for j in remaining_ops:
if len(j) > 0:
return False
return True
@staticmethod
def _makespan(schedule):
makespan = 0
for machine, machine_schedule in enumerate(schedule):
if len(machine_schedule) > 0:
_, _, end_time = machine_schedule[-1]
if end_time > makespan:
makespan = end_time
return makespan
@staticmethod
def _get_norm_coeff(max_duration, num_ops_per_job, num_jobs):
i = 10
while i < max_duration * num_ops_per_job * num_jobs:
i *= 10
return i
@staticmethod
def step(state, action):
new_state, possible = GNNJobShopModel._schedule_op(action, deepcopy(state))
reward = 0
if not possible:
reward = -1
done = GNNJobShopModel._is_done(new_state['remaining_ops'])
if done:
reward = - GNNJobShopModel._makespan(new_state['schedule'])
return new_state, reward, done
@staticmethod
def legal_actions(state):
return [job_id for job_id in range(len(state['remaining_ops'])) if
len(state['remaining_ops'][job_id]) > 0]
@staticmethod
def init_adj_matrix(num_ops, num_jobs):
# task ids for first column (array containing the first tasks for each job)
first_col = np.arange(start=0, stop=num_ops, step=1).reshape(num_jobs, -1)[:, 0]
# task ids for last column (array containing the last tasks for each job)
last_col = np.arange(start=0, stop=num_ops, step=1).reshape(num_jobs, -1)[:, -1]
# conjunctive arcs showing precedence relations between tasks of the same job
# np array with 1s on the row above the main diagonal and 0s everywhere else
conj_nei_up_stream = np.eye(num_ops, k=-1, dtype=np.single)
# np array with 1s on the row below the main diagonal and 0s everywhere else
conj_nei_low_stream = np.eye(num_ops, k=1, dtype=np.single)
# first column does not have upper stream conj_nei
conj_nei_up_stream[first_col] = 0
# last column does not have lower stream conj_nei
conj_nei_low_stream[last_col] = 0
# self edges for all nodes
# np array with 1s on the main diagonal and 0s everywhere else
self_as_nei = np.eye(num_ops, dtype=np.single)
adj = self_as_nei + conj_nei_up_stream
return adj
@staticmethod
def init_features(jobs):
durations = np.array([[op.duration for op in job] for job in jobs])
lower_bounds = np.cumsum(durations, axis=1, dtype=np.single) # lower bounds of operations' completion times
machine_types = np.array([[op.machine_type for op in job] for job in jobs])
finished_mark = np.zeros_like(machine_types, dtype=np.single) # 0 for unfinished, 1 for finished
global norm_coeff
norm_coeff = GNNJobShopModel._get_norm_coeff(max(durations.flatten()), len(jobs[0]), len(jobs))
# node features: normalized end time lower bounds and binary indicator of whether the action has been scheduled
features = np.concatenate((lower_bounds.reshape(-1, 1) / norm_coeff, # normalize the lower bounds
finished_mark.reshape(-1, 1)), axis=1) # 1 if scheduled, 0 otherwise
return features
[16]:
class GNNJobShopModelEnv(gym.Env):
    """
    Gymnasium environment around GNNJobShopModel for a fixed job shop instance.

    An action is the index of a job; taking it schedules the next remaining operation
    of that job. Observations are the state dictionaries of the model.
    """

    def _jsp_instance_adapter(self, jsp_instance):
        """
        Converts a job shop instance into the initial state dictionary of the model.

        :param jsp_instance: array of shape (2, n_jobs, n_machines); jsp_instance[0] is read
        as the machine of every operation and jsp_instance[1] as its processing time
        :returns: state dictionary of the unscheduled problem
        """
        _, n_jobs, n_machines = jsp_instance.shape
        machine_order = jsp_instance[0]
        processing_times = jsp_instance[1]
        # Every job has one operation per machine. Defined before the loop so that it
        # is also available when there are no jobs to iterate over.
        num_ops_per_job = n_machines

        remaining_operations = []
        unique_op_id = 0
        for i in range(n_jobs):
            job = []
            for j in range(num_ops_per_job):
                job.append(
                    Operation(
                        i, j,
                        unique_op_id,
                        machine_order[i][j],  # machine_type
                        processing_times[i][j]  # duration
                    )
                )
                unique_op_id += 1
            remaining_operations.append(job)

        schedule = [[] for _ in range(n_machines)]
        num_ops = n_jobs * n_machines

        # Number of operations scheduled on each machine
        ops_per_machine = [len([op for job in remaining_operations for op in job if op.machine_type == m]) for m in
                           range(n_machines)]

        # Information for each machine: the ids of the operations scheduled on it (in the scheduled order), and the
        # corresponding start and end times
        machine_infos = {m: {'op_ids': -1 * np.ones(ops_per_machine[m], dtype=np.int32),
                             'start_times': -1 * np.ones(ops_per_machine[m], dtype=np.int32),
                             'end_times': -1 * np.ones(ops_per_machine[m], dtype=np.int32)} for m in
                         range(n_machines)}

        # Time at which the last scheduled operation ends for each job
        last_job_ops = [-1 for _ in range(n_jobs)]
        # Time at which the last scheduled operation ends on each machine
        last_machine_ops = [-1 for _ in range(n_machines)]

        jobs = deepcopy(remaining_operations)
        adj_matrix = GNNJobShopModel.init_adj_matrix(num_ops, n_jobs)
        features = GNNJobShopModel.init_features(jobs)
        node_states = np.array([1 if i % num_ops_per_job == 0 else 0 for i in range(num_ops)],
                               dtype=np.single)

        return {'remaining_ops': remaining_operations, 'schedule': schedule, 'machine_infos': machine_infos,
                'last_job_ops': last_job_ops, 'last_mch_ops': last_machine_ops, 'adj_matrix': adj_matrix,
                'features': features, 'node_states': node_states, 'jobs': jobs}

    def __init__(self, jsp_instance: np.ndarray, **kwargs):
        """
        :param jsp_instance: array of shape (2, n_jobs, n_machines), see _jsp_instance_adapter
        :param kwargs: accepted but not used
        """
        self.model = GNNJobShopModel()

        _, n_jobs, n_machines = jsp_instance.shape
        self.n_jobs = n_jobs
        self.n_machines = n_machines

        self.state = self._jsp_instance_adapter(jsp_instance)
        # Independent snapshot, so that changes to the current state can never leak
        # into the state that reset() restores.
        self._initial_state = deepcopy(self.state)

        int32_max = np.iinfo(np.int32).max
        num_ops = len(self.state['node_states'])

        # Define the space for an Operation
        operation_space = gym.spaces.Tuple((
            gym.spaces.Discrete(int32_max),  # job_id
            gym.spaces.Discrete(int32_max),  # op_id
            gym.spaces.Discrete(int32_max),  # unique_op_id
            gym.spaces.Discrete(int32_max),  # machine_type
            gym.spaces.Discrete(int32_max)  # duration
        ))

        # Define the space for a ScheduledOperation
        scheduled_operation_space = gym.spaces.Tuple((
            operation_space,  # Operation
            gym.spaces.Discrete(int32_max),  # start_time
            gym.spaces.Discrete(int32_max)  # end_time
        ))

        def time_box(length):
            # -1 marks "not set yet", everything else is an id or a point in time
            return Box(low=-1, high=int32_max, shape=(length,), dtype=np.int32)

        # Shapes are derived from the instance instead of being hard-coded
        observation_space = gym.spaces.Dict({
            'adj_matrix': Box(low=-1.0, high=1.0, shape=(num_ops, num_ops), dtype=np.float32),
            'features': Box(low=-1.0, high=1.0, shape=(num_ops, 2), dtype=np.float32),
            'last_job_ops': time_box(self.n_jobs),
            'last_mch_ops': time_box(self.n_machines),
            'machine_infos': gym.spaces.Dict({
                key_idx: gym.spaces.Dict({
                    'end_times': time_box(len(infos['end_times'])),
                    'op_ids': time_box(len(infos['op_ids'])),
                    'start_times': time_box(len(infos['start_times'])),
                }) for key_idx, infos in self.state['machine_infos'].items()
            }),
            # 'remaining_ops': ,
            # NOTE(review): the real schedule is one variable-length list per machine,
            # which this fixed-size tuple does not describe exactly - confirm whether
            # any consumer relies on this entry.
            'schedule': gym.spaces.Tuple([
                gym.spaces.Tuple([scheduled_operation_space for _ in range(self.n_machines)]) for _ in
                range(self.n_jobs)
            ])
        })
        self.observation_space = observation_space

        # One action per job
        self.action_space = Discrete(self.n_jobs)
        self.done = False

    def set_state(self, state: dict):
        """
        Replaces the current state and recomputes the done flag from it.

        :param state: state dictionary of the model
        """
        self.state = state
        # Done exactly when no job has remaining operations. Checking the length of
        # state['remaining_ops'] only counts the jobs and is true for every state.
        self.done = self.model._is_done(state['remaining_ops'])

    def step(self, action: ActType) -> tuple[ObsType, SupportsFloat, bool, bool, dict[str, Any]]:
        """
        Schedules the next operation of the job given by the action.

        :param action: index of the job
        :returns: tuple (state, reward, terminated, truncated, info); truncated is always
        False. info['makespan'] is the negated reward, which is the makespan only on the
        step that completes the schedule.
        """
        self.state, reward, self.done = self.model.step(self.state, action)
        return self.state, reward, self.done, False, {'makespan': - reward}

    def render(self) -> None:
        """
        Prints the current schedule as a gantt chart on the console, followed by the
        latest finish time of all scheduled operations.
        """
        allocation = []
        latest_finish_time = 0
        for mache_ops in self.state['schedule']:
            if not mache_ops:
                continue
            for ops_elem, start_time, finish_time in mache_ops:
                entry = {
                    'Task': f'Job {ops_elem.job_id}',
                    'Start': start_time,
                    'Finish': finish_time,
                    'Resource': f'Machine {ops_elem.machine_type}'
                }
                latest_finish_time = max(finish_time, latest_finish_time)
                allocation.append(entry)

        df = pd.DataFrame(allocation)
        num_of_machines = self.n_machines
        gantt_chart_console(df, num_of_machines)
        print(f'Makespan: {latest_finish_time}')

    def get_state(self) -> dict:
        """
        :returns: the current state dictionary (not a copy)
        """
        return self.state

    def reset(
            self,
            *,
            seed: int | None = None,
            options: dict[str, Any] | None = None,
    ) -> tuple[ObsType, dict[str, Any]]:
        """
        Restores the unscheduled initial state.

        :param seed: forwarded to gym.Env.reset
        :param options: not used
        :returns: tuple (state, info) with an empty info dictionary
        """
        super().reset(seed=seed)
        # Hand out a copy so that callers cannot alter the stored initial state
        self.set_state(deepcopy(self._initial_state))
        return self.state, {}

    def get_legal_action_mask(self) -> list[bool]:
        """
        :returns: one boolean per action, True if the job still has remaining operations
        """
        legal_action_mask = [False] * self.action_space.n
        for action in self.model.legal_actions(self.state):
            legal_action_mask[action] = True
        return legal_action_mask
[17]:
# Example run: solve the ft06 instance with the GymctsAgent using the deepcopy wrapper.
# NOTE(review): the indentation of this cell was lost in the export. It cannot be told
# from the text whether the final render() call belongs to the loop over the actions -
# confirm against the original notebook before re-indenting.
if __name__ == '__main__':
# presumably a standard logging.Logger, where level 20 is INFO - TODO confirm
log.setLevel(20)
# model = GNNJobShopModel()
# jsp_state = model.random_problem(6, 6, 6)
# print(pprint.pformat(jsp_state))
# Build the environment for the ft06 instance
env = GNNJobShopModelEnv(
jsp_instance=ft06,
)
env.reset()
# Reward shaping: normalise the rewards first, then divide them by 36
# NOTE(review): 36 presumably is the number of operations of ft06 (6 x 6) - confirm
env = NormalizeReward(env, gamma=0.99, epsilon=1e-8)
env = TransformReward(env, lambda r: r / 36)
# The mask is read from the innermost env, because the reward wrappers around it
# do not provide get_legal_action_mask themselves
def mask_fn(env: gym.Env) -> np.ndarray:
# Do whatever you'd like in this function to return the action mask
# for the current env. In this example, we assume the env has a
# helpful method we can rely on.
return env.unwrapped.get_legal_action_mask()
# Wrap the env for the MCTS agent and pass the action mask function along
env = DeepCopyMCTSGymEnvWrapper(
env,
action_mask_fn=mask_fn
)
# 125 simulations per step; the search tree is kept between steps and rendered after each step
agent = GymctsAgent(
env=env,
clear_mcts_tree_after_step=False,
render_tree_after_step=True,
exclude_unvisited_nodes_from_render=True,
number_of_simulations_per_step=125,
)
# root is not used again within this cell
root = agent.search_root_node.get_root()
actions = agent.solve(render_tree_after_step=True)
# Replay the actions found by the agent on a freshly reset env and render the schedule
env.reset()
for a in actions:
obs, rew, term, trun, info = env.step(a)
env.unwrapped.render()
(N=125, Q_v=-0.17, best=-0.17)
├── (a=0, N=21, Q_v=-0.17, best=-0.17, ubc=0.17)
│ ├── (a=0, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.45)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.45)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=4, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=5, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
├── (a=1, N=21, Q_v=-0.17, best=-0.17, ubc=0.17)
│ ├── (a=0, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.45)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.45)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=4, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=5, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
├── (a=2, N=20, Q_v=-0.17, best=-0.17, ubc=0.18)
│ ├── (a=0, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=1, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=2, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.44)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=5, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
├── (a=3, N=21, Q_v=-0.17, best=-0.17, ubc=0.17)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.45)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.45)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=4, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=5, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
├── (a=4, N=20, Q_v=-0.17, best=-0.17, ubc=0.18)
│ ├── (a=0, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=1, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=2, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=3, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.44)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
└── (a=5, N=21, Q_v=-0.17, best=-0.17, ubc=0.17)
├── (a=0, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
├── (a=1, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
├── (a=2, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.45)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.45)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=3, Q_v=-0.17, best=-0.17, ubc=0.54)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
└── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
[17:00:58] INFO selected action 5 after 125 simulations.
INFO current action list: [5]
(a=5, N=146, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
├── (a=4, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
[17:01:05] INFO selected action 5 after 125 simulations.
INFO current action list: [5, 5]
(a=5, N=150, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
├── (a=4, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
[17:01:11] INFO selected action 5 after 125 simulations.
INFO current action list: [5, 5, 5]
(a=5, N=150, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
[17:01:18] INFO selected action 1 after 125 simulations.
INFO current action list: [5, 5, 5, 1]
(a=1, N=150, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
[17:01:25] INFO selected action 1 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1]
(a=1, N=150, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
[17:01:31] INFO selected action 2 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2]
(a=2, N=150, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
├── (a=0, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
[17:01:37] INFO selected action 3 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3]
(a=3, N=150, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
├── (a=3, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
[17:01:43] INFO selected action 0 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0]
(a=0, N=150, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
└── (a=5, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
[17:01:49] INFO selected action 1 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1]
(a=1, N=150, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
[17:01:54] INFO selected action 5 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5]
(a=5, N=150, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
[17:02:00] INFO selected action 3 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3]
(a=3, N=150, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
[17:02:05] INFO selected action 2 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2]
(a=2, N=150, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
[17:02:10] INFO selected action 3 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3]
(a=3, N=150, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
[17:02:15] INFO selected action 4 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4]
(a=4, N=150, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
├── (a=3, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
[17:02:19] INFO selected action 3 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3]
(a=3, N=150, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
└── (a=5, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
[17:02:24] INFO selected action 3 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3]
(a=3, N=150, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=5, Q_v=-0.17, best=-0.17, ubc=0.40)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ ├── (a=1, N=5, Q_v=-0.17, best=-0.17, ubc=0.40)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ ├── (a=2, N=5, Q_v=-0.17, best=-0.17, ubc=0.40)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ ├── (a=4, N=5, Q_v=-0.17, best=-0.17, ubc=0.40)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
[17:02:28] INFO selected action 5 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5]
(a=5, N=150, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=2, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=3, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=5, Q_v=-0.17, best=-0.17, ubc=0.40)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ ├── (a=1, N=5, Q_v=-0.17, best=-0.17, ubc=0.40)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ ├── (a=2, N=5, Q_v=-0.17, best=-0.17, ubc=0.40)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ ├── (a=4, N=5, Q_v=-0.17, best=-0.17, ubc=0.40)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=4, N=24, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ │ └── (a=5, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=4, N=3, Q_v=-0.17, best=-0.17, ubc=0.56)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ │ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=5, N=4, Q_v=-0.17, best=-0.17, ubc=0.46)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
└── (a=5, N=25, Q_v=-0.17, best=-0.17, ubc=0.15)
├── (a=0, N=4, Q_v=-0.17, best=-0.17, ubc=0.47)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
│ └── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.66)
├── (a=1, N=5, Q_v=-0.17, best=-0.17, ubc=0.40)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
├── (a=2, N=5, Q_v=-0.17, best=-0.17, ubc=0.40)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
├── (a=3, N=5, Q_v=-0.17, best=-0.17, ubc=0.40)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
└── (a=4, N=5, Q_v=-0.17, best=-0.17, ubc=0.40)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
└── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
[17:02:32] INFO selected action 5 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5, 5]
(a=5, N=150, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=30, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.36)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.36)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.36)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.36)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=5, Q_v=-0.17, best=-0.17, ubc=0.41)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
├── (a=1, N=30, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.36)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=5, Q_v=-0.17, best=-0.17, ubc=0.41)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ └── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.36)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.36)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.36)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=30, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.36)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.36)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.36)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=5, Q_v=-0.17, best=-0.17, ubc=0.41)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.36)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=30, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=7, Q_v=-0.17, best=-0.17, ubc=0.32)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ ├── (a=1, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.85)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ ├── (a=2, N=7, Q_v=-0.17, best=-0.17, ubc=0.32)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ └── (a=4, N=7, Q_v=-0.17, best=-0.17, ubc=0.32)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
└── (a=4, N=29, Q_v=-0.17, best=-0.17, ubc=0.12)
├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.36)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.36)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.36)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=5, Q_v=-0.17, best=-0.17, ubc=0.41)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
└── (a=4, N=5, Q_v=-0.17, best=-0.17, ubc=0.41)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
└── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.73)
[17:02:36] INFO selected action 2 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5, 5, 2]
(a=2, N=155, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=30, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=7, Q_v=-0.17, best=-0.17, ubc=0.32)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ ├── (a=1, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.85)
│ ├── (a=2, N=7, Q_v=-0.17, best=-0.17, ubc=0.32)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ └── (a=4, N=7, Q_v=-0.17, best=-0.17, ubc=0.32)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
└── (a=4, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
└── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
└── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
[17:02:40] INFO selected action 1 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5, 5, 2, 1]
(a=1, N=156, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ ├── (a=1, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ ├── (a=2, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.85)
│ └── (a=4, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.85)
└── (a=4, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
└── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
└── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
[17:02:43] INFO selected action 2 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5, 5, 2, 1, 2]
(a=2, N=156, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.85)
│ ├── (a=1, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.85)
│ ├── (a=2, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ └── (a=4, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
└── (a=4, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
└── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
└── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
[17:02:46] INFO selected action 0 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5, 5, 2, 1, 2, 0]
(a=0, N=156, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.85)
│ ├── (a=1, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.85)
│ ├── (a=2, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ └── (a=4, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
└── (a=4, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
└── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
└── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
[17:02:49] INFO selected action 0 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5, 5, 2, 1, 2, 0, 0]
(a=0, N=156, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ ├── (a=1, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.85)
│ ├── (a=2, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.85)
│ └── (a=4, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
└── (a=4, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
└── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
└── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
[17:02:52] INFO selected action 1 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5, 5, 2, 1, 2, 0, 0, 1]
(a=1, N=156, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=3, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.85)
│ ├── (a=2, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=3, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.85)
│ ├── (a=3, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ └── (a=4, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ └── (a=4, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
├── (a=2, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.85)
│ ├── (a=1, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=0, N=3, Q_v=-0.17, best=-0.17, ubc=0.42)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ ├── (a=2, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ └── (a=4, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
└── (a=4, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
└── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
└── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
[17:02:55] INFO selected action 0 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5, 5, 2, 1, 2, 0, 0, 1, 0]
(a=0, N=156, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=3, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.85)
│ ├── (a=2, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=3, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.85)
│ ├── (a=3, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ └── (a=4, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ └── (a=4, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
├── (a=2, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.85)
│ ├── (a=1, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=0, N=3, Q_v=-0.17, best=-0.17, ubc=0.42)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ ├── (a=2, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ └── (a=4, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
└── (a=4, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
└── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
└── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
[17:02:57] INFO selected action 0 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5, 5, 2, 1, 2, 0, 0, 1, 0, 0]
(a=0, N=156, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=0, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=1, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=2, N=3, Q_v=-0.17, best=-0.17, ubc=0.42)
│ │ ├── (a=3, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ ├── (a=2, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=3, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.85)
│ ├── (a=3, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ └── (a=4, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ └── (a=4, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
├── (a=1, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=2, N=3, Q_v=-0.17, best=-0.17, ubc=0.42)
│ │ ├── (a=3, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ ├── (a=2, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ ├── (a=3, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.85)
│ ├── (a=3, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ └── (a=4, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ └── (a=4, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
├── (a=2, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ │ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
│ ├── (a=0, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=1, N=3, Q_v=-0.17, best=-0.17, ubc=0.42)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ ├── (a=1, N=8, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ ├── (a=0, N=3, Q_v=-0.17, best=-0.17, ubc=0.42)
│ │ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ │ └── (a=4, N=2, Q_v=-0.17, best=-0.17, ubc=0.55)
│ ├── (a=2, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ │ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ │ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ │ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ └── (a=4, N=7, Q_v=-0.17, best=-0.17, ubc=0.33)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.53)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.82)
└── (a=4, N=31, Q_v=-0.17, best=-0.17, ubc=0.12)
├── (a=0, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
│ ├── (a=0, N=2, Q_v=-0.17, best=-0.17, ubc=0.50)
│ ├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ ├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
│ └── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
└── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.37)
├── (a=0, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=1, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=2, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
├── (a=3, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
└── (a=4, N=1, Q_v=-0.17, best=-0.17, ubc=0.78)
[17:03:00] INFO selected action 0 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5, 5, 2, 1, 2, 0, 0, 1, 0, 0, 0]
(a=0, N=156, Q_v=-0.17, best=-0.17, ubc=-0.03)
├── (a=1, N=39, Q_v=-0.17, best=-0.17, ubc=0.09)
│ ├── (a=2, N=13, Q_v=-0.17, best=-0.17, ubc=0.21)
│ │ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.40)
│ │ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.40)
│ │ └── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.40)
│ ├── (a=3, N=13, Q_v=-0.17, best=-0.17, ubc=0.21)
│ │ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.29)
│ └── (a=4, N=12, Q_v=-0.17, best=-0.17, ubc=0.22)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.39)
│ ├── (a=3, N=4, Q_v=-0.17, best=-0.17, ubc=0.39)
│ └── (a=4, N=3, Q_v=-0.17, best=-0.17, ubc=0.47)
├── (a=2, N=39, Q_v=-0.17, best=-0.17, ubc=0.09)
│ ├── (a=1, N=10, Q_v=-0.17, best=-0.17, ubc=0.26)
│ │ ├── (a=2, N=3, Q_v=-0.17, best=-0.17, ubc=0.45)
│ │ ├── (a=3, N=3, Q_v=-0.17, best=-0.17, ubc=0.45)
│ │ └── (a=4, N=3, Q_v=-0.17, best=-0.17, ubc=0.45)
│ ├── (a=2, N=10, Q_v=-0.17, best=-0.17, ubc=0.26)
│ │ ├── (a=1, N=3, Q_v=-0.17, best=-0.17, ubc=0.45)
│ │ ├── (a=3, N=3, Q_v=-0.17, best=-0.17, ubc=0.45)
│ │ └── (a=4, N=3, Q_v=-0.17, best=-0.17, ubc=0.45)
│ ├── (a=3, N=9, Q_v=-0.17, best=-0.17, ubc=0.28)
│ │ ├── (a=1, N=3, Q_v=-0.17, best=-0.17, ubc=0.44)
│ │ ├── (a=2, N=3, Q_v=-0.17, best=-0.17, ubc=0.44)
│ │ └── (a=4, N=2, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=4, N=9, Q_v=-0.17, best=-0.17, ubc=0.28)
│ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=3, N=2, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=4, N=2, Q_v=-0.17, best=-0.17, ubc=0.57)
├── (a=3, N=39, Q_v=-0.17, best=-0.17, ubc=0.09)
│ ├── (a=1, N=13, Q_v=-0.17, best=-0.17, ubc=0.21)
│ │ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.29)
│ │ └── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.29)
│ ├── (a=2, N=13, Q_v=-0.17, best=-0.17, ubc=0.21)
│ │ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.40)
│ │ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.40)
│ │ └── (a=4, N=4, Q_v=-0.17, best=-0.17, ubc=0.40)
│ └── (a=4, N=12, Q_v=-0.17, best=-0.17, ubc=0.22)
│ ├── (a=1, N=4, Q_v=-0.17, best=-0.17, ubc=0.39)
│ ├── (a=2, N=4, Q_v=-0.17, best=-0.17, ubc=0.39)
│ └── (a=4, N=3, Q_v=-0.17, best=-0.17, ubc=0.47)
└── (a=4, N=38, Q_v=-0.17, best=-0.17, ubc=0.09)
├── (a=1, N=10, Q_v=-0.17, best=-0.17, ubc=0.26)
│ ├── (a=2, N=3, Q_v=-0.17, best=-0.17, ubc=0.45)
│ ├── (a=3, N=3, Q_v=-0.17, best=-0.17, ubc=0.45)
│ └── (a=4, N=3, Q_v=-0.17, best=-0.17, ubc=0.45)
├── (a=2, N=9, Q_v=-0.17, best=-0.17, ubc=0.28)
│ ├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.57)
│ ├── (a=3, N=2, Q_v=-0.17, best=-0.17, ubc=0.57)
│ └── (a=4, N=2, Q_v=-0.17, best=-0.17, ubc=0.57)
├── (a=3, N=9, Q_v=-0.17, best=-0.17, ubc=0.28)
│ ├── (a=1, N=3, Q_v=-0.17, best=-0.17, ubc=0.44)
│ ├── (a=2, N=3, Q_v=-0.17, best=-0.17, ubc=0.44)
│ └── (a=4, N=2, Q_v=-0.17, best=-0.17, ubc=0.57)
└── (a=4, N=9, Q_v=-0.17, best=-0.17, ubc=0.28)
├── (a=1, N=2, Q_v=-0.17, best=-0.17, ubc=0.57)
├── (a=2, N=2, Q_v=-0.17, best=-0.17, ubc=0.57)
├── (a=3, N=2, Q_v=-0.17, best=-0.17, ubc=0.57)
└── (a=4, N=2, Q_v=-0.17, best=-0.17, ubc=0.57)
[17:03:02] INFO selected action 1 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5, 5, 2, 1, 2, 0, 0, 1, 0, 0, 0, 1]
(a=1, N=164, Q_v=-0.17, best=-0.17, ubc=-0.04)
├── (a=2, N=55, Q_v=-0.17, best=-0.17, ubc=0.05)
│ ├── (a=2, N=18, Q_v=-0.17, best=-0.17, ubc=0.16)
│ │ ├── (a=3, N=9, Q_v=-0.17, best=-0.17, ubc=0.23)
│ │ └── (a=4, N=8, Q_v=-0.17, best=-0.17, ubc=0.26)
│ ├── (a=3, N=18, Q_v=-0.17, best=-0.17, ubc=0.16)
│ │ ├── (a=2, N=9, Q_v=-0.17, best=-0.17, ubc=0.23)
│ │ └── (a=4, N=8, Q_v=-0.17, best=-0.17, ubc=0.26)
│ └── (a=4, N=18, Q_v=-0.17, best=-0.17, ubc=0.16)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.32)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.32)
│ └── (a=4, N=5, Q_v=-0.17, best=-0.17, ubc=0.37)
├── (a=3, N=54, Q_v=-0.17, best=-0.17, ubc=0.05)
│ ├── (a=2, N=27, Q_v=-0.17, best=-0.17, ubc=0.10)
│ │ ├── (a=2, N=13, Q_v=-0.17, best=-0.17, ubc=0.19)
│ │ └── (a=4, N=13, Q_v=-0.17, best=-0.17, ubc=0.19)
│ └── (a=4, N=26, Q_v=-0.17, best=-0.17, ubc=0.11)
│ ├── (a=2, N=13, Q_v=-0.17, best=-0.17, ubc=0.18)
│ └── (a=4, N=12, Q_v=-0.17, best=-0.17, ubc=0.20)
└── (a=4, N=54, Q_v=-0.17, best=-0.17, ubc=0.05)
├── (a=2, N=18, Q_v=-0.17, best=-0.17, ubc=0.16)
│ ├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.32)
│ ├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.32)
│ └── (a=4, N=5, Q_v=-0.17, best=-0.17, ubc=0.37)
├── (a=3, N=18, Q_v=-0.17, best=-0.17, ubc=0.16)
│ ├── (a=2, N=9, Q_v=-0.17, best=-0.17, ubc=0.23)
│ └── (a=4, N=8, Q_v=-0.17, best=-0.17, ubc=0.26)
└── (a=4, N=17, Q_v=-0.17, best=-0.17, ubc=0.17)
├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.32)
├── (a=3, N=5, Q_v=-0.17, best=-0.17, ubc=0.36)
└── (a=4, N=5, Q_v=-0.17, best=-0.17, ubc=0.36)
[17:03:03] INFO selected action 2 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5, 5, 2, 1, 2, 0, 0, 1, 0, 0, 0, 1, 2]
(a=2, N=180, Q_v=-0.17, best=-0.17, ubc=-0.04)
├── (a=2, N=60, Q_v=-0.17, best=-0.17, ubc=0.04)
│ ├── (a=3, N=30, Q_v=-0.17, best=-0.17, ubc=0.09)
│ │ └── (a=4, N=29, Q_v=-0.17, best=-0.17, ubc=0.07)
│ └── (a=4, N=29, Q_v=-0.17, best=-0.17, ubc=0.10)
│ ├── (a=3, N=14, Q_v=-0.17, best=-0.17, ubc=0.18)
│ └── (a=4, N=14, Q_v=-0.17, best=-0.17, ubc=0.18)
├── (a=3, N=60, Q_v=-0.17, best=-0.17, ubc=0.04)
│ ├── (a=2, N=30, Q_v=-0.17, best=-0.17, ubc=0.09)
│ │ └── (a=4, N=29, Q_v=-0.17, best=-0.17, ubc=0.07)
│ └── (a=4, N=29, Q_v=-0.17, best=-0.17, ubc=0.10)
│ ├── (a=2, N=14, Q_v=-0.17, best=-0.17, ubc=0.18)
│ └── (a=4, N=14, Q_v=-0.17, best=-0.17, ubc=0.18)
└── (a=4, N=59, Q_v=-0.17, best=-0.17, ubc=0.04)
├── (a=2, N=20, Q_v=-0.17, best=-0.17, ubc=0.15)
│ ├── (a=3, N=10, Q_v=-0.17, best=-0.17, ubc=0.22)
│ └── (a=4, N=9, Q_v=-0.17, best=-0.17, ubc=0.24)
├── (a=3, N=19, Q_v=-0.17, best=-0.17, ubc=0.16)
│ ├── (a=2, N=9, Q_v=-0.17, best=-0.17, ubc=0.24)
│ └── (a=4, N=9, Q_v=-0.17, best=-0.17, ubc=0.24)
└── (a=4, N=19, Q_v=-0.17, best=-0.17, ubc=0.16)
├── (a=2, N=6, Q_v=-0.17, best=-0.17, ubc=0.33)
├── (a=3, N=6, Q_v=-0.17, best=-0.17, ubc=0.33)
└── (a=4, N=6, Q_v=-0.17, best=-0.17, ubc=0.33)
INFO selected action 2 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5, 5, 2, 1, 2, 0, 0, 1, 0, 0, 0, 1, 2, 2]
(a=2, N=185, Q_v=-0.17, best=-0.17, ubc=-0.04)
├── (a=3, N=92, Q_v=-0.17, best=-0.17, ubc=-0.00)
│ └── (a=4, N=91, Q_v=-0.17, best=-0.17, ubc=-0.01)
│ └── (a=4, N=90, Q_v=-0.17, best=-0.17, ubc=-0.01)
└── (a=4, N=92, Q_v=-0.17, best=-0.17, ubc=-0.00)
├── (a=3, N=46, Q_v=-0.17, best=-0.17, ubc=0.05)
│ └── (a=4, N=45, Q_v=-0.17, best=-0.17, ubc=0.04)
└── (a=4, N=45, Q_v=-0.17, best=-0.17, ubc=0.06)
├── (a=3, N=22, Q_v=-0.17, best=-0.17, ubc=0.13)
└── (a=4, N=22, Q_v=-0.17, best=-0.17, ubc=0.13)
INFO selected action 3 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5, 5, 2, 1, 2, 0, 0, 1, 0, 0, 0, 1, 2, 2, 3]
(a=3, N=217, Q_v=-0.17, best=-0.17, ubc=-0.05)
└── (a=4, N=216, Q_v=-0.17, best=-0.17, ubc=-0.06)
└── (a=4, N=215, Q_v=-0.17, best=-0.17, ubc=-0.06)
└── (a=4, N=214, Q_v=-0.17, best=-0.17, ubc=-0.06)
[17:03:04] INFO selected action 4 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5, 5, 2, 1, 2, 0, 0, 1, 0, 0, 0, 1, 2, 2, 3, 4]
(a=4, N=341, Q_v=-0.17, best=-0.17, ubc=-0.08)
└── (a=4, N=340, Q_v=-0.17, best=-0.17, ubc=-0.08)
└── (a=4, N=339, Q_v=-0.17, best=-0.17, ubc=-0.08)
└── (a=4, N=338, Q_v=-0.17, best=-0.17, ubc=-0.08)
INFO selected action 4 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5, 5, 2, 1, 2, 0, 0, 1, 0, 0, 0, 1, 2, 2, 3, 4, 4]
(a=4, N=465, Q_v=-0.17, best=-0.17, ubc=-0.09)
└── (a=4, N=464, Q_v=-0.17, best=-0.17, ubc=-0.09)
└── (a=4, N=463, Q_v=-0.17, best=-0.17, ubc=-0.09)
└── (a=4, N=462, Q_v=-0.17, best=-0.17, ubc=-0.09)
INFO selected action 4 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5, 5, 2, 1, 2, 0, 0, 1, 0, 0, 0, 1, 2, 2, 3, 4, 4, 4]
(a=4, N=589, Q_v=-0.17, best=-0.17, ubc=-0.10)
└── (a=4, N=588, Q_v=-0.17, best=-0.17, ubc=-0.10)
└── (a=4, N=587, Q_v=-0.17, best=-0.17, ubc=-0.10)
INFO selected action 4 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5, 5, 2, 1, 2, 0, 0, 1, 0, 0, 0, 1, 2, 2, 3, 4, 4, 4, 4]
(a=4, N=713, Q_v=-0.17, best=-0.17, ubc=-0.10)
└── (a=4, N=712, Q_v=-0.17, best=-0.17, ubc=-0.10)
INFO selected action 4 after 125 simulations.
INFO current action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5, 5, 2, 1, 2, 0, 0, 1, 0, 0, 0, 1, 2, 2, 3, 4, 4, 4, 4, 4]
INFO Final action list: [5, 5, 5, 1, 1, 2, 3, 0, 1, 5, 3, 2, 3, 4, 3, 3, 5, 5, 2, 1, 2, 0, 0, 1, 0, 0, 0, 1, 2, 2, 3, 4, 4, 4, 4, 4]
╔═══════════════════════════════════════════════════════╗
Job 0 ║ ████ ████████████ ███ █████ ║ Machine 0 █
Job 1 ║ ███████████████████████████████ █████████████ ║ Machine 1 █
Job 2 ║█████ ████ ████████ █████████ ███████║ Machine 2 █
Job 3 ║ ████ ████████████████████████████ ║ Machine 3 █
Job 4 ║ ███████████ █████ ████ ███ █ ║ Machine 4 █
Job 5 ║███████████████████████ ████ █ ║ Machine 5 █
╚╦════╤════╤════╤════╤════╦════╤════╤════╤════╤════╦════╝
0.0 27.3 54.5
Makespan: 59