graph-matrix-jsp-env (Deepcopy Wrapper)

[1]:
from graph_matrix_jsp_env.disjunctive_jsp_env import DisjunctiveGraphJspEnv
from jsp_instance_utils.instances import ft06, ft06_makespan



     ▐███▌         ▟███▛▟███████▛▐███▌
     ▐███▌        ▟███▛▟███████▛ ▐███▌
     ▐███▌ ▟███  ▟███▛    ▟███▛  ▐███▌
     ▐███▌▟████ ▟███▛    ▟███▛   ▐███▌
     ▐██████▛▐█████▛    ▟████████▐█████████▛
     ▐█████▛ ▐████▛    ▟█████████▐████████▛


     ▐█▀▜▙█▙   ███████▐█ ▐█    ▟█▙   ▟█▙  ▟███▐█ ▐█▐█▀▀▐█▙ █
     ▐█▄▟▛▜█▙▟▙██ ▐█  ▐████   ▟▛ ▜▙ ▟▛ ▜▙ █▍  ▐████▐█▀▀▐██▙█
     ▐█ ▜▙ ▜█▛▜██ ▐█  ▐█ ▐█  ▟█▛▀▜█▙█▛▀▜█▙▜███▐█ ▐█▐█▆▆▐█ ▜█
           ▐█  ▐█▐█▙ █▐███▜█▙ ▟███▀▀▐█▀▜▙▟█▀▜█▐███▐█████▙ ▟▛
           ▐█  ▐█▐██▙█ ▐█  ▜█▄█▛▐█▀▀▐█▄▟▛▜█▆▆▄ ▐█  ▐█  ▜█▄▛
            ▜███▛▐█ ▜█▐███  ▜█▛ ▐███▐█ ▜▙▐█▆▆▛▐███ ▐█   ██

    
    Graph Matrix Job Shop Problem Environment
    

    Version:    0.1.0
[2]:
from gymcts.gymcts_agent import GymctsAgent
from gymcts.gymcts_deepcopy_wrapper import DeepCopyMCTSGymEnvWrapper
from gymnasium.wrappers import TransformReward
from gymcts.logger import log
[3]:
import gymnasium as gym
import numpy as np
[4]:
if __name__ == '__main__':
    log.setLevel(20)


    env = DisjunctiveGraphJspEnv(
        jsp_instance=ft06,
        reward_function="makespan",
    )
    # map reward to [1, -inf]
    # ideally you want the reward to be in the range of [-1, 1] for the UBC score
    env = TransformReward(env, lambda r: r / ft06_makespan + 2 if r != 0 else 0.0)
    env.reset()



    def mask_fn(env: gym.Env) -> np.ndarray:
        # Do whatever you'd like in this function to return the action mask
        # for the current env. In this example, we assume the env has a
        # helpful method we can rely on.
        return env.unwrapped.valid_action_mask()

    env = DeepCopyMCTSGymEnvWrapper(
        env,
        action_mask_fn=mask_fn
    )


    agent = GymctsAgent(
        env=env,
        render_tree_after_step=True,
        exclude_unvisited_nodes_from_render=True,
        number_of_simulations_per_step=125,
    )

    root = agent.search_root_node.get_root()

    actions = agent.solve(render_tree_after_step=True)
    for a in actions:
        obs, rew, term, trun, info = env.step(a)

    env.render()
    makespan = env.unwrapped.get_makespan()
    print(f"makespan: {makespan}")
(N=125, Q_v=0.41, best=0.93)
├── (a=1, N=26, Q_v=0.45, best=0.80, ubc=0.76)
│   ├── (a=2, N=3, Q_v=0.33, best=0.53, ubc=1.06)
│   ├── (a=3, N=1, Q_v=0.38, best=0.38, ubc=1.12)
│   └── (a=13, N=1, Q_v=0.07, best=0.07, ubc=0.81)
│   ├── (a=7, N=4, Q_v=0.42, best=0.60, ubc=1.06)
│   ├── (a=2, N=1, Q_v=0.60, best=0.60, ubc=1.43)
│   ├── (a=8, N=1, Q_v=0.44, best=0.44, ubc=1.27)
│   └── (a=19, N=1, Q_v=0.56, best=0.56, ubc=1.40)
│   ├── (a=13, N=4, Q_v=0.45, best=0.55, ubc=1.09)
│   ├── (a=2, N=1, Q_v=0.29, best=0.29, ubc=1.12)
│   ├── (a=7, N=1, Q_v=0.47, best=0.47, ubc=1.31)
│   └── (a=14, N=1, Q_v=0.51, best=0.51, ubc=1.34)
│   ├── (a=19, N=4, Q_v=0.45, best=0.80, ubc=1.08)
│   ├── (a=2, N=1, Q_v=0.40, best=0.40, ubc=1.23)
│   ├── (a=7, N=1, Q_v=0.27, best=0.27, ubc=1.11)
│   └── (a=31, N=1, Q_v=0.31, best=0.31, ubc=1.14)
│   ├── (a=25, N=5, Q_v=0.47, best=0.62, ubc=1.04)
│   ├── (a=2, N=1, Q_v=0.51, best=0.51, ubc=1.41)
│   ├── (a=7, N=1, Q_v=0.62, best=0.62, ubc=1.52)
│   ├── (a=13, N=1, Q_v=0.40, best=0.40, ubc=1.30)
│   └── (a=19, N=1, Q_v=0.38, best=0.38, ubc=1.28)
│   └── (a=31, N=5, Q_v=0.56, best=0.78, ubc=1.13)
│       ├── (a=2, N=1, Q_v=0.47, best=0.47, ubc=1.37)
│       ├── (a=7, N=1, Q_v=0.53, best=0.53, ubc=1.42)
│       ├── (a=13, N=1, Q_v=0.51, best=0.51, ubc=1.41)
│       └── (a=19, N=1, Q_v=0.78, best=0.78, ubc=1.68)
├── (a=7, N=15, Q_v=0.34, best=0.65, ubc=0.74)
│   ├── (a=1, N=2, Q_v=0.31, best=0.38, ubc=1.13)
│   └── (a=2, N=1, Q_v=0.38, best=0.38, ubc=0.97)
│   ├── (a=8, N=2, Q_v=0.35, best=0.36, ubc=1.18)
│   └── (a=9, N=1, Q_v=0.35, best=0.35, ubc=0.93)
│   ├── (a=13, N=3, Q_v=0.30, best=0.42, ubc=0.97)
│   ├── (a=1, N=1, Q_v=0.11, best=0.11, ubc=0.85)
│   └── (a=14, N=1, Q_v=0.36, best=0.36, ubc=1.10)
│   ├── (a=19, N=2, Q_v=0.15, best=0.22, ubc=0.97)
│   └── (a=1, N=1, Q_v=0.07, best=0.07, ubc=0.66)
│   ├── (a=25, N=3, Q_v=0.53, best=0.65, ubc=1.21)
│   ├── (a=1, N=1, Q_v=0.65, best=0.65, ubc=1.40)
│   └── (a=19, N=1, Q_v=0.47, best=0.47, ubc=1.21)
│   └── (a=31, N=2, Q_v=0.35, best=0.49, ubc=1.17)
│       └── (a=19, N=1, Q_v=0.49, best=0.49, ubc=1.08)
├── (a=13, N=15, Q_v=0.36, best=0.93, ubc=0.76)
│   ├── (a=1, N=1, Q_v=0.02, best=0.02, ubc=1.18)
│   ├── (a=7, N=2, Q_v=0.23, best=0.53, ubc=1.05)
│   └── (a=19, N=1, Q_v=-0.07, best=-0.07, ubc=0.52)
│   ├── (a=14, N=3, Q_v=0.25, best=0.56, ubc=0.93)
│   ├── (a=1, N=1, Q_v=-0.11, best=-0.11, ubc=0.63)
│   └── (a=19, N=1, Q_v=0.56, best=0.56, ubc=1.30)
│   ├── (a=19, N=3, Q_v=0.55, best=0.93, ubc=1.22)
│   ├── (a=1, N=1, Q_v=0.33, best=0.33, ubc=1.07)
│   └── (a=7, N=1, Q_v=0.40, best=0.40, ubc=1.14)
│   ├── (a=25, N=3, Q_v=0.45, best=0.49, ubc=1.13)
│   ├── (a=1, N=1, Q_v=0.42, best=0.42, ubc=1.16)
│   └── (a=14, N=1, Q_v=0.49, best=0.49, ubc=1.23)
│   └── (a=31, N=2, Q_v=0.25, best=0.40, ubc=1.08)
│       └── (a=14, N=1, Q_v=0.40, best=0.40, ubc=0.99)
├── (a=19, N=27, Q_v=0.45, best=0.87, ubc=0.75)
│   ├── (a=1, N=5, Q_v=0.52, best=0.64, ubc=1.09)
│   ├── (a=2, N=1, Q_v=0.58, best=0.58, ubc=1.48)
│   ├── (a=7, N=1, Q_v=0.64, best=0.64, ubc=1.53)
│   ├── (a=13, N=1, Q_v=0.53, best=0.53, ubc=1.42)
│   └── (a=31, N=1, Q_v=0.56, best=0.56, ubc=1.46)
│   ├── (a=7, N=3, Q_v=0.30, best=0.73, ubc=1.04)
│   ├── (a=1, N=1, Q_v=0.36, best=0.36, ubc=1.10)
│   └── (a=8, N=1, Q_v=-0.18, best=-0.18, ubc=0.56)
│   ├── (a=13, N=7, Q_v=0.54, best=0.87, ubc=1.03)
│   ├── (a=1, N=1, Q_v=0.75, best=0.75, ubc=1.73)
│   ├── (a=7, N=1, Q_v=0.69, best=0.69, ubc=1.68)
│   ├── (a=14, N=1, Q_v=0.87, best=0.87, ubc=1.86)
│   ├── (a=20, N=1, Q_v=0.49, best=0.49, ubc=1.48)
│   ├── (a=25, N=1, Q_v=0.25, best=0.25, ubc=1.24)
│   └── (a=31, N=1, Q_v=0.22, best=0.22, ubc=1.20)
│   ├── (a=20, N=4, Q_v=0.46, best=0.75, ubc=1.11)
│   ├── (a=1, N=1, Q_v=0.42, best=0.42, ubc=1.25)
│   ├── (a=7, N=1, Q_v=0.31, best=0.31, ubc=1.14)
│   └── (a=25, N=1, Q_v=0.38, best=0.38, ubc=1.21)
│   ├── (a=25, N=4, Q_v=0.47, best=0.62, ubc=1.11)
│   ├── (a=1, N=1, Q_v=0.45, best=0.45, ubc=1.29)
│   ├── (a=7, N=1, Q_v=0.51, best=0.51, ubc=1.34)
│   └── (a=13, N=1, Q_v=0.31, best=0.31, ubc=1.14)
│   └── (a=31, N=3, Q_v=0.30, best=0.33, ubc=1.04)
│       ├── (a=1, N=1, Q_v=0.31, best=0.31, ubc=1.05)
│       └── (a=7, N=1, Q_v=0.33, best=0.33, ubc=1.07)
├── (a=25, N=18, Q_v=0.38, best=0.78, ubc=0.74)
│   ├── (a=1, N=2, Q_v=0.21, best=0.27, ubc=1.06)
│   └── (a=26, N=1, Q_v=0.15, best=0.15, ubc=0.73)
│   ├── (a=7, N=3, Q_v=0.42, best=0.58, ubc=1.12)
│   ├── (a=1, N=1, Q_v=0.58, best=0.58, ubc=1.32)
│   └── (a=26, N=1, Q_v=0.42, best=0.42, ubc=1.16)
│   ├── (a=13, N=4, Q_v=0.54, best=0.78, ubc=1.14)
│   ├── (a=1, N=1, Q_v=0.40, best=0.40, ubc=1.23)
│   ├── (a=7, N=1, Q_v=0.78, best=0.78, ubc=1.61)
│   └── (a=14, N=1, Q_v=0.36, best=0.36, ubc=1.20)
│   ├── (a=19, N=2, Q_v=0.21, best=0.35, ubc=1.06)
│   └── (a=13, N=1, Q_v=0.35, best=0.35, ubc=0.93)
│   ├── (a=26, N=3, Q_v=0.42, best=0.62, ubc=1.11)
│   ├── (a=1, N=1, Q_v=0.31, best=0.31, ubc=1.05)
│   └── (a=27, N=1, Q_v=0.33, best=0.33, ubc=1.07)
│   └── (a=31, N=3, Q_v=0.27, best=0.42, ubc=0.97)
│       ├── (a=1, N=1, Q_v=0.20, best=0.20, ubc=0.94)
│       └── (a=19, N=1, Q_v=0.20, best=0.20, ubc=0.94)
└── (a=31, N=23, Q_v=0.44, best=0.82, ubc=0.77)
    ├── (a=1, N=5, Q_v=0.59, best=0.76, ubc=1.15)
    ├── (a=2, N=1, Q_v=0.62, best=0.62, ubc=1.52)
    ├── (a=7, N=1, Q_v=0.35, best=0.35, ubc=1.24)
    ├── (a=13, N=1, Q_v=0.51, best=0.51, ubc=1.41)
    └── (a=25, N=1, Q_v=0.76, best=0.76, ubc=1.66)
    ├── (a=7, N=3, Q_v=0.40, best=0.82, ubc=1.12)
    ├── (a=1, N=1, Q_v=0.64, best=0.64, ubc=1.38)
    └── (a=13, N=1, Q_v=-0.25, best=-0.25, ubc=0.49)
    ├── (a=13, N=3, Q_v=0.31, best=0.60, ubc=1.03)
    ├── (a=1, N=1, Q_v=0.33, best=0.33, ubc=1.07)
    └── (a=7, N=1, Q_v=0.00, best=0.00, ubc=0.74)
    ├── (a=19, N=3, Q_v=0.41, best=0.64, ubc=1.13)
    ├── (a=1, N=1, Q_v=0.64, best=0.64, ubc=1.38)
    └── (a=13, N=1, Q_v=0.33, best=0.33, ubc=1.07)
    ├── (a=25, N=4, Q_v=0.44, best=0.71, ubc=1.07)
    ├── (a=1, N=1, Q_v=0.49, best=0.49, ubc=1.32)
    ├── (a=7, N=1, Q_v=0.24, best=0.24, ubc=1.07)
    └── (a=13, N=1, Q_v=0.33, best=0.33, ubc=1.16)
    └── (a=32, N=4, Q_v=0.39, best=0.73, ubc=1.01)
        ├── (a=1, N=1, Q_v=0.73, best=0.73, ubc=1.56)
        ├── (a=7, N=1, Q_v=0.15, best=0.15, ubc=0.98)
        └── (a=13, N=1, Q_v=0.33, best=0.33, ubc=1.16)
[16:53:18] INFO     selected action 1 after 125 simulations.
           INFO     current action list: [1]
(N=125, Q_v=0.40, best=0.84)
├── (a=2, N=17, Q_v=0.36, best=0.62, ubc=0.73)
├── (a=3, N=3, Q_v=0.42, best=0.60, ubc=1.11)
├── (a=4, N=1, Q_v=0.60, best=0.60, ubc=1.34)
└── (a=7, N=1, Q_v=0.25, best=0.25, ubc=1.00)
├── (a=7, N=2, Q_v=0.25, best=0.29, ubc=1.09)
└── (a=25, N=1, Q_v=0.20, best=0.20, ubc=0.79)
├── (a=13, N=2, Q_v=0.13, best=0.25, ubc=0.97)
└── (a=7, N=1, Q_v=0.00, best=0.00, ubc=0.59)
├── (a=19, N=3, Q_v=0.55, best=0.60, ubc=1.23)
├── (a=3, N=1, Q_v=0.58, best=0.58, ubc=1.32)
└── (a=25, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=25, N=3, Q_v=0.27, best=0.47, ubc=0.96)
├── (a=3, N=1, Q_v=-0.04, best=-0.04, ubc=0.70)
└── (a=13, N=1, Q_v=0.38, best=0.38, ubc=1.12)
└── (a=31, N=3, Q_v=0.53, best=0.62, ubc=1.21)
    ├── (a=3, N=1, Q_v=0.36, best=0.36, ubc=1.10)
    └── (a=7, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=7, N=14, Q_v=0.31, best=0.56, ubc=0.73)
├── (a=2, N=2, Q_v=0.31, best=0.33, ubc=1.12)
└── (a=25, N=1, Q_v=0.29, best=0.29, ubc=0.88)
├── (a=8, N=2, Q_v=0.25, best=0.38, ubc=1.07)
└── (a=19, N=1, Q_v=0.13, best=0.13, ubc=0.72)
├── (a=13, N=3, Q_v=0.51, best=0.56, ubc=1.17)
├── (a=2, N=1, Q_v=0.51, best=0.51, ubc=1.25)
└── (a=31, N=1, Q_v=0.56, best=0.56, ubc=1.30)
├── (a=19, N=2, Q_v=0.15, best=0.27, ubc=0.97)
└── (a=13, N=1, Q_v=0.27, best=0.27, ubc=0.86)
├── (a=25, N=2, Q_v=0.24, best=0.55, ubc=1.05)
└── (a=2, N=1, Q_v=-0.07, best=-0.07, ubc=0.52)
└── (a=31, N=2, Q_v=0.26, best=0.31, ubc=1.08)
    └── (a=13, N=1, Q_v=0.31, best=0.31, ubc=0.90)
├── (a=13, N=26, Q_v=0.43, best=0.82, ubc=0.73)
├── (a=2, N=4, Q_v=0.39, best=0.65, ubc=1.02)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=7, N=1, Q_v=0.38, best=0.38, ubc=1.21)
└── (a=14, N=1, Q_v=0.09, best=0.09, ubc=0.92)
├── (a=7, N=3, Q_v=0.33, best=0.42, ubc=1.07)
├── (a=2, N=1, Q_v=0.25, best=0.25, ubc=1.00)
└── (a=19, N=1, Q_v=0.33, best=0.33, ubc=1.07)
├── (a=14, N=6, Q_v=0.55, best=0.82, ubc=1.07)
├── (a=2, N=1, Q_v=0.36, best=0.36, ubc=1.31)
├── (a=7, N=1, Q_v=0.55, best=0.55, ubc=1.49)
├── (a=15, N=1, Q_v=0.73, best=0.73, ubc=1.67)
├── (a=19, N=1, Q_v=0.82, best=0.82, ubc=1.76)
└── (a=25, N=1, Q_v=0.33, best=0.33, ubc=1.27)
├── (a=19, N=5, Q_v=0.48, best=0.55, ubc=1.05)
├── (a=2, N=1, Q_v=0.45, best=0.45, ubc=1.35)
├── (a=7, N=1, Q_v=0.44, best=0.44, ubc=1.33)
├── (a=14, N=1, Q_v=0.45, best=0.45, ubc=1.35)
└── (a=20, N=1, Q_v=0.55, best=0.55, ubc=1.44)
├── (a=25, N=3, Q_v=0.34, best=0.55, ubc=1.08)
├── (a=2, N=1, Q_v=0.05, best=0.05, ubc=0.80)
└── (a=14, N=1, Q_v=0.42, best=0.42, ubc=1.16)
└── (a=31, N=4, Q_v=0.40, best=0.73, ubc=1.04)
    ├── (a=2, N=1, Q_v=0.22, best=0.22, ubc=1.05)
    ├── (a=7, N=1, Q_v=0.29, best=0.29, ubc=1.12)
    └── (a=32, N=1, Q_v=0.73, best=0.73, ubc=1.56)
├── (a=19, N=28, Q_v=0.45, best=0.84, ubc=0.74)
├── (a=2, N=4, Q_v=0.36, best=0.64, ubc=1.01)
├── (a=3, N=1, Q_v=0.35, best=0.35, ubc=1.18)
├── (a=7, N=1, Q_v=0.11, best=0.11, ubc=0.94)
└── (a=13, N=1, Q_v=0.64, best=0.64, ubc=1.47)
├── (a=7, N=5, Q_v=0.51, best=0.80, ubc=1.09)
├── (a=2, N=1, Q_v=0.65, best=0.65, ubc=1.55)
├── (a=8, N=1, Q_v=0.33, best=0.33, ubc=1.22)
├── (a=13, N=1, Q_v=0.31, best=0.31, ubc=1.21)
└── (a=20, N=1, Q_v=0.47, best=0.47, ubc=1.37)
├── (a=13, N=4, Q_v=0.43, best=0.71, ubc=1.07)
├── (a=2, N=1, Q_v=0.22, best=0.22, ubc=1.05)
├── (a=7, N=1, Q_v=0.13, best=0.13, ubc=0.96)
└── (a=14, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=20, N=5, Q_v=0.49, best=0.67, ubc=1.07)
├── (a=2, N=1, Q_v=0.49, best=0.49, ubc=1.39)
├── (a=7, N=1, Q_v=0.51, best=0.51, ubc=1.41)
├── (a=13, N=1, Q_v=0.38, best=0.38, ubc=1.28)
└── (a=21, N=1, Q_v=0.40, best=0.40, ubc=1.30)
├── (a=25, N=4, Q_v=0.35, best=0.71, ubc=1.00)
├── (a=2, N=1, Q_v=0.25, best=0.25, ubc=1.09)
├── (a=7, N=1, Q_v=0.18, best=0.18, ubc=1.01)
└── (a=31, N=1, Q_v=0.71, best=0.71, ubc=1.54)
└── (a=31, N=5, Q_v=0.49, best=0.84, ubc=1.07)
    ├── (a=2, N=1, Q_v=0.60, best=0.60, ubc=1.50)
    ├── (a=7, N=1, Q_v=0.18, best=0.18, ubc=1.08)
    ├── (a=13, N=1, Q_v=0.44, best=0.44, ubc=1.33)
    └── (a=32, N=1, Q_v=0.40, best=0.40, ubc=1.30)
├── (a=25, N=12, Q_v=0.28, best=0.71, ubc=0.73)
├── (a=2, N=2, Q_v=0.29, best=0.36, ubc=1.08)
└── (a=3, N=1, Q_v=0.22, best=0.22, ubc=0.81)
├── (a=7, N=2, Q_v=0.48, best=0.53, ubc=1.27)
└── (a=26, N=1, Q_v=0.53, best=0.53, ubc=1.12)
├── (a=13, N=2, Q_v=0.33, best=0.38, ubc=1.12)
└── (a=31, N=1, Q_v=0.38, best=0.38, ubc=0.97)
├── (a=19, N=2, Q_v=0.50, best=0.71, ubc=1.29)
└── (a=2, N=1, Q_v=0.29, best=0.29, ubc=0.88)
├── (a=26, N=1, Q_v=-0.20, best=-0.20, ubc=0.91)
└── (a=31, N=2, Q_v=0.11, best=0.22, ubc=0.90)
    └── (a=26, N=1, Q_v=0.00, best=0.00, ubc=0.59)
└── (a=31, N=27, Q_v=0.44, best=0.75, ubc=0.74)
    ├── (a=2, N=4, Q_v=0.44, best=0.67, ubc=1.08)
    ├── (a=3, N=1, Q_v=0.27, best=0.27, ubc=1.11)
    ├── (a=7, N=1, Q_v=0.16, best=0.16, ubc=1.00)
    └── (a=19, N=1, Q_v=0.65, best=0.65, ubc=1.49)
    ├── (a=7, N=4, Q_v=0.30, best=0.55, ubc=0.95)
    ├── (a=2, N=1, Q_v=0.15, best=0.15, ubc=0.98)
    ├── (a=8, N=1, Q_v=0.49, best=0.49, ubc=1.32)
    └── (a=13, N=1, Q_v=0.04, best=0.04, ubc=0.87)
    ├── (a=13, N=7, Q_v=0.59, best=0.75, ubc=1.08)
    ├── (a=2, N=1, Q_v=0.75, best=0.75, ubc=1.73)
    ├── (a=7, N=1, Q_v=0.44, best=0.44, ubc=1.42)
    ├── (a=14, N=1, Q_v=0.71, best=0.71, ubc=1.70)
    ├── (a=19, N=1, Q_v=0.64, best=0.64, ubc=1.62)
    ├── (a=25, N=1, Q_v=0.53, best=0.53, ubc=1.51)
    └── (a=32, N=1, Q_v=0.65, best=0.65, ubc=1.64)
    ├── (a=19, N=4, Q_v=0.38, best=0.47, ubc=1.02)
    ├── (a=2, N=1, Q_v=0.27, best=0.27, ubc=1.11)
    ├── (a=7, N=1, Q_v=0.36, best=0.36, ubc=1.20)
    └── (a=13, N=1, Q_v=0.42, best=0.42, ubc=1.25)
    ├── (a=25, N=2, Q_v=0.08, best=0.31, ubc=0.99)
    └── (a=2, N=1, Q_v=-0.15, best=-0.15, ubc=0.44)
    └── (a=32, N=5, Q_v=0.50, best=0.60, ubc=1.08)
        ├── (a=2, N=1, Q_v=0.53, best=0.53, ubc=1.42)
        ├── (a=7, N=1, Q_v=0.60, best=0.60, ubc=1.50)
        ├── (a=13, N=1, Q_v=0.47, best=0.47, ubc=1.37)
        └── (a=25, N=1, Q_v=0.31, best=0.31, ubc=1.21)
[16:53:22] INFO     selected action 19 after 125 simulations.
           INFO     current action list: [1, 19]
(N=125, Q_v=0.42, best=0.84)
├── (a=2, N=22, Q_v=0.44, best=0.76, ubc=0.77)
├── (a=3, N=4, Q_v=0.47, best=0.58, ubc=1.09)
├── (a=4, N=1, Q_v=0.53, best=0.53, ubc=1.36)
├── (a=7, N=1, Q_v=0.49, best=0.49, ubc=1.32)
└── (a=13, N=1, Q_v=0.29, best=0.29, ubc=1.12)
├── (a=7, N=4, Q_v=0.41, best=0.76, ubc=1.03)
├── (a=3, N=1, Q_v=0.25, best=0.25, ubc=1.09)
├── (a=8, N=1, Q_v=0.22, best=0.22, ubc=1.05)
└── (a=13, N=1, Q_v=0.40, best=0.40, ubc=1.23)
├── (a=13, N=2, Q_v=0.27, best=0.33, ubc=1.15)
└── (a=25, N=1, Q_v=0.22, best=0.22, ubc=0.81)
├── (a=20, N=3, Q_v=0.42, best=0.47, ubc=1.14)
├── (a=3, N=1, Q_v=0.38, best=0.38, ubc=1.12)
└── (a=7, N=1, Q_v=0.42, best=0.42, ubc=1.16)
├── (a=25, N=3, Q_v=0.32, best=0.40, ubc=1.04)
├── (a=3, N=1, Q_v=0.40, best=0.40, ubc=1.14)
└── (a=31, N=1, Q_v=0.16, best=0.16, ubc=0.90)
└── (a=31, N=5, Q_v=0.57, best=0.75, ubc=1.12)
    ├── (a=3, N=1, Q_v=0.36, best=0.36, ubc=1.26)
    ├── (a=7, N=1, Q_v=0.56, best=0.56, ubc=1.46)
    ├── (a=13, N=1, Q_v=0.55, best=0.55, ubc=1.44)
    └── (a=20, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=7, N=20, Q_v=0.42, best=0.69, ubc=0.77)
├── (a=2, N=4, Q_v=0.48, best=0.60, ubc=1.09)
├── (a=3, N=1, Q_v=0.55, best=0.55, ubc=1.38)
├── (a=8, N=1, Q_v=0.44, best=0.44, ubc=1.27)
└── (a=20, N=1, Q_v=0.33, best=0.33, ubc=1.16)
├── (a=8, N=3, Q_v=0.39, best=0.44, ubc=1.09)
├── (a=2, N=1, Q_v=0.33, best=0.33, ubc=1.07)
└── (a=13, N=1, Q_v=0.40, best=0.40, ubc=1.14)
├── (a=13, N=3, Q_v=0.45, best=0.56, ubc=1.15)
├── (a=2, N=1, Q_v=0.45, best=0.45, ubc=1.20)
└── (a=25, N=1, Q_v=0.56, best=0.56, ubc=1.30)
├── (a=20, N=3, Q_v=0.41, best=0.64, ubc=1.11)
├── (a=2, N=1, Q_v=0.24, best=0.24, ubc=0.98)
└── (a=13, N=1, Q_v=0.64, best=0.64, ubc=1.38)
├── (a=25, N=3, Q_v=0.45, best=0.69, ubc=1.15)
├── (a=2, N=1, Q_v=0.64, best=0.64, ubc=1.38)
└── (a=20, N=1, Q_v=0.02, best=0.02, ubc=0.76)
└── (a=31, N=3, Q_v=0.38, best=0.51, ubc=1.09)
    ├── (a=2, N=1, Q_v=0.24, best=0.24, ubc=0.98)
    └── (a=13, N=1, Q_v=0.51, best=0.51, ubc=1.25)
├── (a=13, N=19, Q_v=0.41, best=0.73, ubc=0.77)
├── (a=2, N=4, Q_v=0.54, best=0.73, ubc=1.15)
├── (a=3, N=1, Q_v=0.51, best=0.51, ubc=1.34)
├── (a=7, N=1, Q_v=0.45, best=0.45, ubc=1.29)
└── (a=14, N=1, Q_v=0.47, best=0.47, ubc=1.31)
├── (a=7, N=3, Q_v=0.30, best=0.62, ubc=1.00)
├── (a=2, N=1, Q_v=-0.15, best=-0.15, ubc=0.60)
└── (a=8, N=1, Q_v=0.42, best=0.42, ubc=1.16)
├── (a=14, N=3, Q_v=0.36, best=0.42, ubc=1.06)
├── (a=2, N=1, Q_v=0.31, best=0.31, ubc=1.05)
└── (a=31, N=1, Q_v=0.42, best=0.42, ubc=1.16)
├── (a=20, N=3, Q_v=0.38, best=0.49, ubc=1.08)
├── (a=2, N=1, Q_v=0.22, best=0.22, ubc=0.96)
└── (a=21, N=1, Q_v=0.44, best=0.44, ubc=1.18)
├── (a=25, N=2, Q_v=0.26, best=0.40, ubc=1.12)
└── (a=2, N=1, Q_v=0.13, best=0.13, ubc=0.72)
└── (a=31, N=3, Q_v=0.50, best=0.53, ubc=1.20)
    ├── (a=2, N=1, Q_v=0.51, best=0.51, ubc=1.25)
    └── (a=25, N=1, Q_v=0.53, best=0.53, ubc=1.27)
├── (a=20, N=24, Q_v=0.45, best=0.82, ubc=0.76)
├── (a=2, N=3, Q_v=0.37, best=0.42, ubc=1.10)
├── (a=3, N=1, Q_v=0.42, best=0.42, ubc=1.16)
└── (a=31, N=1, Q_v=0.29, best=0.29, ubc=1.03)
├── (a=7, N=5, Q_v=0.47, best=0.69, ubc=1.03)
├── (a=2, N=1, Q_v=0.69, best=0.69, ubc=1.59)
├── (a=8, N=1, Q_v=0.69, best=0.69, ubc=1.59)
├── (a=13, N=1, Q_v=0.13, best=0.13, ubc=1.02)
└── (a=21, N=1, Q_v=0.45, best=0.45, ubc=1.35)
├── (a=13, N=3, Q_v=0.45, best=0.75, ubc=1.18)
├── (a=2, N=1, Q_v=0.42, best=0.42, ubc=1.16)
└── (a=7, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=21, N=4, Q_v=0.42, best=0.56, ubc=1.05)
├── (a=2, N=1, Q_v=0.45, best=0.45, ubc=1.29)
├── (a=7, N=1, Q_v=0.22, best=0.22, ubc=1.05)
└── (a=25, N=1, Q_v=0.45, best=0.45, ubc=1.29)
├── (a=25, N=3, Q_v=0.33, best=0.36, ubc=1.05)
├── (a=2, N=1, Q_v=0.36, best=0.36, ubc=1.10)
└── (a=31, N=1, Q_v=0.33, best=0.33, ubc=1.07)
└── (a=31, N=5, Q_v=0.58, best=0.82, ubc=1.14)
    ├── (a=2, N=1, Q_v=0.62, best=0.62, ubc=1.52)
    ├── (a=7, N=1, Q_v=0.82, best=0.82, ubc=1.72)
    ├── (a=13, N=1, Q_v=0.49, best=0.49, ubc=1.39)
    └── (a=21, N=1, Q_v=0.24, best=0.24, ubc=1.13)
├── (a=25, N=19, Q_v=0.41, best=0.71, ubc=0.77)
├── (a=2, N=1, Q_v=-0.11, best=-0.11, ubc=1.10)
├── (a=7, N=4, Q_v=0.46, best=0.53, ubc=1.07)
├── (a=2, N=1, Q_v=0.44, best=0.44, ubc=1.27)
├── (a=8, N=1, Q_v=0.44, best=0.44, ubc=1.27)
└── (a=26, N=1, Q_v=0.53, best=0.53, ubc=1.36)
├── (a=13, N=3, Q_v=0.32, best=0.56, ubc=1.02)
├── (a=2, N=1, Q_v=0.33, best=0.33, ubc=1.07)
└── (a=20, N=1, Q_v=0.56, best=0.56, ubc=1.30)
├── (a=20, N=4, Q_v=0.55, best=0.71, ubc=1.16)
├── (a=2, N=1, Q_v=0.31, best=0.31, ubc=1.14)
├── (a=7, N=1, Q_v=0.49, best=0.49, ubc=1.32)
└── (a=13, N=1, Q_v=0.69, best=0.69, ubc=1.52)
├── (a=26, N=3, Q_v=0.45, best=0.65, ubc=1.15)
├── (a=2, N=1, Q_v=0.44, best=0.44, ubc=1.18)
└── (a=31, N=1, Q_v=0.25, best=0.25, ubc=1.00)
└── (a=31, N=3, Q_v=0.32, best=0.71, ubc=1.02)
    ├── (a=2, N=1, Q_v=0.15, best=0.15, ubc=0.89)
    └── (a=13, N=1, Q_v=0.71, best=0.71, ubc=1.45)
└── (a=31, N=20, Q_v=0.41, best=0.84, ubc=0.75)
    ├── (a=2, N=2, Q_v=0.24, best=0.35, ubc=1.10)
    └── (a=7, N=1, Q_v=0.35, best=0.35, ubc=0.93)
    ├── (a=7, N=3, Q_v=0.36, best=0.80, ubc=1.06)
    ├── (a=2, N=1, Q_v=0.00, best=0.00, ubc=0.74)
    └── (a=25, N=1, Q_v=0.80, best=0.80, ubc=1.54)
    ├── (a=13, N=3, Q_v=0.38, best=0.62, ubc=1.09)
    ├── (a=2, N=1, Q_v=0.62, best=0.62, ubc=1.36)
    └── (a=7, N=1, Q_v=0.35, best=0.35, ubc=1.09)
    ├── (a=20, N=3, Q_v=0.39, best=0.60, ubc=1.09)
    ├── (a=2, N=1, Q_v=0.22, best=0.22, ubc=0.96)
    └── (a=25, N=1, Q_v=0.35, best=0.35, ubc=1.09)
    ├── (a=25, N=5, Q_v=0.51, best=0.84, ubc=1.06)
    ├── (a=2, N=1, Q_v=0.55, best=0.55, ubc=1.44)
    ├── (a=7, N=1, Q_v=0.44, best=0.44, ubc=1.33)
    ├── (a=13, N=1, Q_v=0.11, best=0.11, ubc=1.01)
    └── (a=26, N=1, Q_v=0.84, best=0.84, ubc=1.73)
    └── (a=32, N=3, Q_v=0.41, best=0.62, ubc=1.11)
        ├── (a=2, N=1, Q_v=0.20, best=0.20, ubc=0.94)
        └── (a=7, N=1, Q_v=0.62, best=0.62, ubc=1.36)
[16:53:26] INFO     selected action 20 after 125 simulations.
           INFO     current action list: [1, 19, 20]
(N=125, Q_v=0.41, best=0.87)
├── (a=2, N=12, Q_v=0.30, best=0.62, ubc=0.75)
├── (a=3, N=2, Q_v=0.24, best=0.56, ubc=1.02)
└── (a=4, N=1, Q_v=-0.09, best=-0.09, ubc=0.50)
├── (a=7, N=3, Q_v=0.49, best=0.62, ubc=1.13)
├── (a=3, N=1, Q_v=0.33, best=0.33, ubc=1.07)
└── (a=25, N=1, Q_v=0.53, best=0.53, ubc=1.27)
├── (a=13, N=1, Q_v=0.04, best=0.04, ubc=1.15)
├── (a=21, N=1, Q_v=0.02, best=0.02, ubc=1.13)
├── (a=25, N=2, Q_v=0.31, best=0.42, ubc=1.10)
└── (a=26, N=1, Q_v=0.42, best=0.42, ubc=1.01)
└── (a=31, N=2, Q_v=0.27, best=0.29, ubc=1.06)
    └── (a=21, N=1, Q_v=0.25, best=0.25, ubc=0.84)
├── (a=7, N=18, Q_v=0.38, best=0.62, ubc=0.75)
├── (a=2, N=4, Q_v=0.47, best=0.58, ubc=1.07)
├── (a=3, N=1, Q_v=0.58, best=0.58, ubc=1.41)
├── (a=8, N=1, Q_v=0.44, best=0.44, ubc=1.27)
└── (a=13, N=1, Q_v=0.49, best=0.49, ubc=1.32)
├── (a=8, N=3, Q_v=0.39, best=0.47, ubc=1.09)
├── (a=2, N=1, Q_v=0.27, best=0.27, ubc=1.01)
└── (a=9, N=1, Q_v=0.47, best=0.47, ubc=1.21)
├── (a=13, N=3, Q_v=0.38, best=0.45, ubc=1.07)
├── (a=2, N=1, Q_v=0.45, best=0.45, ubc=1.20)
└── (a=21, N=1, Q_v=0.38, best=0.38, ubc=1.12)
├── (a=21, N=2, Q_v=0.27, best=0.27, ubc=1.12)
└── (a=25, N=1, Q_v=0.27, best=0.27, ubc=0.86)
├── (a=25, N=1, Q_v=-0.05, best=-0.05, ubc=1.15)
└── (a=31, N=4, Q_v=0.43, best=0.62, ubc=1.03)
    ├── (a=2, N=1, Q_v=0.25, best=0.25, ubc=1.09)
    ├── (a=8, N=1, Q_v=0.35, best=0.35, ubc=1.18)
    └── (a=21, N=1, Q_v=0.49, best=0.49, ubc=1.32)
├── (a=13, N=22, Q_v=0.43, best=0.78, ubc=0.76)
├── (a=2, N=3, Q_v=0.24, best=0.35, ubc=0.96)
├── (a=3, N=1, Q_v=0.07, best=0.07, ubc=0.81)
└── (a=25, N=1, Q_v=0.35, best=0.35, ubc=1.09)
├── (a=7, N=3, Q_v=0.43, best=0.64, ubc=1.15)
├── (a=2, N=1, Q_v=0.38, best=0.38, ubc=1.12)
└── (a=25, N=1, Q_v=0.27, best=0.27, ubc=1.01)
├── (a=14, N=2, Q_v=0.22, best=0.29, ubc=1.10)
└── (a=15, N=1, Q_v=0.29, best=0.29, ubc=0.88)
├── (a=21, N=3, Q_v=0.42, best=0.53, ubc=1.14)
├── (a=2, N=1, Q_v=0.36, best=0.36, ubc=1.10)
└── (a=22, N=1, Q_v=0.38, best=0.38, ubc=1.12)
├── (a=25, N=5, Q_v=0.54, best=0.78, ubc=1.09)
├── (a=2, N=1, Q_v=0.58, best=0.58, ubc=1.48)
├── (a=7, N=1, Q_v=0.78, best=0.78, ubc=1.68)
├── (a=14, N=1, Q_v=0.40, best=0.40, ubc=1.30)
└── (a=21, N=1, Q_v=0.69, best=0.69, ubc=1.59)
└── (a=31, N=5, Q_v=0.50, best=0.67, ubc=1.06)
    ├── (a=2, N=1, Q_v=0.65, best=0.65, ubc=1.55)
    ├── (a=7, N=1, Q_v=0.38, best=0.38, ubc=1.28)
    ├── (a=14, N=1, Q_v=0.67, best=0.67, ubc=1.57)
    └── (a=21, N=1, Q_v=0.40, best=0.40, ubc=1.30)
├── (a=21, N=22, Q_v=0.42, best=0.73, ubc=0.75)
├── (a=2, N=2, Q_v=0.11, best=0.25, ubc=0.99)
└── (a=25, N=1, Q_v=0.25, best=0.25, ubc=0.84)
├── (a=7, N=3, Q_v=0.41, best=0.47, ubc=1.12)
├── (a=2, N=1, Q_v=0.38, best=0.38, ubc=1.12)
└── (a=8, N=1, Q_v=0.47, best=0.47, ubc=1.21)
├── (a=13, N=4, Q_v=0.52, best=0.64, ubc=1.14)
├── (a=2, N=1, Q_v=0.42, best=0.42, ubc=1.25)
├── (a=7, N=1, Q_v=0.42, best=0.42, ubc=1.25)
└── (a=22, N=1, Q_v=0.62, best=0.62, ubc=1.45)
├── (a=22, N=3, Q_v=0.39, best=0.53, ubc=1.11)
├── (a=2, N=1, Q_v=0.53, best=0.53, ubc=1.27)
└── (a=13, N=1, Q_v=0.38, best=0.38, ubc=1.12)
├── (a=25, N=4, Q_v=0.42, best=0.56, ubc=1.04)
├── (a=2, N=1, Q_v=0.47, best=0.47, ubc=1.31)
├── (a=7, N=1, Q_v=0.29, best=0.29, ubc=1.12)
└── (a=13, N=1, Q_v=0.56, best=0.56, ubc=1.40)
└── (a=31, N=5, Q_v=0.51, best=0.73, ubc=1.06)
    ├── (a=2, N=1, Q_v=0.58, best=0.58, ubc=1.48)
    ├── (a=7, N=1, Q_v=0.73, best=0.73, ubc=1.62)
    ├── (a=13, N=1, Q_v=0.69, best=0.69, ubc=1.59)
    └── (a=22, N=1, Q_v=0.29, best=0.29, ubc=1.19)
├── (a=25, N=26, Q_v=0.44, best=0.76, ubc=0.75)
├── (a=2, N=4, Q_v=0.35, best=0.45, ubc=0.99)
├── (a=3, N=1, Q_v=0.27, best=0.27, ubc=1.11)
├── (a=7, N=1, Q_v=0.27, best=0.27, ubc=1.11)
└── (a=26, N=1, Q_v=0.45, best=0.45, ubc=1.29)
├── (a=7, N=4, Q_v=0.36, best=0.58, ubc=1.00)
├── (a=2, N=1, Q_v=0.58, best=0.58, ubc=1.41)
├── (a=8, N=1, Q_v=0.09, best=0.09, ubc=0.92)
└── (a=31, N=1, Q_v=0.29, best=0.29, ubc=1.12)
├── (a=13, N=5, Q_v=0.49, best=0.76, ubc=1.07)
├── (a=2, N=1, Q_v=0.76, best=0.76, ubc=1.66)
├── (a=7, N=1, Q_v=0.27, best=0.27, ubc=1.17)
├── (a=14, N=1, Q_v=0.53, best=0.53, ubc=1.42)
└── (a=26, N=1, Q_v=0.49, best=0.49, ubc=1.39)
├── (a=21, N=3, Q_v=0.38, best=0.40, ubc=1.11)
├── (a=2, N=1, Q_v=0.33, best=0.33, ubc=1.07)
└── (a=31, N=1, Q_v=0.40, best=0.40, ubc=1.14)
├── (a=26, N=6, Q_v=0.58, best=0.69, ubc=1.11)
├── (a=2, N=1, Q_v=0.60, best=0.60, ubc=1.55)
├── (a=7, N=1, Q_v=0.42, best=0.42, ubc=1.36)
├── (a=13, N=1, Q_v=0.44, best=0.44, ubc=1.38)
├── (a=21, N=1, Q_v=0.69, best=0.69, ubc=1.64)
└── (a=31, N=1, Q_v=0.67, best=0.67, ubc=1.62)
└── (a=31, N=3, Q_v=0.35, best=0.73, ubc=1.09)
    ├── (a=2, N=1, Q_v=0.05, best=0.05, ubc=0.80)
    └── (a=26, N=1, Q_v=0.27, best=0.27, ubc=1.01)
└── (a=31, N=24, Q_v=0.43, best=0.87, ubc=0.75)
    ├── (a=2, N=4, Q_v=0.39, best=0.58, ubc=1.02)
    ├── (a=3, N=1, Q_v=0.58, best=0.58, ubc=1.41)
    ├── (a=7, N=1, Q_v=0.44, best=0.44, ubc=1.27)
    └── (a=13, N=1, Q_v=0.27, best=0.27, ubc=1.11)
    ├── (a=7, N=4, Q_v=0.45, best=0.87, ubc=1.08)
    ├── (a=2, N=1, Q_v=0.87, best=0.87, ubc=1.71)
    ├── (a=8, N=1, Q_v=0.13, best=0.13, ubc=0.96)
    └── (a=21, N=1, Q_v=0.31, best=0.31, ubc=1.14)
    ├── (a=13, N=5, Q_v=0.49, best=0.84, ubc=1.05)
    ├── (a=2, N=1, Q_v=0.38, best=0.38, ubc=1.28)
    ├── (a=7, N=1, Q_v=0.84, best=0.84, ubc=1.73)
    ├── (a=14, N=1, Q_v=-0.02, best=-0.02, ubc=0.88)
    └── (a=32, N=1, Q_v=0.49, best=0.49, ubc=1.39)
    ├── (a=21, N=3, Q_v=0.37, best=0.55, ubc=1.10)
    ├── (a=2, N=1, Q_v=0.55, best=0.55, ubc=1.29)
    └── (a=25, N=1, Q_v=0.51, best=0.51, ubc=1.25)
    ├── (a=25, N=2, Q_v=0.25, best=0.38, ubc=1.14)
    └── (a=26, N=1, Q_v=0.11, best=0.11, ubc=0.70)
    └── (a=32, N=5, Q_v=0.50, best=0.65, ubc=1.06)
        ├── (a=2, N=1, Q_v=0.65, best=0.65, ubc=1.55)
        ├── (a=7, N=1, Q_v=0.62, best=0.62, ubc=1.52)
        ├── (a=13, N=1, Q_v=0.25, best=0.25, ubc=1.15)
        └── (a=21, N=1, Q_v=0.36, best=0.36, ubc=1.26)
[16:53:29] INFO     selected action 25 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25]
(N=125, Q_v=0.37, best=0.75)
├── (a=2, N=23, Q_v=0.38, best=0.64, ubc=0.70)
├── (a=3, N=3, Q_v=0.22, best=0.31, ubc=0.95)
├── (a=4, N=1, Q_v=0.31, best=0.31, ubc=1.05)
└── (a=21, N=1, Q_v=0.07, best=0.07, ubc=0.81)
├── (a=7, N=3, Q_v=0.28, best=0.44, ubc=1.00)
├── (a=3, N=1, Q_v=0.44, best=0.44, ubc=1.18)
└── (a=31, N=1, Q_v=0.05, best=0.05, ubc=0.80)
├── (a=13, N=5, Q_v=0.50, best=0.64, ubc=1.06)
├── (a=3, N=1, Q_v=0.49, best=0.49, ubc=1.39)
├── (a=7, N=1, Q_v=0.45, best=0.45, ubc=1.35)
├── (a=14, N=1, Q_v=0.56, best=0.56, ubc=1.46)
└── (a=21, N=1, Q_v=0.64, best=0.64, ubc=1.53)
├── (a=21, N=3, Q_v=0.33, best=0.51, ubc=1.06)
├── (a=3, N=1, Q_v=0.04, best=0.04, ubc=0.78)
└── (a=22, N=1, Q_v=0.51, best=0.51, ubc=1.25)
├── (a=26, N=3, Q_v=0.28, best=0.35, ubc=1.00)
├── (a=3, N=1, Q_v=0.27, best=0.27, ubc=1.01)
└── (a=21, N=1, Q_v=0.35, best=0.35, ubc=1.09)
└── (a=31, N=5, Q_v=0.46, best=0.64, ubc=1.02)
    ├── (a=3, N=1, Q_v=0.42, best=0.42, ubc=1.32)
    ├── (a=7, N=1, Q_v=0.55, best=0.55, ubc=1.44)
    ├── (a=13, N=1, Q_v=0.09, best=0.09, ubc=0.99)
    └── (a=32, N=1, Q_v=0.64, best=0.64, ubc=1.53)
├── (a=7, N=25, Q_v=0.40, best=0.71, ubc=0.71)
├── (a=2, N=5, Q_v=0.44, best=0.67, ubc=1.00)
├── (a=3, N=1, Q_v=0.67, best=0.67, ubc=1.57)
├── (a=8, N=1, Q_v=0.25, best=0.25, ubc=1.15)
├── (a=13, N=1, Q_v=0.51, best=0.51, ubc=1.41)
└── (a=21, N=1, Q_v=0.22, best=0.22, ubc=1.12)
├── (a=8, N=4, Q_v=0.45, best=0.58, ubc=1.08)
├── (a=2, N=1, Q_v=0.25, best=0.25, ubc=1.09)
├── (a=9, N=1, Q_v=0.58, best=0.58, ubc=1.41)
└── (a=13, N=1, Q_v=0.49, best=0.49, ubc=1.32)
├── (a=13, N=4, Q_v=0.42, best=0.71, ubc=1.05)
├── (a=2, N=1, Q_v=0.42, best=0.42, ubc=1.25)
├── (a=8, N=1, Q_v=0.13, best=0.13, ubc=0.96)
└── (a=31, N=1, Q_v=0.42, best=0.42, ubc=1.25)
├── (a=21, N=4, Q_v=0.36, best=0.47, ubc=1.00)
├── (a=2, N=1, Q_v=0.24, best=0.24, ubc=1.07)
├── (a=8, N=1, Q_v=0.36, best=0.36, ubc=1.20)
└── (a=13, N=1, Q_v=0.38, best=0.38, ubc=1.21)
├── (a=26, N=4, Q_v=0.38, best=0.58, ubc=1.01)
├── (a=2, N=1, Q_v=0.53, best=0.53, ubc=1.36)
├── (a=8, N=1, Q_v=0.09, best=0.09, ubc=0.92)
└── (a=13, N=1, Q_v=0.31, best=0.31, ubc=1.14)
└── (a=31, N=3, Q_v=0.31, best=0.38, ubc=1.04)
    ├── (a=2, N=1, Q_v=0.27, best=0.27, ubc=1.01)
    └── (a=8, N=1, Q_v=0.27, best=0.27, ubc=1.01)
├── (a=13, N=14, Q_v=0.29, best=0.73, ubc=0.71)
├── (a=2, N=2, Q_v=0.33, best=0.49, ubc=1.14)
└── (a=21, N=1, Q_v=0.49, best=0.49, ubc=1.08)
├── (a=7, N=2, Q_v=0.23, best=0.24, ubc=1.04)
└── (a=21, N=1, Q_v=0.22, best=0.22, ubc=0.81)
├── (a=14, N=4, Q_v=0.52, best=0.73, ubc=1.10)
├── (a=2, N=1, Q_v=0.73, best=0.73, ubc=1.56)
├── (a=7, N=1, Q_v=0.49, best=0.49, ubc=1.32)
└── (a=15, N=1, Q_v=0.27, best=0.27, ubc=1.11)
├── (a=21, N=2, Q_v=0.19, best=0.24, ubc=1.00)
└── (a=7, N=1, Q_v=0.15, best=0.15, ubc=0.73)
├── (a=26, N=1, Q_v=0.00, best=0.00, ubc=1.15)
└── (a=31, N=2, Q_v=-0.02, best=0.33, ubc=0.79)
    └── (a=2, N=1, Q_v=-0.36, best=-0.36, ubc=0.22)
├── (a=21, N=28, Q_v=0.41, best=0.62, ubc=0.70)
├── (a=2, N=4, Q_v=0.40, best=0.58, ubc=1.05)
├── (a=3, N=1, Q_v=0.38, best=0.38, ubc=1.21)
├── (a=7, N=1, Q_v=0.58, best=0.58, ubc=1.41)
└── (a=31, N=1, Q_v=0.22, best=0.22, ubc=1.05)
├── (a=7, N=5, Q_v=0.45, best=0.53, ubc=1.03)
├── (a=2, N=1, Q_v=0.36, best=0.36, ubc=1.26)
├── (a=8, N=1, Q_v=0.42, best=0.42, ubc=1.32)
├── (a=13, N=1, Q_v=0.47, best=0.47, ubc=1.37)
└── (a=31, N=1, Q_v=0.49, best=0.49, ubc=1.39)
├── (a=13, N=5, Q_v=0.46, best=0.62, ubc=1.04)
├── (a=2, N=1, Q_v=0.40, best=0.40, ubc=1.30)
├── (a=7, N=1, Q_v=0.62, best=0.62, ubc=1.52)
├── (a=14, N=1, Q_v=0.49, best=0.49, ubc=1.39)
└── (a=26, N=1, Q_v=0.35, best=0.35, ubc=1.24)
├── (a=22, N=4, Q_v=0.37, best=0.45, ubc=1.01)
├── (a=2, N=1, Q_v=0.27, best=0.27, ubc=1.11)
├── (a=7, N=1, Q_v=0.45, best=0.45, ubc=1.29)
└── (a=13, N=1, Q_v=0.42, best=0.42, ubc=1.25)
├── (a=26, N=4, Q_v=0.36, best=0.58, ubc=1.00)
├── (a=2, N=1, Q_v=0.35, best=0.35, ubc=1.18)
├── (a=7, N=1, Q_v=0.27, best=0.27, ubc=1.11)
└── (a=27, N=1, Q_v=0.58, best=0.58, ubc=1.41)
└── (a=31, N=5, Q_v=0.39, best=0.55, ubc=0.96)
    ├── (a=2, N=1, Q_v=0.36, best=0.36, ubc=1.26)
    ├── (a=7, N=1, Q_v=0.55, best=0.55, ubc=1.44)
    ├── (a=13, N=1, Q_v=0.40, best=0.40, ubc=1.30)
    └── (a=22, N=1, Q_v=0.22, best=0.22, ubc=1.12)
├── (a=26, N=20, Q_v=0.36, best=0.56, ubc=0.70)
├── (a=2, N=4, Q_v=0.39, best=0.56, ubc=1.00)
├── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.40)
├── (a=7, N=1, Q_v=0.29, best=0.29, ubc=1.12)
└── (a=27, N=1, Q_v=0.33, best=0.33, ubc=1.16)
├── (a=7, N=3, Q_v=0.39, best=0.51, ubc=1.10)
├── (a=2, N=1, Q_v=0.33, best=0.33, ubc=1.07)
└── (a=31, N=1, Q_v=0.51, best=0.51, ubc=1.25)
├── (a=13, N=3, Q_v=0.32, best=0.40, ubc=1.02)
├── (a=2, N=1, Q_v=0.25, best=0.25, ubc=1.00)
└── (a=14, N=1, Q_v=0.40, best=0.40, ubc=1.14)
├── (a=21, N=3, Q_v=0.29, best=0.40, ubc=1.00)
├── (a=2, N=1, Q_v=0.25, best=0.25, ubc=1.00)
└── (a=7, N=1, Q_v=0.22, best=0.22, ubc=0.96)
├── (a=27, N=3, Q_v=0.42, best=0.53, ubc=1.13)
├── (a=2, N=1, Q_v=0.53, best=0.53, ubc=1.27)
└── (a=28, N=1, Q_v=0.49, best=0.49, ubc=1.23)
└── (a=31, N=3, Q_v=0.33, best=0.38, ubc=1.04)
    ├── (a=2, N=1, Q_v=0.38, best=0.38, ubc=1.12)
    └── (a=27, N=1, Q_v=0.25, best=0.25, ubc=1.00)
└── (a=31, N=14, Q_v=0.30, best=0.75, ubc=0.72)
    ├── (a=2, N=2, Q_v=0.26, best=0.47, ubc=1.08)
    └── (a=3, N=1, Q_v=0.05, best=0.05, ubc=0.64)
    ├── (a=7, N=2, Q_v=0.25, best=0.36, ubc=1.06)
    └── (a=13, N=1, Q_v=0.13, best=0.13, ubc=0.72)
    ├── (a=13, N=2, Q_v=0.27, best=0.56, ubc=1.08)
    └── (a=2, N=1, Q_v=-0.02, best=-0.02, ubc=0.57)
    ├── (a=21, N=2, Q_v=0.31, best=0.75, ubc=1.12)
    └── (a=22, N=1, Q_v=-0.13, best=-0.13, ubc=0.46)
    ├── (a=26, N=2, Q_v=0.21, best=0.42, ubc=1.02)
    └── (a=2, N=1, Q_v=0.00, best=0.00, ubc=0.59)
    └── (a=32, N=3, Q_v=0.42, best=0.56, ubc=1.08)
        ├── (a=2, N=1, Q_v=0.56, best=0.56, ubc=1.30)
        └── (a=21, N=1, Q_v=0.36, best=0.36, ubc=1.10)
[16:53:33] INFO     selected action 21 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21]
(N=125, Q_v=0.42, best=0.82)
├── (a=2, N=18, Q_v=0.38, best=0.75, ubc=0.74)
├── (a=3, N=3, Q_v=0.29, best=0.49, ubc=0.98)
├── (a=4, N=1, Q_v=0.13, best=0.13, ubc=0.87)
└── (a=22, N=1, Q_v=0.25, best=0.25, ubc=1.00)
├── (a=7, N=3, Q_v=0.45, best=0.75, ubc=1.15)
├── (a=3, N=1, Q_v=0.25, best=0.25, ubc=1.00)
└── (a=8, N=1, Q_v=0.36, best=0.36, ubc=1.10)
├── (a=13, N=3, Q_v=0.39, best=0.71, ubc=1.08)
├── (a=3, N=1, Q_v=0.25, best=0.25, ubc=1.00)
└── (a=26, N=1, Q_v=0.71, best=0.71, ubc=1.45)
├── (a=22, N=3, Q_v=0.42, best=0.49, ubc=1.11)
├── (a=3, N=1, Q_v=0.42, best=0.42, ubc=1.16)
└── (a=13, N=1, Q_v=0.35, best=0.35, ubc=1.09)
├── (a=26, N=3, Q_v=0.36, best=0.58, ubc=1.05)
├── (a=3, N=1, Q_v=0.05, best=0.05, ubc=0.80)
└── (a=31, N=1, Q_v=0.44, best=0.44, ubc=1.18)
└── (a=31, N=2, Q_v=0.33, best=0.47, ubc=1.18)
    └── (a=26, N=1, Q_v=0.18, best=0.18, ubc=0.77)
├── (a=7, N=15, Q_v=0.35, best=0.56, ubc=0.75)
├── (a=2, N=2, Q_v=0.35, best=0.42, ubc=1.17)
└── (a=31, N=1, Q_v=0.27, best=0.27, ubc=0.86)
├── (a=8, N=2, Q_v=0.38, best=0.44, ubc=1.20)
└── (a=26, N=1, Q_v=0.44, best=0.44, ubc=1.02)
├── (a=13, N=2, Q_v=0.31, best=0.35, ubc=1.13)
└── (a=8, N=1, Q_v=0.35, best=0.35, ubc=0.93)
├── (a=22, N=3, Q_v=0.39, best=0.56, ubc=1.06)
├── (a=2, N=1, Q_v=0.27, best=0.27, ubc=1.01)
└── (a=31, N=1, Q_v=0.56, best=0.56, ubc=1.30)
├── (a=26, N=3, Q_v=0.41, best=0.51, ubc=1.08)
├── (a=2, N=1, Q_v=0.33, best=0.33, ubc=1.07)
└── (a=13, N=1, Q_v=0.51, best=0.51, ubc=1.25)
└── (a=31, N=2, Q_v=0.34, best=0.38, ubc=1.16)
    └── (a=32, N=1, Q_v=0.38, best=0.38, ubc=0.97)
├── (a=13, N=28, Q_v=0.46, best=0.82, ubc=0.76)
├── (a=2, N=4, Q_v=0.45, best=0.64, ubc=1.09)
├── (a=3, N=1, Q_v=0.36, best=0.36, ubc=1.20)
├── (a=7, N=1, Q_v=0.53, best=0.53, ubc=1.36)
└── (a=22, N=1, Q_v=0.25, best=0.25, ubc=1.09)
├── (a=7, N=4, Q_v=0.30, best=0.56, ubc=0.95)
├── (a=2, N=1, Q_v=0.42, best=0.42, ubc=1.25)
├── (a=8, N=1, Q_v=0.02, best=0.02, ubc=0.85)
└── (a=22, N=1, Q_v=0.56, best=0.56, ubc=1.40)
├── (a=14, N=5, Q_v=0.53, best=0.62, ubc=1.11)
├── (a=2, N=1, Q_v=0.53, best=0.53, ubc=1.42)
├── (a=7, N=1, Q_v=0.58, best=0.58, ubc=1.48)
├── (a=15, N=1, Q_v=0.47, best=0.47, ubc=1.37)
└── (a=31, N=1, Q_v=0.47, best=0.47, ubc=1.37)
├── (a=22, N=4, Q_v=0.43, best=0.49, ubc=1.08)
├── (a=2, N=1, Q_v=0.49, best=0.49, ubc=1.32)
├── (a=7, N=1, Q_v=0.47, best=0.47, ubc=1.31)
└── (a=23, N=1, Q_v=0.35, best=0.35, ubc=1.18)
├── (a=26, N=5, Q_v=0.53, best=0.82, ubc=1.10)
├── (a=2, N=1, Q_v=0.82, best=0.82, ubc=1.72)
├── (a=7, N=1, Q_v=0.51, best=0.51, ubc=1.41)
├── (a=14, N=1, Q_v=0.29, best=0.29, ubc=1.19)
└── (a=22, N=1, Q_v=0.53, best=0.53, ubc=1.42)
└── (a=31, N=5, Q_v=0.47, best=0.69, ubc=1.05)
    ├── (a=2, N=1, Q_v=0.69, best=0.69, ubc=1.59)
    ├── (a=7, N=1, Q_v=0.58, best=0.58, ubc=1.48)
    ├── (a=14, N=1, Q_v=0.22, best=0.22, ubc=1.12)
    └── (a=26, N=1, Q_v=0.45, best=0.45, ubc=1.35)
├── (a=22, N=15, Q_v=0.35, best=0.53, ubc=0.76)
├── (a=2, N=3, Q_v=0.36, best=0.49, ubc=1.04)
├── (a=3, N=1, Q_v=0.25, best=0.25, ubc=1.00)
└── (a=31, N=1, Q_v=0.35, best=0.35, ubc=1.09)
├── (a=7, N=2, Q_v=0.39, best=0.47, ubc=1.21)
└── (a=8, N=1, Q_v=0.31, best=0.31, ubc=0.90)
├── (a=13, N=3, Q_v=0.49, best=0.53, ubc=1.16)
├── (a=2, N=1, Q_v=0.51, best=0.51, ubc=1.25)
└── (a=26, N=1, Q_v=0.44, best=0.44, ubc=1.18)
├── (a=23, N=2, Q_v=0.29, best=0.49, ubc=1.11)
└── (a=31, N=1, Q_v=0.49, best=0.49, ubc=1.08)
├── (a=26, N=2, Q_v=0.23, best=0.29, ubc=1.05)
└── (a=7, N=1, Q_v=0.29, best=0.29, ubc=0.88)
└── (a=31, N=2, Q_v=0.30, best=0.35, ubc=1.12)
    └── (a=13, N=1, Q_v=0.25, best=0.25, ubc=0.84)
├── (a=26, N=33, Q_v=0.47, best=0.82, ubc=0.74)
├── (a=2, N=4, Q_v=0.39, best=0.49, ubc=1.05)
├── (a=3, N=1, Q_v=0.33, best=0.33, ubc=1.16)
├── (a=7, N=1, Q_v=0.49, best=0.49, ubc=1.32)
└── (a=31, N=1, Q_v=0.40, best=0.40, ubc=1.23)
├── (a=7, N=6, Q_v=0.52, best=0.71, ubc=1.06)
├── (a=2, N=1, Q_v=0.71, best=0.71, ubc=1.66)
├── (a=8, N=1, Q_v=0.64, best=0.64, ubc=1.58)
├── (a=13, N=1, Q_v=0.49, best=0.49, ubc=1.44)
├── (a=22, N=1, Q_v=0.58, best=0.58, ubc=1.53)
└── (a=27, N=1, Q_v=0.22, best=0.22, ubc=1.16)
├── (a=13, N=4, Q_v=0.40, best=0.56, ubc=1.06)
├── (a=2, N=1, Q_v=0.44, best=0.44, ubc=1.27)
├── (a=7, N=1, Q_v=0.56, best=0.56, ubc=1.40)
└── (a=14, N=1, Q_v=0.49, best=0.49, ubc=1.32)
├── (a=22, N=5, Q_v=0.49, best=0.64, ubc=1.08)
├── (a=2, N=1, Q_v=0.44, best=0.44, ubc=1.33)
├── (a=7, N=1, Q_v=0.29, best=0.29, ubc=1.19)
├── (a=13, N=1, Q_v=0.49, best=0.49, ubc=1.39)
└── (a=23, N=1, Q_v=0.64, best=0.64, ubc=1.53)
├── (a=27, N=6, Q_v=0.57, best=0.82, ubc=1.11)
├── (a=2, N=1, Q_v=0.73, best=0.73, ubc=1.67)
├── (a=7, N=1, Q_v=0.53, best=0.53, ubc=1.47)
├── (a=13, N=1, Q_v=0.82, best=0.82, ubc=1.76)
├── (a=22, N=1, Q_v=0.56, best=0.56, ubc=1.51)
└── (a=28, N=1, Q_v=0.45, best=0.45, ubc=1.40)
└── (a=31, N=7, Q_v=0.48, best=0.76, ubc=0.98)
    ├── (a=2, N=1, Q_v=0.56, best=0.56, ubc=1.55)
    ├── (a=7, N=1, Q_v=0.40, best=0.40, ubc=1.39)
    ├── (a=13, N=1, Q_v=0.60, best=0.60, ubc=1.59)
    ├── (a=22, N=1, Q_v=0.60, best=0.60, ubc=1.59)
    ├── (a=27, N=1, Q_v=0.49, best=0.49, ubc=1.48)
    └── (a=32, N=1, Q_v=-0.04, best=-0.04, ubc=0.95)
└── (a=31, N=15, Q_v=0.36, best=0.62, ubc=0.76)
    ├── (a=2, N=2, Q_v=0.28, best=0.42, ubc=1.10)
    └── (a=32, N=1, Q_v=0.42, best=0.42, ubc=1.01)
    ├── (a=7, N=2, Q_v=0.22, best=0.25, ubc=1.04)
    └── (a=2, N=1, Q_v=0.25, best=0.25, ubc=0.84)
    ├── (a=13, N=3, Q_v=0.50, best=0.60, ubc=1.17)
    ├── (a=2, N=1, Q_v=0.33, best=0.33, ubc=1.07)
    └── (a=22, N=1, Q_v=0.56, best=0.56, ubc=1.30)
    ├── (a=22, N=2, Q_v=0.38, best=0.62, ubc=1.20)
    └── (a=26, N=1, Q_v=0.15, best=0.15, ubc=0.73)
    ├── (a=26, N=2, Q_v=0.17, best=0.25, ubc=1.00)
    └── (a=22, N=1, Q_v=0.25, best=0.25, ubc=0.84)
    └── (a=32, N=3, Q_v=0.43, best=0.60, ubc=1.10)
        ├── (a=2, N=1, Q_v=0.29, best=0.29, ubc=1.03)
        └── (a=7, N=1, Q_v=0.40, best=0.40, ubc=1.14)
[16:53:37] INFO     selected action 26 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26]
(N=125, Q_v=0.41, best=0.78)
├── (a=2, N=17, Q_v=0.37, best=0.71, ubc=0.75)
├── (a=3, N=3, Q_v=0.47, best=0.55, ubc=1.15)
├── (a=4, N=1, Q_v=0.47, best=0.47, ubc=1.21)
└── (a=22, N=1, Q_v=0.38, best=0.38, ubc=1.12)
├── (a=7, N=1, Q_v=-0.11, best=-0.11, ubc=1.08)
├── (a=13, N=4, Q_v=0.48, best=0.71, ubc=1.07)
├── (a=3, N=1, Q_v=0.55, best=0.55, ubc=1.38)
├── (a=7, N=1, Q_v=0.18, best=0.18, ubc=1.01)
└── (a=27, N=1, Q_v=0.71, best=0.71, ubc=1.54)
├── (a=22, N=2, Q_v=0.38, best=0.38, ubc=1.22)
└── (a=31, N=1, Q_v=0.38, best=0.38, ubc=0.97)
├── (a=27, N=3, Q_v=0.29, best=0.47, ubc=0.98)
├── (a=3, N=1, Q_v=0.04, best=0.04, ubc=0.78)
└── (a=28, N=1, Q_v=0.36, best=0.36, ubc=1.10)
└── (a=31, N=3, Q_v=0.34, best=0.49, ubc=1.03)
    ├── (a=3, N=1, Q_v=0.20, best=0.20, ubc=0.94)
    └── (a=27, N=1, Q_v=0.49, best=0.49, ubc=1.23)
├── (a=7, N=23, Q_v=0.43, best=0.71, ubc=0.75)
├── (a=2, N=4, Q_v=0.36, best=0.67, ubc=0.99)
├── (a=3, N=1, Q_v=0.09, best=0.09, ubc=0.92)
├── (a=8, N=1, Q_v=0.15, best=0.15, ubc=0.98)
└── (a=31, N=1, Q_v=0.67, best=0.67, ubc=1.51)
├── (a=8, N=3, Q_v=0.41, best=0.49, ubc=1.13)
├── (a=2, N=1, Q_v=0.29, best=0.29, ubc=1.03)
└── (a=31, N=1, Q_v=0.44, best=0.44, ubc=1.18)
├── (a=13, N=4, Q_v=0.49, best=0.71, ubc=1.11)
├── (a=2, N=1, Q_v=0.53, best=0.53, ubc=1.36)
├── (a=8, N=1, Q_v=0.22, best=0.22, ubc=1.05)
└── (a=22, N=1, Q_v=0.49, best=0.49, ubc=1.32)
├── (a=22, N=3, Q_v=0.42, best=0.53, ubc=1.14)
├── (a=2, N=1, Q_v=0.53, best=0.53, ubc=1.27)
└── (a=27, N=1, Q_v=0.47, best=0.47, ubc=1.21)
├── (a=27, N=4, Q_v=0.49, best=0.56, ubc=1.12)
├── (a=2, N=1, Q_v=0.53, best=0.53, ubc=1.36)
├── (a=8, N=1, Q_v=0.55, best=0.55, ubc=1.38)
└── (a=13, N=1, Q_v=0.56, best=0.56, ubc=1.40)
└── (a=31, N=4, Q_v=0.49, best=0.58, ubc=1.12)
    ├── (a=2, N=1, Q_v=0.55, best=0.55, ubc=1.38)
    ├── (a=8, N=1, Q_v=0.47, best=0.47, ubc=1.31)
    └── (a=22, N=1, Q_v=0.58, best=0.58, ubc=1.41)
├── (a=13, N=22, Q_v=0.42, best=0.65, ubc=0.75)
├── (a=2, N=5, Q_v=0.52, best=0.65, ubc=1.08)
├── (a=3, N=1, Q_v=0.47, best=0.47, ubc=1.37)
├── (a=7, N=1, Q_v=0.53, best=0.53, ubc=1.42)
├── (a=14, N=1, Q_v=0.47, best=0.47, ubc=1.37)
└── (a=22, N=1, Q_v=0.47, best=0.47, ubc=1.37)
├── (a=7, N=3, Q_v=0.37, best=0.58, ubc=1.09)
├── (a=2, N=1, Q_v=0.58, best=0.58, ubc=1.32)
└── (a=31, N=1, Q_v=0.31, best=0.31, ubc=1.05)
├── (a=14, N=3, Q_v=0.33, best=0.44, ubc=1.04)
├── (a=2, N=1, Q_v=0.36, best=0.36, ubc=1.10)
└── (a=27, N=1, Q_v=0.44, best=0.44, ubc=1.18)
├── (a=22, N=2, Q_v=0.15, best=0.36, ubc=1.02)
└── (a=23, N=1, Q_v=0.36, best=0.36, ubc=0.95)
├── (a=27, N=4, Q_v=0.49, best=0.65, ubc=1.11)
├── (a=2, N=1, Q_v=0.58, best=0.58, ubc=1.41)
├── (a=7, N=1, Q_v=0.22, best=0.22, ubc=1.05)
└── (a=14, N=1, Q_v=0.65, best=0.65, ubc=1.49)
└── (a=31, N=4, Q_v=0.44, best=0.56, ubc=1.06)
    ├── (a=2, N=1, Q_v=0.51, best=0.51, ubc=1.34)
    ├── (a=7, N=1, Q_v=0.33, best=0.33, ubc=1.16)
    └── (a=14, N=1, Q_v=0.36, best=0.36, ubc=1.20)
├── (a=22, N=19, Q_v=0.39, best=0.78, ubc=0.75)
├── (a=2, N=4, Q_v=0.46, best=0.78, ubc=1.07)
├── (a=3, N=1, Q_v=0.25, best=0.25, ubc=1.09)
├── (a=7, N=1, Q_v=0.56, best=0.56, ubc=1.40)
└── (a=13, N=1, Q_v=0.24, best=0.24, ubc=1.07)
├── (a=7, N=3, Q_v=0.36, best=0.47, ubc=1.06)
├── (a=2, N=1, Q_v=0.25, best=0.25, ubc=1.00)
└── (a=13, N=1, Q_v=0.47, best=0.47, ubc=1.21)
├── (a=13, N=2, Q_v=0.28, best=0.36, ubc=1.14)
└── (a=2, N=1, Q_v=0.20, best=0.20, ubc=0.79)
├── (a=23, N=4, Q_v=0.42, best=0.58, ubc=1.03)
├── (a=2, N=1, Q_v=0.33, best=0.33, ubc=1.16)
├── (a=7, N=1, Q_v=0.31, best=0.31, ubc=1.14)
└── (a=27, N=1, Q_v=0.47, best=0.47, ubc=1.31)
├── (a=27, N=2, Q_v=0.28, best=0.29, ubc=1.14)
└── (a=2, N=1, Q_v=0.29, best=0.29, ubc=0.88)
└── (a=31, N=3, Q_v=0.41, best=0.58, ubc=1.11)
    ├── (a=2, N=1, Q_v=0.58, best=0.58, ubc=1.32)
    └── (a=7, N=1, Q_v=0.22, best=0.22, ubc=0.96)
├── (a=27, N=24, Q_v=0.44, best=0.64, ubc=0.75)
├── (a=2, N=4, Q_v=0.45, best=0.53, ubc=1.08)
├── (a=3, N=1, Q_v=0.38, best=0.38, ubc=1.21)
├── (a=7, N=1, Q_v=0.53, best=0.53, ubc=1.36)
└── (a=13, N=1, Q_v=0.53, best=0.53, ubc=1.36)
├── (a=7, N=4, Q_v=0.50, best=0.58, ubc=1.13)
├── (a=2, N=1, Q_v=0.49, best=0.49, ubc=1.32)
├── (a=8, N=1, Q_v=0.58, best=0.58, ubc=1.41)
└── (a=13, N=1, Q_v=0.47, best=0.47, ubc=1.31)
├── (a=13, N=4, Q_v=0.46, best=0.60, ubc=1.09)
├── (a=2, N=1, Q_v=0.60, best=0.60, ubc=1.43)
├── (a=7, N=1, Q_v=0.49, best=0.49, ubc=1.32)
└── (a=31, N=1, Q_v=0.45, best=0.45, ubc=1.29)
├── (a=22, N=3, Q_v=0.40, best=0.56, ubc=1.13)
├── (a=2, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=31, N=1, Q_v=0.24, best=0.24, ubc=0.98)
├── (a=28, N=4, Q_v=0.44, best=0.64, ubc=1.07)
├── (a=2, N=1, Q_v=0.56, best=0.56, ubc=1.40)
├── (a=7, N=1, Q_v=0.00, best=0.00, ubc=0.83)
└── (a=13, N=1, Q_v=0.56, best=0.56, ubc=1.40)
└── (a=31, N=4, Q_v=0.38, best=0.64, ubc=1.01)
    ├── (a=2, N=1, Q_v=0.56, best=0.56, ubc=1.40)
    ├── (a=7, N=1, Q_v=0.13, best=0.13, ubc=0.96)
    └── (a=13, N=1, Q_v=0.20, best=0.20, ubc=1.03)
└── (a=31, N=19, Q_v=0.37, best=0.62, ubc=0.72)
    ├── (a=2, N=3, Q_v=0.32, best=0.47, ubc=1.02)
    ├── (a=3, N=1, Q_v=0.20, best=0.20, ubc=0.94)
    └── (a=13, N=1, Q_v=0.27, best=0.27, ubc=1.01)
    ├── (a=7, N=2, Q_v=0.25, best=0.42, ubc=1.10)
    └── (a=27, N=1, Q_v=0.42, best=0.42, ubc=1.01)
    ├── (a=13, N=2, Q_v=0.29, best=0.55, ubc=1.15)
    └── (a=22, N=1, Q_v=0.55, best=0.55, ubc=1.13)
    ├── (a=22, N=3, Q_v=0.17, best=0.40, ubc=0.87)
    ├── (a=2, N=1, Q_v=-0.18, best=-0.18, ubc=0.56)
    └── (a=32, N=1, Q_v=0.40, best=0.40, ubc=1.14)
    ├── (a=27, N=4, Q_v=0.50, best=0.62, ubc=1.10)
    ├── (a=2, N=1, Q_v=0.62, best=0.62, ubc=1.45)
    ├── (a=7, N=1, Q_v=0.31, best=0.31, ubc=1.14)
    └── (a=13, N=1, Q_v=0.53, best=0.53, ubc=1.36)
    └── (a=32, N=4, Q_v=0.51, best=0.62, ubc=1.12)
        ├── (a=2, N=1, Q_v=0.58, best=0.58, ubc=1.41)
        ├── (a=7, N=1, Q_v=0.29, best=0.29, ubc=1.12)
        └── (a=27, N=1, Q_v=0.56, best=0.56, ubc=1.40)
[16:53:40] INFO     selected action 27 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27]
(N=125, Q_v=0.39, best=0.87)
├── (a=2, N=23, Q_v=0.42, best=0.76, ubc=0.74)
├── (a=3, N=3, Q_v=0.27, best=0.44, ubc=1.00)
├── (a=4, N=1, Q_v=0.27, best=0.27, ubc=1.01)
└── (a=31, N=1, Q_v=0.44, best=0.44, ubc=1.18)
├── (a=7, N=4, Q_v=0.45, best=0.64, ubc=1.08)
├── (a=3, N=1, Q_v=0.38, best=0.38, ubc=1.21)
├── (a=8, N=1, Q_v=0.36, best=0.36, ubc=1.20)
└── (a=13, N=1, Q_v=0.42, best=0.42, ubc=1.25)
├── (a=13, N=5, Q_v=0.49, best=0.76, ubc=1.05)
├── (a=3, N=1, Q_v=0.27, best=0.27, ubc=1.17)
├── (a=7, N=1, Q_v=0.49, best=0.49, ubc=1.39)
├── (a=14, N=1, Q_v=0.35, best=0.35, ubc=1.24)
└── (a=28, N=1, Q_v=0.76, best=0.76, ubc=1.66)
├── (a=22, N=3, Q_v=0.42, best=0.49, ubc=1.14)
├── (a=3, N=1, Q_v=0.47, best=0.47, ubc=1.21)
└── (a=31, N=1, Q_v=0.29, best=0.29, ubc=1.03)
├── (a=28, N=3, Q_v=0.28, best=0.33, ubc=1.01)
├── (a=3, N=1, Q_v=0.27, best=0.27, ubc=1.01)
└── (a=29, N=1, Q_v=0.33, best=0.33, ubc=1.07)
└── (a=31, N=4, Q_v=0.47, best=0.65, ubc=1.09)
    ├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.49)
    ├── (a=7, N=1, Q_v=0.53, best=0.53, ubc=1.36)
    └── (a=32, N=1, Q_v=0.18, best=0.18, ubc=1.01)
├── (a=7, N=23, Q_v=0.42, best=0.87, ubc=0.74)
├── (a=2, N=2, Q_v=0.19, best=0.31, ubc=1.08)
└── (a=13, N=1, Q_v=0.07, best=0.07, ubc=0.66)
├── (a=8, N=3, Q_v=0.36, best=0.55, ubc=1.09)
├── (a=2, N=1, Q_v=0.40, best=0.40, ubc=1.14)
└── (a=9, N=1, Q_v=0.55, best=0.55, ubc=1.29)
├── (a=13, N=4, Q_v=0.40, best=0.62, ubc=1.03)
├── (a=2, N=1, Q_v=0.62, best=0.62, ubc=1.45)
├── (a=8, N=1, Q_v=0.33, best=0.33, ubc=1.16)
└── (a=14, N=1, Q_v=0.40, best=0.40, ubc=1.23)
├── (a=22, N=3, Q_v=0.35, best=0.53, ubc=1.07)
├── (a=2, N=1, Q_v=0.53, best=0.53, ubc=1.27)
└── (a=23, N=1, Q_v=0.45, best=0.45, ubc=1.20)
├── (a=28, N=4, Q_v=0.45, best=0.58, ubc=1.08)
├── (a=2, N=1, Q_v=0.36, best=0.36, ubc=1.20)
├── (a=8, N=1, Q_v=0.49, best=0.49, ubc=1.32)
└── (a=22, N=1, Q_v=0.58, best=0.58, ubc=1.41)
└── (a=31, N=6, Q_v=0.54, best=0.87, ubc=1.05)
    ├── (a=2, N=1, Q_v=0.51, best=0.51, ubc=1.46)
    ├── (a=8, N=1, Q_v=0.49, best=0.49, ubc=1.44)
    ├── (a=13, N=1, Q_v=0.87, best=0.87, ubc=1.82)
    ├── (a=22, N=1, Q_v=0.40, best=0.40, ubc=1.35)
    └── (a=28, N=1, Q_v=0.49, best=0.49, ubc=1.44)
├── (a=13, N=21, Q_v=0.40, best=0.64, ubc=0.73)
├── (a=2, N=4, Q_v=0.51, best=0.60, ubc=1.13)
├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.43)
├── (a=7, N=1, Q_v=0.53, best=0.53, ubc=1.36)
└── (a=14, N=1, Q_v=0.56, best=0.56, ubc=1.40)
├── (a=7, N=3, Q_v=0.33, best=0.64, ubc=1.04)
├── (a=2, N=1, Q_v=0.29, best=0.29, ubc=1.03)
└── (a=31, N=1, Q_v=0.64, best=0.64, ubc=1.38)
├── (a=14, N=3, Q_v=0.42, best=0.56, ubc=1.14)
├── (a=2, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=7, N=1, Q_v=0.51, best=0.51, ubc=1.25)
├── (a=22, N=4, Q_v=0.42, best=0.58, ubc=1.04)
├── (a=2, N=1, Q_v=0.22, best=0.22, ubc=1.05)
├── (a=7, N=1, Q_v=0.33, best=0.33, ubc=1.16)
└── (a=28, N=1, Q_v=0.58, best=0.58, ubc=1.41)
├── (a=28, N=3, Q_v=0.39, best=0.49, ubc=1.10)
├── (a=2, N=1, Q_v=0.49, best=0.49, ubc=1.23)
└── (a=14, N=1, Q_v=0.49, best=0.49, ubc=1.23)
└── (a=31, N=3, Q_v=0.33, best=0.51, ubc=1.04)
    ├── (a=2, N=1, Q_v=0.15, best=0.15, ubc=0.89)
    └── (a=14, N=1, Q_v=0.33, best=0.33, ubc=1.07)
├── (a=22, N=20, Q_v=0.39, best=0.64, ubc=0.73)
├── (a=2, N=3, Q_v=0.44, best=0.47, ubc=1.15)
├── (a=3, N=1, Q_v=0.47, best=0.47, ubc=1.21)
└── (a=28, N=1, Q_v=0.38, best=0.38, ubc=1.12)
├── (a=7, N=4, Q_v=0.45, best=0.60, ubc=1.06)
├── (a=2, N=1, Q_v=0.49, best=0.49, ubc=1.32)
├── (a=8, N=1, Q_v=0.27, best=0.27, ubc=1.11)
└── (a=28, N=1, Q_v=0.44, best=0.44, ubc=1.27)
├── (a=13, N=3, Q_v=0.34, best=0.45, ubc=1.05)
├── (a=2, N=1, Q_v=0.13, best=0.13, ubc=0.87)
└── (a=28, N=1, Q_v=0.44, best=0.44, ubc=1.18)
├── (a=23, N=4, Q_v=0.34, best=0.56, ubc=0.95)
├── (a=2, N=1, Q_v=0.42, best=0.42, ubc=1.25)
├── (a=7, N=1, Q_v=0.56, best=0.56, ubc=1.40)
└── (a=13, N=1, Q_v=-0.09, best=-0.09, ubc=0.74)
├── (a=28, N=2, Q_v=0.25, best=0.40, ubc=1.12)
└── (a=7, N=1, Q_v=0.40, best=0.40, ubc=0.99)
└── (a=31, N=3, Q_v=0.47, best=0.64, ubc=1.17)
    ├── (a=2, N=1, Q_v=0.16, best=0.16, ubc=0.90)
    └── (a=13, N=1, Q_v=0.64, best=0.64, ubc=1.38)
├── (a=28, N=20, Q_v=0.40, best=0.80, ubc=0.74)
├── (a=2, N=3, Q_v=0.28, best=0.49, ubc=0.99)
├── (a=3, N=1, Q_v=0.20, best=0.20, ubc=0.94)
└── (a=13, N=1, Q_v=0.16, best=0.16, ubc=0.90)
├── (a=7, N=3, Q_v=0.35, best=0.51, ubc=1.06)
├── (a=2, N=1, Q_v=0.38, best=0.38, ubc=1.12)
└── (a=13, N=1, Q_v=0.16, best=0.16, ubc=0.90)
├── (a=13, N=3, Q_v=0.42, best=0.49, ubc=1.13)
├── (a=2, N=1, Q_v=0.45, best=0.45, ubc=1.20)
└── (a=14, N=1, Q_v=0.49, best=0.49, ubc=1.23)
├── (a=22, N=4, Q_v=0.50, best=0.55, ubc=1.12)
├── (a=2, N=1, Q_v=0.49, best=0.49, ubc=1.32)
├── (a=7, N=1, Q_v=0.53, best=0.53, ubc=1.36)
└── (a=13, N=1, Q_v=0.55, best=0.55, ubc=1.38)
├── (a=29, N=3, Q_v=0.43, best=0.56, ubc=1.14)
├── (a=2, N=1, Q_v=0.35, best=0.35, ubc=1.09)
└── (a=7, N=1, Q_v=0.38, best=0.38, ubc=1.12)
└── (a=31, N=3, Q_v=0.37, best=0.80, ubc=1.08)
    ├── (a=2, N=1, Q_v=0.22, best=0.22, ubc=0.96)
    └── (a=7, N=1, Q_v=0.09, best=0.09, ubc=0.83)
└── (a=31, N=17, Q_v=0.37, best=0.56, ubc=0.75)
    ├── (a=2, N=3, Q_v=0.47, best=0.53, ubc=1.16)
    ├── (a=3, N=1, Q_v=0.45, best=0.45, ubc=1.20)
    └── (a=28, N=1, Q_v=0.53, best=0.53, ubc=1.27)
    ├── (a=7, N=3, Q_v=0.29, best=0.53, ubc=0.98)
    ├── (a=2, N=1, Q_v=-0.05, best=-0.05, ubc=0.69)
    └── (a=32, N=1, Q_v=0.53, best=0.53, ubc=1.27)
    ├── (a=13, N=2, Q_v=0.35, best=0.56, ubc=1.19)
    └── (a=2, N=1, Q_v=0.56, best=0.56, ubc=1.15)
    ├── (a=22, N=3, Q_v=0.41, best=0.53, ubc=1.10)
    ├── (a=2, N=1, Q_v=0.24, best=0.24, ubc=0.98)
    └── (a=23, N=1, Q_v=0.47, best=0.47, ubc=1.21)
    ├── (a=28, N=3, Q_v=0.26, best=0.44, ubc=0.95)
    ├── (a=2, N=1, Q_v=0.42, best=0.42, ubc=1.16)
    └── (a=7, N=1, Q_v=-0.07, best=-0.07, ubc=0.67)
    └── (a=32, N=2, Q_v=0.35, best=0.49, ubc=1.20)
        └── (a=2, N=1, Q_v=0.49, best=0.49, ubc=1.08)
[16:53:43] INFO     selected action 7 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7]
(N=125, Q_v=0.42, best=0.78)
├── (a=2, N=13, Q_v=0.32, best=0.58, ubc=0.75)
├── (a=3, N=2, Q_v=0.30, best=0.35, ubc=1.10)
└── (a=13, N=1, Q_v=0.25, best=0.25, ubc=0.84)
├── (a=8, N=1, Q_v=0.11, best=0.11, ubc=1.24)
├── (a=13, N=2, Q_v=0.31, best=0.31, ubc=1.11)
└── (a=8, N=1, Q_v=0.31, best=0.31, ubc=0.90)
├── (a=22, N=2, Q_v=0.39, best=0.56, ubc=1.19)
└── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.15)
├── (a=28, N=2, Q_v=0.35, best=0.42, ubc=1.16)
└── (a=31, N=1, Q_v=0.42, best=0.42, ubc=1.01)
└── (a=31, N=3, Q_v=0.42, best=0.58, ubc=1.07)
    ├── (a=3, N=1, Q_v=0.29, best=0.29, ubc=1.03)
    └── (a=22, N=1, Q_v=0.38, best=0.38, ubc=1.12)
├── (a=8, N=22, Q_v=0.43, best=0.78, ubc=0.76)
├── (a=2, N=3, Q_v=0.41, best=0.65, ubc=1.13)
├── (a=3, N=1, Q_v=0.33, best=0.33, ubc=1.07)
└── (a=13, N=1, Q_v=0.25, best=0.25, ubc=1.00)
├── (a=9, N=4, Q_v=0.45, best=0.55, ubc=1.08)
├── (a=2, N=1, Q_v=0.42, best=0.42, ubc=1.25)
├── (a=10, N=1, Q_v=0.36, best=0.36, ubc=1.20)
└── (a=28, N=1, Q_v=0.49, best=0.49, ubc=1.32)
├── (a=13, N=4, Q_v=0.50, best=0.60, ubc=1.12)
├── (a=2, N=1, Q_v=0.49, best=0.49, ubc=1.32)
├── (a=9, N=1, Q_v=0.35, best=0.35, ubc=1.18)
└── (a=22, N=1, Q_v=0.55, best=0.55, ubc=1.38)
├── (a=22, N=2, Q_v=0.17, best=0.29, ubc=1.05)
└── (a=9, N=1, Q_v=0.05, best=0.05, ubc=0.64)
├── (a=28, N=5, Q_v=0.52, best=0.78, ubc=1.08)
├── (a=2, N=1, Q_v=0.51, best=0.51, ubc=1.41)
├── (a=9, N=1, Q_v=0.36, best=0.36, ubc=1.26)
├── (a=13, N=1, Q_v=0.78, best=0.78, ubc=1.68)
└── (a=22, N=1, Q_v=0.49, best=0.49, ubc=1.39)
└── (a=31, N=3, Q_v=0.41, best=0.49, ubc=1.13)
    ├── (a=2, N=1, Q_v=0.49, best=0.49, ubc=1.23)
    └── (a=22, N=1, Q_v=0.49, best=0.49, ubc=1.23)
├── (a=13, N=19, Q_v=0.40, best=0.76, ubc=0.75)
├── (a=2, N=1, Q_v=-0.11, best=-0.11, ubc=1.10)
├── (a=8, N=3, Q_v=0.33, best=0.49, ubc=1.03)
├── (a=2, N=1, Q_v=0.49, best=0.49, ubc=1.23)
└── (a=9, N=1, Q_v=0.18, best=0.18, ubc=0.92)
├── (a=14, N=4, Q_v=0.49, best=0.67, ubc=1.10)
├── (a=2, N=1, Q_v=0.22, best=0.22, ubc=1.05)
├── (a=8, N=1, Q_v=0.56, best=0.56, ubc=1.40)
└── (a=15, N=1, Q_v=0.51, best=0.51, ubc=1.34)
├── (a=22, N=3, Q_v=0.45, best=0.60, ubc=1.15)
├── (a=2, N=1, Q_v=0.49, best=0.49, ubc=1.23)
└── (a=28, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=28, N=2, Q_v=0.21, best=0.76, ubc=1.07)
└── (a=2, N=1, Q_v=-0.35, best=-0.35, ubc=0.24)
└── (a=31, N=5, Q_v=0.52, best=0.67, ubc=1.06)
    ├── (a=2, N=1, Q_v=0.67, best=0.67, ubc=1.57)
    ├── (a=8, N=1, Q_v=0.40, best=0.40, ubc=1.30)
    ├── (a=14, N=1, Q_v=0.40, best=0.40, ubc=1.30)
    └── (a=28, N=1, Q_v=0.56, best=0.56, ubc=1.46)
├── (a=22, N=24, Q_v=0.44, best=0.60, ubc=0.75)
├── (a=2, N=4, Q_v=0.46, best=0.58, ubc=1.09)
├── (a=3, N=1, Q_v=0.24, best=0.24, ubc=1.07)
├── (a=8, N=1, Q_v=0.53, best=0.53, ubc=1.36)
└── (a=28, N=1, Q_v=0.58, best=0.58, ubc=1.41)
├── (a=8, N=3, Q_v=0.36, best=0.49, ubc=1.09)
├── (a=2, N=1, Q_v=0.49, best=0.49, ubc=1.23)
└── (a=9, N=1, Q_v=0.35, best=0.35, ubc=1.09)
├── (a=13, N=4, Q_v=0.39, best=0.60, ubc=1.02)
├── (a=2, N=1, Q_v=0.42, best=0.42, ubc=1.25)
├── (a=8, N=1, Q_v=0.25, best=0.25, ubc=1.09)
└── (a=23, N=1, Q_v=0.27, best=0.27, ubc=1.11)
├── (a=23, N=5, Q_v=0.48, best=0.53, ubc=1.04)
├── (a=2, N=1, Q_v=0.49, best=0.49, ubc=1.39)
├── (a=8, N=1, Q_v=0.45, best=0.45, ubc=1.35)
├── (a=13, N=1, Q_v=0.53, best=0.53, ubc=1.42)
└── (a=24, N=1, Q_v=0.38, best=0.38, ubc=1.28)
├── (a=28, N=4, Q_v=0.46, best=0.60, ubc=1.09)
├── (a=2, N=1, Q_v=0.51, best=0.51, ubc=1.34)
├── (a=8, N=1, Q_v=0.60, best=0.60, ubc=1.43)
└── (a=13, N=1, Q_v=0.40, best=0.40, ubc=1.23)
└── (a=31, N=3, Q_v=0.40, best=0.47, ubc=1.13)
    ├── (a=2, N=1, Q_v=0.47, best=0.47, ubc=1.21)
    └── (a=13, N=1, Q_v=0.29, best=0.29, ubc=1.03)
├── (a=28, N=31, Q_v=0.47, best=0.75, ubc=0.75)
├── (a=2, N=5, Q_v=0.50, best=0.65, ubc=1.09)
├── (a=3, N=1, Q_v=0.64, best=0.64, ubc=1.53)
├── (a=8, N=1, Q_v=0.07, best=0.07, ubc=0.97)
├── (a=13, N=1, Q_v=0.60, best=0.60, ubc=1.50)
└── (a=31, N=1, Q_v=0.55, best=0.55, ubc=1.44)
├── (a=8, N=5, Q_v=0.49, best=0.65, ubc=1.08)
├── (a=2, N=1, Q_v=0.65, best=0.65, ubc=1.55)
├── (a=9, N=1, Q_v=0.51, best=0.51, ubc=1.41)
├── (a=13, N=1, Q_v=0.35, best=0.35, ubc=1.24)
└── (a=22, N=1, Q_v=0.49, best=0.49, ubc=1.39)
├── (a=13, N=4, Q_v=0.33, best=0.45, ubc=0.98)
├── (a=2, N=1, Q_v=0.45, best=0.45, ubc=1.29)
├── (a=8, N=1, Q_v=0.40, best=0.40, ubc=1.23)
└── (a=14, N=1, Q_v=0.27, best=0.27, ubc=1.11)
├── (a=22, N=6, Q_v=0.49, best=0.75, ubc=1.03)
├── (a=2, N=1, Q_v=0.31, best=0.31, ubc=1.26)
├── (a=8, N=1, Q_v=0.35, best=0.35, ubc=1.29)
├── (a=13, N=1, Q_v=0.62, best=0.62, ubc=1.56)
├── (a=23, N=1, Q_v=0.55, best=0.55, ubc=1.49)
└── (a=29, N=1, Q_v=0.40, best=0.40, ubc=1.35)
├── (a=29, N=5, Q_v=0.48, best=0.64, ubc=1.07)
├── (a=2, N=1, Q_v=0.47, best=0.47, ubc=1.37)
├── (a=8, N=1, Q_v=0.56, best=0.56, ubc=1.46)
├── (a=13, N=1, Q_v=0.64, best=0.64, ubc=1.53)
└── (a=22, N=1, Q_v=0.40, best=0.40, ubc=1.30)
└── (a=31, N=5, Q_v=0.49, best=0.64, ubc=1.08)
    ├── (a=2, N=1, Q_v=0.56, best=0.56, ubc=1.46)
    ├── (a=8, N=1, Q_v=0.60, best=0.60, ubc=1.50)
    ├── (a=13, N=1, Q_v=0.64, best=0.64, ubc=1.53)
    └── (a=22, N=1, Q_v=0.18, best=0.18, ubc=1.08)
└── (a=31, N=15, Q_v=0.36, best=0.65, ubc=0.76)
    ├── (a=2, N=2, Q_v=0.36, best=0.38, ubc=1.19)
    └── (a=8, N=1, Q_v=0.35, best=0.35, ubc=0.93)
    ├── (a=8, N=3, Q_v=0.44, best=0.58, ubc=1.11)
    ├── (a=2, N=1, Q_v=0.24, best=0.24, ubc=0.98)
    └── (a=13, N=1, Q_v=0.58, best=0.58, ubc=1.32)
    ├── (a=13, N=2, Q_v=0.27, best=0.33, ubc=1.10)
    └── (a=28, N=1, Q_v=0.22, best=0.22, ubc=0.81)
    ├── (a=22, N=2, Q_v=0.36, best=0.45, ubc=1.19)
    └── (a=8, N=1, Q_v=0.45, best=0.45, ubc=1.04)
    ├── (a=28, N=3, Q_v=0.33, best=0.56, ubc=1.01)
    ├── (a=2, N=1, Q_v=0.02, best=0.02, ubc=0.76)
    └── (a=8, N=1, Q_v=0.56, best=0.56, ubc=1.30)
    └── (a=32, N=2, Q_v=0.42, best=0.65, ubc=1.24)
        └── (a=22, N=1, Q_v=0.65, best=0.65, ubc=1.24)
[16:53:47] INFO     selected action 28 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28]
(N=125, Q_v=0.43, best=0.76)
├── (a=2, N=25, Q_v=0.46, best=0.64, ubc=0.77)
├── (a=3, N=4, Q_v=0.45, best=0.56, ubc=1.08)
├── (a=4, N=1, Q_v=0.33, best=0.33, ubc=1.16)
├── (a=8, N=1, Q_v=0.56, best=0.56, ubc=1.40)
└── (a=13, N=1, Q_v=0.55, best=0.55, ubc=1.38)
├── (a=8, N=3, Q_v=0.30, best=0.38, ubc=1.03)
├── (a=3, N=1, Q_v=0.35, best=0.35, ubc=1.09)
└── (a=29, N=1, Q_v=0.38, best=0.38, ubc=1.12)
├── (a=13, N=5, Q_v=0.50, best=0.62, ubc=1.07)
├── (a=3, N=1, Q_v=0.40, best=0.40, ubc=1.30)
├── (a=8, N=1, Q_v=0.62, best=0.62, ubc=1.52)
├── (a=14, N=1, Q_v=0.49, best=0.49, ubc=1.39)
└── (a=22, N=1, Q_v=0.44, best=0.44, ubc=1.33)
├── (a=22, N=4, Q_v=0.42, best=0.56, ubc=1.06)
├── (a=3, N=1, Q_v=0.49, best=0.49, ubc=1.32)
├── (a=8, N=1, Q_v=0.42, best=0.42, ubc=1.25)
└── (a=13, N=1, Q_v=0.22, best=0.22, ubc=1.05)
├── (a=29, N=4, Q_v=0.50, best=0.58, ubc=1.14)
├── (a=3, N=1, Q_v=0.53, best=0.53, ubc=1.36)
├── (a=8, N=1, Q_v=0.58, best=0.58, ubc=1.41)
└── (a=31, N=1, Q_v=0.45, best=0.45, ubc=1.29)
└── (a=31, N=4, Q_v=0.50, best=0.55, ubc=1.13)
    ├── (a=3, N=1, Q_v=0.47, best=0.47, ubc=1.31)
    ├── (a=8, N=1, Q_v=0.55, best=0.55, ubc=1.38)
    └── (a=32, N=1, Q_v=0.49, best=0.49, ubc=1.32)
├── (a=8, N=23, Q_v=0.45, best=0.65, ubc=0.77)
├── (a=2, N=4, Q_v=0.45, best=0.65, ubc=1.08)
├── (a=3, N=1, Q_v=0.20, best=0.20, ubc=1.03)
├── (a=9, N=1, Q_v=0.42, best=0.42, ubc=1.25)
└── (a=29, N=1, Q_v=0.53, best=0.53, ubc=1.36)
├── (a=9, N=3, Q_v=0.38, best=0.56, ubc=1.10)
├── (a=2, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=13, N=1, Q_v=0.20, best=0.20, ubc=0.94)
├── (a=13, N=4, Q_v=0.45, best=0.60, ubc=1.08)
├── (a=2, N=1, Q_v=0.36, best=0.36, ubc=1.20)
├── (a=9, N=1, Q_v=0.60, best=0.60, ubc=1.43)
└── (a=29, N=1, Q_v=0.31, best=0.31, ubc=1.14)
├── (a=22, N=4, Q_v=0.47, best=0.56, ubc=1.09)
├── (a=2, N=1, Q_v=0.38, best=0.38, ubc=1.21)
├── (a=9, N=1, Q_v=0.44, best=0.44, ubc=1.27)
└── (a=29, N=1, Q_v=0.56, best=0.56, ubc=1.40)
├── (a=29, N=2, Q_v=0.18, best=0.18, ubc=1.07)
└── (a=22, N=1, Q_v=0.18, best=0.18, ubc=0.77)
└── (a=31, N=5, Q_v=0.55, best=0.65, ubc=1.11)
    ├── (a=2, N=1, Q_v=0.49, best=0.49, ubc=1.39)
    ├── (a=9, N=1, Q_v=0.65, best=0.65, ubc=1.55)
    ├── (a=13, N=1, Q_v=0.49, best=0.49, ubc=1.39)
    └── (a=32, N=1, Q_v=0.65, best=0.65, ubc=1.55)
├── (a=13, N=18, Q_v=0.40, best=0.76, ubc=0.76)
├── (a=2, N=3, Q_v=0.45, best=0.76, ubc=1.14)
├── (a=3, N=1, Q_v=0.33, best=0.33, ubc=1.07)
└── (a=14, N=1, Q_v=0.76, best=0.76, ubc=1.50)
├── (a=8, N=3, Q_v=0.38, best=0.47, ubc=1.08)
├── (a=2, N=1, Q_v=0.33, best=0.33, ubc=1.07)
└── (a=14, N=1, Q_v=0.35, best=0.35, ubc=1.09)
├── (a=14, N=2, Q_v=0.29, best=0.53, ubc=1.14)
└── (a=2, N=1, Q_v=0.53, best=0.53, ubc=1.12)
├── (a=22, N=3, Q_v=0.44, best=0.53, ubc=1.14)
├── (a=2, N=1, Q_v=0.38, best=0.38, ubc=1.12)
└── (a=23, N=1, Q_v=0.53, best=0.53, ubc=1.27)
├── (a=29, N=3, Q_v=0.40, best=0.60, ubc=1.09)
├── (a=2, N=1, Q_v=0.25, best=0.25, ubc=1.00)
└── (a=30, N=1, Q_v=0.35, best=0.35, ubc=1.09)
└── (a=31, N=3, Q_v=0.28, best=0.62, ubc=0.97)
    ├── (a=2, N=1, Q_v=0.13, best=0.13, ubc=0.87)
    └── (a=8, N=1, Q_v=0.09, best=0.09, ubc=0.83)
├── (a=22, N=23, Q_v=0.45, best=0.65, ubc=0.77)
├── (a=2, N=5, Q_v=0.52, best=0.65, ubc=1.08)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.55)
├── (a=8, N=1, Q_v=0.40, best=0.40, ubc=1.30)
├── (a=13, N=1, Q_v=0.56, best=0.56, ubc=1.46)
└── (a=23, N=1, Q_v=0.42, best=0.42, ubc=1.32)
├── (a=8, N=3, Q_v=0.41, best=0.62, ubc=1.13)
├── (a=2, N=1, Q_v=0.27, best=0.27, ubc=1.01)
└── (a=29, N=1, Q_v=0.35, best=0.35, ubc=1.09)
├── (a=13, N=4, Q_v=0.44, best=0.55, ubc=1.06)
├── (a=2, N=1, Q_v=0.55, best=0.55, ubc=1.38)
├── (a=8, N=1, Q_v=0.31, best=0.31, ubc=1.14)
└── (a=29, N=1, Q_v=0.36, best=0.36, ubc=1.20)
├── (a=23, N=4, Q_v=0.50, best=0.62, ubc=1.12)
├── (a=2, N=1, Q_v=0.38, best=0.38, ubc=1.21)
├── (a=8, N=1, Q_v=0.42, best=0.42, ubc=1.25)
└── (a=13, N=1, Q_v=0.62, best=0.62, ubc=1.45)
├── (a=29, N=2, Q_v=0.28, best=0.36, ubc=1.17)
└── (a=8, N=1, Q_v=0.20, best=0.20, ubc=0.79)
└── (a=31, N=4, Q_v=0.41, best=0.53, ubc=1.04)
    ├── (a=2, N=1, Q_v=0.47, best=0.47, ubc=1.31)
    ├── (a=8, N=1, Q_v=0.20, best=0.20, ubc=1.03)
    └── (a=13, N=1, Q_v=0.53, best=0.53, ubc=1.36)
├── (a=29, N=15, Q_v=0.36, best=0.64, ubc=0.76)
├── (a=2, N=3, Q_v=0.38, best=0.51, ubc=1.05)
├── (a=3, N=1, Q_v=0.31, best=0.31, ubc=1.05)
└── (a=22, N=1, Q_v=0.31, best=0.31, ubc=1.05)
├── (a=8, N=2, Q_v=0.39, best=0.42, ubc=1.21)
└── (a=22, N=1, Q_v=0.42, best=0.42, ubc=1.01)
├── (a=13, N=3, Q_v=0.33, best=0.53, ubc=1.00)
├── (a=2, N=1, Q_v=0.53, best=0.53, ubc=1.27)
└── (a=8, N=1, Q_v=0.04, best=0.04, ubc=0.78)
├── (a=22, N=2, Q_v=0.41, best=0.44, ubc=1.23)
└── (a=23, N=1, Q_v=0.38, best=0.38, ubc=0.97)
├── (a=30, N=2, Q_v=0.27, best=0.44, ubc=1.10)
└── (a=13, N=1, Q_v=0.44, best=0.44, ubc=1.02)
└── (a=31, N=2, Q_v=0.40, best=0.64, ubc=1.22)
    └── (a=13, N=1, Q_v=0.64, best=0.64, ubc=1.22)
└── (a=31, N=20, Q_v=0.42, best=0.75, ubc=0.77)
    ├── (a=2, N=2, Q_v=0.17, best=0.27, ubc=1.04)
    └── (a=32, N=1, Q_v=0.27, best=0.27, ubc=0.86)
    ├── (a=8, N=3, Q_v=0.47, best=0.65, ubc=1.18)
    ├── (a=2, N=1, Q_v=0.20, best=0.20, ubc=0.94)
    └── (a=13, N=1, Q_v=0.65, best=0.65, ubc=1.40)
    ├── (a=13, N=4, Q_v=0.50, best=0.75, ubc=1.11)
    ├── (a=2, N=1, Q_v=0.56, best=0.56, ubc=1.40)
    ├── (a=8, N=1, Q_v=0.38, best=0.38, ubc=1.21)
    └── (a=14, N=1, Q_v=0.29, best=0.29, ubc=1.12)
    ├── (a=22, N=4, Q_v=0.40, best=0.56, ubc=1.01)
    ├── (a=2, N=1, Q_v=0.38, best=0.38, ubc=1.21)
    ├── (a=8, N=1, Q_v=0.09, best=0.09, ubc=0.92)
    └── (a=13, N=1, Q_v=0.56, best=0.56, ubc=1.40)
    ├── (a=29, N=3, Q_v=0.41, best=0.49, ubc=1.12)
    ├── (a=2, N=1, Q_v=0.38, best=0.38, ubc=1.12)
    └── (a=8, N=1, Q_v=0.36, best=0.36, ubc=1.10)
    └── (a=32, N=3, Q_v=0.45, best=0.69, ubc=1.15)
        ├── (a=2, N=1, Q_v=0.51, best=0.51, ubc=1.25)
        └── (a=8, N=1, Q_v=0.15, best=0.15, ubc=0.89)
[16:53:50] INFO     selected action 2 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2]
(N=125, Q_v=0.41, best=0.69)
├── (a=3, N=17, Q_v=0.37, best=0.69, ubc=0.74)
├── (a=4, N=2, Q_v=0.33, best=0.45, ubc=1.17)
└── (a=31, N=1, Q_v=0.20, best=0.20, ubc=0.79)
├── (a=8, N=3, Q_v=0.43, best=0.64, ubc=1.12)
├── (a=4, N=1, Q_v=0.24, best=0.24, ubc=0.98)
└── (a=22, N=1, Q_v=0.64, best=0.64, ubc=1.38)
├── (a=13, N=3, Q_v=0.49, best=0.69, ubc=1.18)
├── (a=4, N=1, Q_v=0.18, best=0.18, ubc=0.92)
└── (a=14, N=1, Q_v=0.69, best=0.69, ubc=1.43)
├── (a=22, N=3, Q_v=0.39, best=0.42, ubc=1.08)
├── (a=4, N=1, Q_v=0.42, best=0.42, ubc=1.16)
└── (a=8, N=1, Q_v=0.35, best=0.35, ubc=1.09)
├── (a=29, N=2, Q_v=0.29, best=0.35, ubc=1.13)
└── (a=13, N=1, Q_v=0.24, best=0.24, ubc=0.82)
└── (a=31, N=3, Q_v=0.35, best=0.45, ubc=1.03)
    ├── (a=4, N=1, Q_v=0.35, best=0.35, ubc=1.09)
    └── (a=8, N=1, Q_v=0.45, best=0.45, ubc=1.20)
├── (a=8, N=19, Q_v=0.38, best=0.69, ubc=0.74)
├── (a=3, N=3, Q_v=0.42, best=0.51, ubc=1.12)
├── (a=4, N=1, Q_v=0.40, best=0.40, ubc=1.14)
└── (a=29, N=1, Q_v=0.51, best=0.51, ubc=1.25)
├── (a=9, N=4, Q_v=0.37, best=0.67, ubc=0.98)
├── (a=3, N=1, Q_v=0.40, best=0.40, ubc=1.23)
├── (a=10, N=1, Q_v=-0.02, best=-0.02, ubc=0.81)
└── (a=31, N=1, Q_v=0.44, best=0.44, ubc=1.27)
├── (a=13, N=2, Q_v=0.35, best=0.35, ubc=1.20)
└── (a=9, N=1, Q_v=0.35, best=0.35, ubc=0.93)
├── (a=22, N=4, Q_v=0.50, best=0.58, ubc=1.10)
├── (a=3, N=1, Q_v=0.58, best=0.58, ubc=1.41)
├── (a=9, N=1, Q_v=0.42, best=0.42, ubc=1.25)
└── (a=23, N=1, Q_v=0.58, best=0.58, ubc=1.41)
├── (a=29, N=3, Q_v=0.35, best=0.44, ubc=1.05)
├── (a=3, N=1, Q_v=0.25, best=0.25, ubc=1.00)
└── (a=22, N=1, Q_v=0.44, best=0.44, ubc=1.18)
└── (a=31, N=2, Q_v=0.07, best=0.15, ubc=0.93)
    └── (a=22, N=1, Q_v=0.15, best=0.15, ubc=0.73)
├── (a=13, N=26, Q_v=0.45, best=0.67, ubc=0.75)
├── (a=3, N=4, Q_v=0.43, best=0.58, ubc=1.07)
├── (a=4, N=1, Q_v=0.29, best=0.29, ubc=1.12)
├── (a=8, N=1, Q_v=0.35, best=0.35, ubc=1.18)
└── (a=14, N=1, Q_v=0.51, best=0.51, ubc=1.34)
├── (a=8, N=5, Q_v=0.47, best=0.67, ubc=1.04)
├── (a=3, N=1, Q_v=0.36, best=0.36, ubc=1.26)
├── (a=9, N=1, Q_v=0.33, best=0.33, ubc=1.22)
├── (a=14, N=1, Q_v=0.65, best=0.65, ubc=1.55)
└── (a=22, N=1, Q_v=0.33, best=0.33, ubc=1.22)
├── (a=14, N=3, Q_v=0.39, best=0.55, ubc=1.12)
├── (a=3, N=1, Q_v=0.36, best=0.36, ubc=1.10)
└── (a=8, N=1, Q_v=0.55, best=0.55, ubc=1.29)
├── (a=22, N=5, Q_v=0.52, best=0.60, ubc=1.09)
├── (a=3, N=1, Q_v=0.51, best=0.51, ubc=1.41)
├── (a=8, N=1, Q_v=0.56, best=0.56, ubc=1.46)
├── (a=14, N=1, Q_v=0.42, best=0.42, ubc=1.32)
└── (a=29, N=1, Q_v=0.53, best=0.53, ubc=1.42)
├── (a=29, N=3, Q_v=0.30, best=0.38, ubc=1.04)
├── (a=3, N=1, Q_v=0.31, best=0.31, ubc=1.05)
└── (a=30, N=1, Q_v=0.38, best=0.38, ubc=1.12)
└── (a=31, N=5, Q_v=0.47, best=0.60, ubc=1.04)
    ├── (a=3, N=1, Q_v=0.33, best=0.33, ubc=1.22)
    ├── (a=8, N=1, Q_v=0.55, best=0.55, ubc=1.44)
    ├── (a=14, N=1, Q_v=0.49, best=0.49, ubc=1.39)
    └── (a=22, N=1, Q_v=0.38, best=0.38, ubc=1.28)
├── (a=22, N=20, Q_v=0.41, best=0.53, ubc=0.75)
├── (a=3, N=3, Q_v=0.44, best=0.53, ubc=1.15)
├── (a=4, N=1, Q_v=0.47, best=0.47, ubc=1.21)
└── (a=31, N=1, Q_v=0.33, best=0.33, ubc=1.07)
├── (a=8, N=3, Q_v=0.31, best=0.38, ubc=1.02)
├── (a=3, N=1, Q_v=0.27, best=0.27, ubc=1.01)
└── (a=9, N=1, Q_v=0.27, best=0.27, ubc=1.01)
├── (a=13, N=3, Q_v=0.40, best=0.51, ubc=1.11)
├── (a=3, N=1, Q_v=0.51, best=0.51, ubc=1.25)
└── (a=8, N=1, Q_v=0.31, best=0.31, ubc=1.05)
├── (a=23, N=3, Q_v=0.30, best=0.45, ubc=1.01)
├── (a=3, N=1, Q_v=0.15, best=0.15, ubc=0.89)
└── (a=8, N=1, Q_v=0.31, best=0.31, ubc=1.05)
├── (a=29, N=3, Q_v=0.45, best=0.49, ubc=1.15)
├── (a=3, N=1, Q_v=0.49, best=0.49, ubc=1.23)
└── (a=8, N=1, Q_v=0.45, best=0.45, ubc=1.20)
└── (a=31, N=4, Q_v=0.48, best=0.51, ubc=1.09)
    ├── (a=3, N=1, Q_v=0.47, best=0.47, ubc=1.31)
    ├── (a=8, N=1, Q_v=0.51, best=0.51, ubc=1.34)
    └── (a=23, N=1, Q_v=0.49, best=0.49, ubc=1.32)
├── (a=29, N=17, Q_v=0.38, best=0.53, ubc=0.75)
├── (a=3, N=2, Q_v=0.16, best=0.29, ubc=1.01)
└── (a=4, N=1, Q_v=0.29, best=0.29, ubc=0.88)
├── (a=8, N=3, Q_v=0.43, best=0.49, ubc=1.12)
├── (a=3, N=1, Q_v=0.40, best=0.40, ubc=1.14)
└── (a=31, N=1, Q_v=0.40, best=0.40, ubc=1.14)
├── (a=13, N=3, Q_v=0.42, best=0.47, ubc=1.11)
├── (a=3, N=1, Q_v=0.40, best=0.40, ubc=1.14)
└── (a=30, N=1, Q_v=0.47, best=0.47, ubc=1.21)
├── (a=22, N=3, Q_v=0.47, best=0.53, ubc=1.16)
├── (a=3, N=1, Q_v=0.53, best=0.53, ubc=1.27)
└── (a=30, N=1, Q_v=0.49, best=0.49, ubc=1.23)
├── (a=30, N=2, Q_v=0.29, best=0.45, ubc=1.13)
└── (a=31, N=1, Q_v=0.13, best=0.13, ubc=0.72)
└── (a=31, N=3, Q_v=0.35, best=0.42, ubc=1.03)
    ├── (a=3, N=1, Q_v=0.33, best=0.33, ubc=1.07)
    └── (a=22, N=1, Q_v=0.29, best=0.29, ubc=1.03)
└── (a=31, N=25, Q_v=0.45, best=0.67, ubc=0.76)
    ├── (a=3, N=3, Q_v=0.35, best=0.45, ubc=1.08)
    ├── (a=4, N=1, Q_v=0.22, best=0.22, ubc=0.96)
    └── (a=32, N=1, Q_v=0.45, best=0.45, ubc=1.20)
    ├── (a=8, N=5, Q_v=0.52, best=0.58, ubc=1.08)
    ├── (a=3, N=1, Q_v=0.55, best=0.55, ubc=1.44)
    ├── (a=9, N=1, Q_v=0.58, best=0.58, ubc=1.48)
    ├── (a=13, N=1, Q_v=0.58, best=0.58, ubc=1.48)
    └── (a=29, N=1, Q_v=0.45, best=0.45, ubc=1.35)
    ├── (a=13, N=3, Q_v=0.28, best=0.47, ubc=1.02)
    ├── (a=3, N=1, Q_v=0.18, best=0.18, ubc=0.92)
    └── (a=22, N=1, Q_v=0.47, best=0.47, ubc=1.21)
    ├── (a=22, N=4, Q_v=0.44, best=0.56, ubc=1.08)
    ├── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.40)
    ├── (a=8, N=1, Q_v=0.49, best=0.49, ubc=1.32)
    └── (a=32, N=1, Q_v=0.15, best=0.15, ubc=0.98)
    ├── (a=29, N=3, Q_v=0.32, best=0.49, ubc=1.05)
    ├── (a=3, N=1, Q_v=0.49, best=0.49, ubc=1.23)
    └── (a=30, N=1, Q_v=0.07, best=0.07, ubc=0.81)
    └── (a=32, N=6, Q_v=0.55, best=0.67, ubc=1.07)
        ├── (a=3, N=1, Q_v=0.64, best=0.64, ubc=1.58)
        ├── (a=8, N=1, Q_v=0.49, best=0.49, ubc=1.44)
        ├── (a=13, N=1, Q_v=0.64, best=0.64, ubc=1.58)
        ├── (a=22, N=1, Q_v=0.49, best=0.49, ubc=1.44)
        └── (a=33, N=1, Q_v=0.67, best=0.67, ubc=1.62)
[16:53:53] INFO     selected action 13 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13]
(N=125, Q_v=0.42, best=0.75)
├── (a=3, N=13, Q_v=0.33, best=0.56, ubc=0.77)
├── (a=4, N=2, Q_v=0.30, best=0.40, ubc=1.10)
└── (a=8, N=1, Q_v=0.40, best=0.40, ubc=0.99)
├── (a=8, N=2, Q_v=0.37, best=0.49, ubc=1.17)
└── (a=14, N=1, Q_v=0.49, best=0.49, ubc=1.08)
├── (a=14, N=2, Q_v=0.41, best=0.51, ubc=1.21)
└── (a=15, N=1, Q_v=0.31, best=0.31, ubc=0.90)
├── (a=22, N=2, Q_v=0.38, best=0.56, ubc=1.18)
└── (a=31, N=1, Q_v=0.20, best=0.20, ubc=0.79)
├── (a=29, N=2, Q_v=0.22, best=0.45, ubc=1.02)
└── (a=4, N=1, Q_v=-0.02, best=-0.02, ubc=0.57)
└── (a=31, N=2, Q_v=0.39, best=0.47, ubc=1.19)
    └── (a=22, N=1, Q_v=0.47, best=0.47, ubc=1.06)
├── (a=8, N=22, Q_v=0.44, best=0.67, ubc=0.77)
├── (a=3, N=3, Q_v=0.33, best=0.42, ubc=1.05)
├── (a=4, N=1, Q_v=0.33, best=0.33, ubc=1.07)
└── (a=9, N=1, Q_v=0.25, best=0.25, ubc=1.00)
├── (a=9, N=3, Q_v=0.32, best=0.44, ubc=1.03)
├── (a=3, N=1, Q_v=0.16, best=0.16, ubc=0.90)
└── (a=10, N=1, Q_v=0.35, best=0.35, ubc=1.09)
├── (a=14, N=5, Q_v=0.57, best=0.67, ubc=1.13)
├── (a=3, N=1, Q_v=0.55, best=0.55, ubc=1.44)
├── (a=9, N=1, Q_v=0.47, best=0.47, ubc=1.37)
├── (a=15, N=1, Q_v=0.55, best=0.55, ubc=1.44)
└── (a=22, N=1, Q_v=0.67, best=0.67, ubc=1.57)
├── (a=22, N=5, Q_v=0.54, best=0.62, ubc=1.10)
├── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.46)
├── (a=9, N=1, Q_v=0.49, best=0.49, ubc=1.39)
├── (a=14, N=1, Q_v=0.58, best=0.58, ubc=1.48)
└── (a=29, N=1, Q_v=0.45, best=0.45, ubc=1.35)
├── (a=29, N=2, Q_v=0.26, best=0.33, ubc=1.14)
└── (a=3, N=1, Q_v=0.20, best=0.20, ubc=0.79)
└── (a=31, N=3, Q_v=0.41, best=0.49, ubc=1.13)
    ├── (a=3, N=1, Q_v=0.36, best=0.36, ubc=1.10)
    └── (a=22, N=1, Q_v=0.38, best=0.38, ubc=1.12)
├── (a=14, N=19, Q_v=0.41, best=0.75, ubc=0.77)
├── (a=3, N=4, Q_v=0.53, best=0.69, ubc=1.14)
├── (a=4, N=1, Q_v=0.58, best=0.58, ubc=1.41)
├── (a=8, N=1, Q_v=0.25, best=0.25, ubc=1.09)
└── (a=15, N=1, Q_v=0.69, best=0.69, ubc=1.52)
├── (a=8, N=4, Q_v=0.50, best=0.75, ubc=1.10)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=9, N=1, Q_v=0.35, best=0.35, ubc=1.18)
└── (a=31, N=1, Q_v=0.36, best=0.36, ubc=1.20)
├── (a=15, N=3, Q_v=0.31, best=0.55, ubc=1.01)
├── (a=3, N=1, Q_v=0.18, best=0.18, ubc=0.92)
└── (a=8, N=1, Q_v=0.20, best=0.20, ubc=0.94)
├── (a=22, N=3, Q_v=0.45, best=0.56, ubc=1.15)
├── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=31, N=1, Q_v=0.29, best=0.29, ubc=1.03)
├── (a=29, N=2, Q_v=0.20, best=0.36, ubc=1.06)
└── (a=3, N=1, Q_v=0.36, best=0.36, ubc=0.95)
└── (a=31, N=2, Q_v=0.22, best=0.24, ubc=1.08)
    └── (a=29, N=1, Q_v=0.20, best=0.20, ubc=0.79)
├── (a=22, N=29, Q_v=0.47, best=0.75, ubc=0.76)
├── (a=3, N=4, Q_v=0.43, best=0.53, ubc=1.08)
├── (a=4, N=1, Q_v=0.51, best=0.51, ubc=1.34)
├── (a=8, N=1, Q_v=0.53, best=0.53, ubc=1.36)
└── (a=31, N=1, Q_v=0.36, best=0.36, ubc=1.20)
├── (a=8, N=6, Q_v=0.53, best=0.67, ubc=1.06)
├── (a=3, N=1, Q_v=0.67, best=0.67, ubc=1.62)
├── (a=9, N=1, Q_v=0.55, best=0.55, ubc=1.49)
├── (a=14, N=1, Q_v=0.56, best=0.56, ubc=1.51)
├── (a=23, N=1, Q_v=0.56, best=0.56, ubc=1.51)
└── (a=29, N=1, Q_v=0.36, best=0.36, ubc=1.31)
├── (a=14, N=6, Q_v=0.58, best=0.75, ubc=1.11)
├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.55)
├── (a=8, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=15, N=1, Q_v=0.56, best=0.56, ubc=1.51)
├── (a=23, N=1, Q_v=0.60, best=0.60, ubc=1.55)
└── (a=29, N=1, Q_v=0.38, best=0.38, ubc=1.33)
├── (a=23, N=3, Q_v=0.32, best=0.56, ubc=1.06)
├── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=8, N=1, Q_v=0.31, best=0.31, ubc=1.05)
├── (a=29, N=4, Q_v=0.45, best=0.55, ubc=1.10)
├── (a=3, N=1, Q_v=0.49, best=0.49, ubc=1.32)
├── (a=8, N=1, Q_v=0.49, best=0.49, ubc=1.32)
└── (a=23, N=1, Q_v=0.27, best=0.27, ubc=1.11)
└── (a=31, N=5, Q_v=0.43, best=0.51, ubc=1.01)
    ├── (a=3, N=1, Q_v=0.51, best=0.51, ubc=1.41)
    ├── (a=8, N=1, Q_v=0.38, best=0.38, ubc=1.28)
    ├── (a=14, N=1, Q_v=0.24, best=0.24, ubc=1.13)
    └── (a=32, N=1, Q_v=0.49, best=0.49, ubc=1.39)
├── (a=29, N=19, Q_v=0.38, best=0.69, ubc=0.74)
├── (a=3, N=3, Q_v=0.32, best=0.56, ubc=1.02)
├── (a=4, N=1, Q_v=-0.04, best=-0.04, ubc=0.70)
└── (a=22, N=1, Q_v=0.56, best=0.56, ubc=1.30)
├── (a=8, N=4, Q_v=0.40, best=0.69, ubc=1.01)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=9, N=1, Q_v=0.04, best=0.04, ubc=0.87)
└── (a=31, N=1, Q_v=0.69, best=0.69, ubc=1.52)
├── (a=14, N=3, Q_v=0.40, best=0.65, ubc=1.10)
├── (a=3, N=1, Q_v=0.25, best=0.25, ubc=1.00)
└── (a=15, N=1, Q_v=0.29, best=0.29, ubc=1.03)
├── (a=22, N=3, Q_v=0.49, best=0.49, ubc=1.19)
├── (a=3, N=1, Q_v=0.49, best=0.49, ubc=1.23)
└── (a=30, N=1, Q_v=0.49, best=0.49, ubc=1.23)
├── (a=30, N=2, Q_v=0.15, best=0.25, ubc=1.00)
└── (a=31, N=1, Q_v=0.25, best=0.25, ubc=0.84)
└── (a=31, N=3, Q_v=0.45, best=0.69, ubc=1.15)
    ├── (a=3, N=1, Q_v=0.38, best=0.38, ubc=1.12)
    └── (a=32, N=1, Q_v=0.29, best=0.29, ubc=1.03)
└── (a=31, N=22, Q_v=0.43, best=0.69, ubc=0.76)
    ├── (a=3, N=2, Q_v=0.24, best=0.31, ubc=1.12)
    └── (a=4, N=1, Q_v=0.16, best=0.16, ubc=0.75)
    ├── (a=8, N=3, Q_v=0.21, best=0.65, ubc=0.92)
    ├── (a=3, N=1, Q_v=-0.13, best=-0.13, ubc=0.61)
    └── (a=32, N=1, Q_v=0.65, best=0.65, ubc=1.40)
    ├── (a=14, N=3, Q_v=0.36, best=0.53, ubc=1.08)
    ├── (a=3, N=1, Q_v=0.45, best=0.45, ubc=1.20)
    └── (a=29, N=1, Q_v=0.53, best=0.53, ubc=1.27)
    ├── (a=22, N=5, Q_v=0.53, best=0.69, ubc=1.08)
    ├── (a=3, N=1, Q_v=0.62, best=0.62, ubc=1.52)
    ├── (a=8, N=1, Q_v=0.69, best=0.69, ubc=1.59)
    ├── (a=14, N=1, Q_v=0.38, best=0.38, ubc=1.28)
    └── (a=29, N=1, Q_v=0.53, best=0.53, ubc=1.42)
    ├── (a=29, N=4, Q_v=0.53, best=0.62, ubc=1.15)
    ├── (a=3, N=1, Q_v=0.53, best=0.53, ubc=1.36)
    ├── (a=8, N=1, Q_v=0.62, best=0.62, ubc=1.45)
    └── (a=14, N=1, Q_v=0.36, best=0.36, ubc=1.20)
    └── (a=32, N=4, Q_v=0.53, best=0.67, ubc=1.15)
        ├── (a=3, N=1, Q_v=0.67, best=0.67, ubc=1.51)
        ├── (a=8, N=1, Q_v=0.47, best=0.47, ubc=1.31)
        └── (a=14, N=1, Q_v=0.56, best=0.56, ubc=1.40)
[16:53:56] INFO     selected action 22 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22]
(N=125, Q_v=0.46, best=0.84)
├── (a=3, N=19, Q_v=0.43, best=0.58, ubc=0.79)
├── (a=4, N=3, Q_v=0.45, best=0.56, ubc=1.15)
├── (a=5, N=1, Q_v=0.27, best=0.27, ubc=1.01)
└── (a=31, N=1, Q_v=0.56, best=0.56, ubc=1.30)
├── (a=8, N=3, Q_v=0.42, best=0.56, ubc=1.12)
├── (a=4, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=9, N=1, Q_v=0.33, best=0.33, ubc=1.07)
├── (a=14, N=3, Q_v=0.45, best=0.56, ubc=1.15)
├── (a=4, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=15, N=1, Q_v=0.38, best=0.38, ubc=1.12)
├── (a=23, N=2, Q_v=0.35, best=0.45, ubc=1.20)
└── (a=31, N=1, Q_v=0.24, best=0.24, ubc=0.82)
├── (a=29, N=3, Q_v=0.39, best=0.56, ubc=1.09)
├── (a=4, N=1, Q_v=0.25, best=0.25, ubc=1.00)
└── (a=8, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=31, N=4, Q_v=0.46, best=0.58, ubc=1.07)
    ├── (a=4, N=1, Q_v=0.55, best=0.55, ubc=1.38)
    ├── (a=8, N=1, Q_v=0.24, best=0.24, ubc=1.07)
    └── (a=14, N=1, Q_v=0.47, best=0.47, ubc=1.31)
├── (a=8, N=14, Q_v=0.39, best=0.69, ubc=0.80)
├── (a=3, N=2, Q_v=0.31, best=0.36, ubc=1.12)
└── (a=14, N=1, Q_v=0.36, best=0.36, ubc=0.95)
├── (a=9, N=2, Q_v=0.40, best=0.47, ubc=1.21)
└── (a=29, N=1, Q_v=0.33, best=0.33, ubc=0.92)
├── (a=14, N=2, Q_v=0.36, best=0.44, ubc=1.18)
└── (a=15, N=1, Q_v=0.29, best=0.29, ubc=0.88)
├── (a=23, N=2, Q_v=0.38, best=0.40, ubc=1.19)
└── (a=29, N=1, Q_v=0.36, best=0.36, ubc=0.95)
├── (a=29, N=3, Q_v=0.38, best=0.49, ubc=1.04)
├── (a=3, N=1, Q_v=0.15, best=0.15, ubc=0.89)
└── (a=30, N=1, Q_v=0.49, best=0.49, ubc=1.23)
└── (a=31, N=2, Q_v=0.35, best=0.51, ubc=1.17)
    └── (a=9, N=1, Q_v=0.20, best=0.20, ubc=0.79)
├── (a=14, N=28, Q_v=0.51, best=0.65, ubc=0.80)
├── (a=3, N=4, Q_v=0.47, best=0.56, ubc=1.11)
├── (a=4, N=1, Q_v=0.38, best=0.38, ubc=1.21)
├── (a=8, N=1, Q_v=0.51, best=0.51, ubc=1.34)
└── (a=29, N=1, Q_v=0.42, best=0.42, ubc=1.25)
├── (a=8, N=5, Q_v=0.50, best=0.65, ubc=1.08)
├── (a=3, N=1, Q_v=0.53, best=0.53, ubc=1.42)
├── (a=9, N=1, Q_v=0.25, best=0.25, ubc=1.15)
├── (a=15, N=1, Q_v=0.62, best=0.62, ubc=1.52)
└── (a=23, N=1, Q_v=0.45, best=0.45, ubc=1.35)
├── (a=15, N=4, Q_v=0.45, best=0.56, ubc=1.10)
├── (a=3, N=1, Q_v=0.40, best=0.40, ubc=1.23)
├── (a=8, N=1, Q_v=0.42, best=0.42, ubc=1.25)
└── (a=16, N=1, Q_v=0.56, best=0.56, ubc=1.40)
├── (a=23, N=5, Q_v=0.51, best=0.58, ubc=1.08)
├── (a=3, N=1, Q_v=0.51, best=0.51, ubc=1.41)
├── (a=8, N=1, Q_v=0.51, best=0.51, ubc=1.41)
├── (a=15, N=1, Q_v=0.58, best=0.58, ubc=1.48)
└── (a=24, N=1, Q_v=0.40, best=0.40, ubc=1.30)
├── (a=29, N=5, Q_v=0.58, best=0.65, ubc=1.16)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.55)
├── (a=8, N=1, Q_v=0.60, best=0.60, ubc=1.50)
├── (a=15, N=1, Q_v=0.53, best=0.53, ubc=1.42)
└── (a=23, N=1, Q_v=0.56, best=0.56, ubc=1.46)
└── (a=31, N=4, Q_v=0.50, best=0.60, ubc=1.15)
    ├── (a=3, N=1, Q_v=0.53, best=0.53, ubc=1.36)
    ├── (a=8, N=1, Q_v=0.60, best=0.60, ubc=1.43)
    └── (a=23, N=1, Q_v=0.55, best=0.55, ubc=1.38)
├── (a=23, N=21, Q_v=0.46, best=0.73, ubc=0.80)
├── (a=3, N=4, Q_v=0.47, best=0.73, ubc=1.08)
├── (a=4, N=1, Q_v=0.51, best=0.51, ubc=1.34)
├── (a=8, N=1, Q_v=0.73, best=0.73, ubc=1.56)
└── (a=14, N=1, Q_v=0.31, best=0.31, ubc=1.14)
├── (a=8, N=4, Q_v=0.54, best=0.62, ubc=1.15)
├── (a=3, N=1, Q_v=0.55, best=0.55, ubc=1.38)
├── (a=9, N=1, Q_v=0.49, best=0.49, ubc=1.32)
└── (a=14, N=1, Q_v=0.62, best=0.62, ubc=1.45)
├── (a=14, N=3, Q_v=0.49, best=0.53, ubc=1.20)
├── (a=3, N=1, Q_v=0.49, best=0.49, ubc=1.23)
└── (a=8, N=1, Q_v=0.45, best=0.45, ubc=1.20)
├── (a=24, N=3, Q_v=0.36, best=0.56, ubc=1.07)
├── (a=3, N=1, Q_v=0.05, best=0.05, ubc=0.80)
└── (a=14, N=1, Q_v=0.56, best=0.56, ubc=1.30)
├── (a=29, N=2, Q_v=0.25, best=0.53, ubc=1.13)
└── (a=31, N=1, Q_v=0.53, best=0.53, ubc=1.12)
└── (a=31, N=4, Q_v=0.55, best=0.65, ubc=1.17)
    ├── (a=3, N=1, Q_v=0.53, best=0.53, ubc=1.36)
    ├── (a=8, N=1, Q_v=0.65, best=0.65, ubc=1.49)
    └── (a=24, N=1, Q_v=0.56, best=0.56, ubc=1.40)
├── (a=29, N=18, Q_v=0.43, best=0.60, ubc=0.80)
├── (a=3, N=3, Q_v=0.48, best=0.55, ubc=1.17)
├── (a=4, N=1, Q_v=0.55, best=0.55, ubc=1.29)
└── (a=31, N=1, Q_v=0.47, best=0.47, ubc=1.21)
├── (a=8, N=3, Q_v=0.48, best=0.56, ubc=1.17)
├── (a=3, N=1, Q_v=0.42, best=0.42, ubc=1.16)
└── (a=9, N=1, Q_v=0.45, best=0.45, ubc=1.20)
├── (a=14, N=3, Q_v=0.47, best=0.60, ubc=1.16)
├── (a=3, N=1, Q_v=0.40, best=0.40, ubc=1.14)
└── (a=31, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=23, N=3, Q_v=0.50, best=0.56, ubc=1.20)
├── (a=3, N=1, Q_v=0.51, best=0.51, ubc=1.25)
└── (a=8, N=1, Q_v=0.56, best=0.56, ubc=1.30)
├── (a=30, N=2, Q_v=0.37, best=0.44, ubc=1.22)
└── (a=14, N=1, Q_v=0.44, best=0.44, ubc=1.02)
└── (a=31, N=3, Q_v=0.34, best=0.56, ubc=1.03)
    ├── (a=3, N=1, Q_v=0.22, best=0.22, ubc=0.96)
    └── (a=30, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=31, N=24, Q_v=0.48, best=0.84, ubc=0.80)
    ├── (a=3, N=4, Q_v=0.46, best=0.58, ubc=1.09)
    ├── (a=4, N=1, Q_v=0.58, best=0.58, ubc=1.41)
    ├── (a=8, N=1, Q_v=0.49, best=0.49, ubc=1.32)
    └── (a=32, N=1, Q_v=0.42, best=0.42, ubc=1.25)
    ├── (a=8, N=5, Q_v=0.56, best=0.84, ubc=1.13)
    ├── (a=3, N=1, Q_v=0.53, best=0.53, ubc=1.42)
    ├── (a=9, N=1, Q_v=0.58, best=0.58, ubc=1.48)
    ├── (a=14, N=1, Q_v=0.40, best=0.40, ubc=1.30)
    └── (a=32, N=1, Q_v=0.84, best=0.84, ubc=1.73)
    ├── (a=14, N=4, Q_v=0.54, best=0.62, ubc=1.17)
    ├── (a=3, N=1, Q_v=0.42, best=0.42, ubc=1.25)
    ├── (a=8, N=1, Q_v=0.56, best=0.56, ubc=1.40)
    └── (a=29, N=1, Q_v=0.62, best=0.62, ubc=1.45)
    ├── (a=23, N=3, Q_v=0.32, best=0.60, ubc=1.04)
    ├── (a=3, N=1, Q_v=0.02, best=0.02, ubc=0.76)
    └── (a=29, N=1, Q_v=0.60, best=0.60, ubc=1.34)
    ├── (a=29, N=4, Q_v=0.50, best=0.69, ubc=1.13)
    ├── (a=3, N=1, Q_v=0.33, best=0.33, ubc=1.16)
    ├── (a=8, N=1, Q_v=0.69, best=0.69, ubc=1.52)
    └── (a=14, N=1, Q_v=0.56, best=0.56, ubc=1.40)
    └── (a=32, N=3, Q_v=0.39, best=0.45, ubc=1.12)
        ├── (a=3, N=1, Q_v=0.45, best=0.45, ubc=1.20)
        └── (a=8, N=1, Q_v=0.31, best=0.31, ubc=1.05)
[16:53:59] INFO     selected action 14 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14]
(N=125, Q_v=0.47, best=0.73)
├── (a=3, N=19, Q_v=0.46, best=0.65, ubc=0.82)
├── (a=4, N=3, Q_v=0.45, best=0.58, ubc=1.15)
├── (a=5, N=1, Q_v=0.42, best=0.42, ubc=1.16)
└── (a=8, N=1, Q_v=0.36, best=0.36, ubc=1.10)
├── (a=8, N=2, Q_v=0.19, best=0.24, ubc=1.05)
└── (a=23, N=1, Q_v=0.15, best=0.15, ubc=0.73)
├── (a=15, N=4, Q_v=0.57, best=0.60, ubc=1.18)
├── (a=4, N=1, Q_v=0.56, best=0.56, ubc=1.40)
├── (a=8, N=1, Q_v=0.60, best=0.60, ubc=1.43)
└── (a=23, N=1, Q_v=0.60, best=0.60, ubc=1.43)
├── (a=23, N=4, Q_v=0.53, best=0.60, ubc=1.13)
├── (a=4, N=1, Q_v=0.60, best=0.60, ubc=1.43)
├── (a=8, N=1, Q_v=0.42, best=0.42, ubc=1.25)
└── (a=15, N=1, Q_v=0.53, best=0.53, ubc=1.36)
├── (a=29, N=2, Q_v=0.31, best=0.56, ubc=1.17)
└── (a=30, N=1, Q_v=0.05, best=0.05, ubc=0.64)
└── (a=31, N=3, Q_v=0.53, best=0.65, ubc=1.23)
    ├── (a=4, N=1, Q_v=0.42, best=0.42, ubc=1.16)
    └── (a=8, N=1, Q_v=0.65, best=0.65, ubc=1.40)
├── (a=8, N=20, Q_v=0.46, best=0.65, ubc=0.81)
├── (a=3, N=3, Q_v=0.50, best=0.56, ubc=1.20)
├── (a=4, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=29, N=1, Q_v=0.55, best=0.55, ubc=1.29)
├── (a=9, N=4, Q_v=0.46, best=0.58, ubc=1.07)
├── (a=3, N=1, Q_v=0.58, best=0.58, ubc=1.41)
├── (a=10, N=1, Q_v=0.20, best=0.20, ubc=1.03)
└── (a=29, N=1, Q_v=0.56, best=0.56, ubc=1.40)
├── (a=15, N=4, Q_v=0.58, best=0.65, ubc=1.19)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=9, N=1, Q_v=0.40, best=0.40, ubc=1.23)
└── (a=31, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=23, N=2, Q_v=0.31, best=0.44, ubc=1.17)
└── (a=3, N=1, Q_v=0.44, best=0.44, ubc=1.02)
├── (a=29, N=3, Q_v=0.42, best=0.53, ubc=1.12)
├── (a=3, N=1, Q_v=0.47, best=0.47, ubc=1.21)
└── (a=31, N=1, Q_v=0.25, best=0.25, ubc=1.00)
└── (a=31, N=3, Q_v=0.51, best=0.62, ubc=1.22)
    ├── (a=3, N=1, Q_v=0.44, best=0.44, ubc=1.18)
    └── (a=29, N=1, Q_v=0.62, best=0.62, ubc=1.36)
├── (a=15, N=21, Q_v=0.47, best=0.65, ubc=0.81)
├── (a=3, N=3, Q_v=0.35, best=0.45, ubc=1.06)
├── (a=4, N=1, Q_v=0.20, best=0.20, ubc=0.94)
└── (a=16, N=1, Q_v=0.45, best=0.45, ubc=1.20)
├── (a=8, N=3, Q_v=0.42, best=0.55, ubc=1.13)
├── (a=3, N=1, Q_v=0.47, best=0.47, ubc=1.21)
└── (a=31, N=1, Q_v=0.55, best=0.55, ubc=1.29)
├── (a=16, N=4, Q_v=0.50, best=0.56, ubc=1.12)
├── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.40)
├── (a=8, N=1, Q_v=0.51, best=0.51, ubc=1.34)
└── (a=29, N=1, Q_v=0.40, best=0.40, ubc=1.23)
├── (a=23, N=3, Q_v=0.48, best=0.60, ubc=1.20)
├── (a=3, N=1, Q_v=0.40, best=0.40, ubc=1.14)
└── (a=16, N=1, Q_v=0.45, best=0.45, ubc=1.20)
├── (a=29, N=4, Q_v=0.55, best=0.65, ubc=1.17)
├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.43)
├── (a=8, N=1, Q_v=0.47, best=0.47, ubc=1.31)
└── (a=16, N=1, Q_v=0.65, best=0.65, ubc=1.49)
└── (a=31, N=3, Q_v=0.49, best=0.51, ubc=1.20)
    ├── (a=3, N=1, Q_v=0.49, best=0.49, ubc=1.23)
    └── (a=8, N=1, Q_v=0.47, best=0.47, ubc=1.21)
├── (a=23, N=20, Q_v=0.46, best=0.60, ubc=0.80)
├── (a=3, N=3, Q_v=0.40, best=0.44, ubc=1.11)
├── (a=4, N=1, Q_v=0.36, best=0.36, ubc=1.10)
└── (a=29, N=1, Q_v=0.44, best=0.44, ubc=1.18)
├── (a=8, N=3, Q_v=0.45, best=0.53, ubc=1.15)
├── (a=3, N=1, Q_v=0.33, best=0.33, ubc=1.07)
└── (a=9, N=1, Q_v=0.49, best=0.49, ubc=1.23)
├── (a=15, N=3, Q_v=0.48, best=0.56, ubc=1.19)
├── (a=3, N=1, Q_v=0.42, best=0.42, ubc=1.16)
└── (a=8, N=1, Q_v=0.47, best=0.47, ubc=1.21)
├── (a=24, N=3, Q_v=0.48, best=0.55, ubc=1.19)
├── (a=3, N=1, Q_v=0.53, best=0.53, ubc=1.27)
└── (a=31, N=1, Q_v=0.55, best=0.55, ubc=1.29)
├── (a=29, N=4, Q_v=0.47, best=0.60, ubc=1.08)
├── (a=3, N=1, Q_v=0.42, best=0.42, ubc=1.25)
├── (a=8, N=1, Q_v=0.35, best=0.35, ubc=1.18)
└── (a=31, N=1, Q_v=0.60, best=0.60, ubc=1.43)
└── (a=31, N=3, Q_v=0.48, best=0.55, ubc=1.19)
    ├── (a=3, N=1, Q_v=0.45, best=0.45, ubc=1.20)
    └── (a=8, N=1, Q_v=0.55, best=0.55, ubc=1.29)
├── (a=29, N=19, Q_v=0.45, best=0.60, ubc=0.81)
├── (a=3, N=2, Q_v=0.35, best=0.53, ubc=1.21)
└── (a=31, N=1, Q_v=0.18, best=0.18, ubc=0.77)
├── (a=8, N=3, Q_v=0.39, best=0.53, ubc=1.09)
├── (a=3, N=1, Q_v=0.24, best=0.24, ubc=0.98)
└── (a=30, N=1, Q_v=0.40, best=0.40, ubc=1.14)
├── (a=15, N=4, Q_v=0.56, best=0.60, ubc=1.17)
├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.43)
├── (a=8, N=1, Q_v=0.53, best=0.53, ubc=1.36)
└── (a=23, N=1, Q_v=0.53, best=0.53, ubc=1.36)
├── (a=23, N=3, Q_v=0.41, best=0.45, ubc=1.11)
├── (a=3, N=1, Q_v=0.44, best=0.44, ubc=1.18)
└── (a=30, N=1, Q_v=0.45, best=0.45, ubc=1.20)
├── (a=30, N=3, Q_v=0.43, best=0.55, ubc=1.13)
├── (a=3, N=1, Q_v=0.33, best=0.33, ubc=1.07)
└── (a=15, N=1, Q_v=0.42, best=0.42, ubc=1.16)
└── (a=31, N=3, Q_v=0.50, best=0.60, ubc=1.20)
    ├── (a=3, N=1, Q_v=0.55, best=0.55, ubc=1.29)
    └── (a=8, N=1, Q_v=0.35, best=0.35, ubc=1.09)
└── (a=31, N=25, Q_v=0.50, best=0.73, ubc=0.81)
    ├── (a=3, N=1, Q_v=-0.15, best=-0.15, ubc=1.12)
    ├── (a=8, N=3, Q_v=0.41, best=0.56, ubc=1.14)
    ├── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.30)
    └── (a=29, N=1, Q_v=0.18, best=0.18, ubc=0.92)
    ├── (a=15, N=6, Q_v=0.61, best=0.65, ubc=1.13)
    ├── (a=3, N=1, Q_v=0.55, best=0.55, ubc=1.49)
    ├── (a=8, N=1, Q_v=0.60, best=0.60, ubc=1.55)
    ├── (a=16, N=1, Q_v=0.62, best=0.62, ubc=1.56)
    ├── (a=23, N=1, Q_v=0.60, best=0.60, ubc=1.55)
    └── (a=29, N=1, Q_v=0.65, best=0.65, ubc=1.60)
    ├── (a=23, N=4, Q_v=0.51, best=0.62, ubc=1.14)
    ├── (a=3, N=1, Q_v=0.42, best=0.42, ubc=1.25)
    ├── (a=8, N=1, Q_v=0.40, best=0.40, ubc=1.23)
    └── (a=15, N=1, Q_v=0.62, best=0.62, ubc=1.45)
    ├── (a=29, N=5, Q_v=0.53, best=0.73, ubc=1.09)
    ├── (a=3, N=1, Q_v=0.42, best=0.42, ubc=1.32)
    ├── (a=8, N=1, Q_v=0.36, best=0.36, ubc=1.26)
    ├── (a=15, N=1, Q_v=0.60, best=0.60, ubc=1.50)
    └── (a=23, N=1, Q_v=0.53, best=0.53, ubc=1.42)
    └── (a=32, N=5, Q_v=0.58, best=0.64, ubc=1.15)
        ├── (a=3, N=1, Q_v=0.55, best=0.55, ubc=1.44)
        ├── (a=8, N=1, Q_v=0.64, best=0.64, ubc=1.53)
        ├── (a=15, N=1, Q_v=0.60, best=0.60, ubc=1.50)
        └── (a=29, N=1, Q_v=0.56, best=0.56, ubc=1.46)
[16:54:02] INFO     selected action 31 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31]
(N=125, Q_v=0.49, best=0.76)
├── (a=3, N=19, Q_v=0.47, best=0.65, ubc=0.83)
├── (a=4, N=2, Q_v=0.27, best=0.42, ubc=1.13)
└── (a=5, N=1, Q_v=0.42, best=0.42, ubc=1.01)
├── (a=8, N=4, Q_v=0.51, best=0.55, ubc=1.12)
├── (a=4, N=1, Q_v=0.55, best=0.55, ubc=1.38)
├── (a=9, N=1, Q_v=0.44, best=0.44, ubc=1.27)
└── (a=29, N=1, Q_v=0.55, best=0.55, ubc=1.38)
├── (a=15, N=3, Q_v=0.49, best=0.65, ubc=1.19)
├── (a=4, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=8, N=1, Q_v=0.65, best=0.65, ubc=1.40)
├── (a=23, N=3, Q_v=0.45, best=0.60, ubc=1.15)
├── (a=4, N=1, Q_v=0.18, best=0.18, ubc=0.92)
└── (a=29, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=29, N=3, Q_v=0.50, best=0.60, ubc=1.20)
├── (a=4, N=1, Q_v=0.60, best=0.60, ubc=1.34)
└── (a=23, N=1, Q_v=0.36, best=0.36, ubc=1.10)
└── (a=32, N=3, Q_v=0.49, best=0.56, ubc=1.19)
    ├── (a=4, N=1, Q_v=0.42, best=0.42, ubc=1.16)
    └── (a=15, N=1, Q_v=0.49, best=0.49, ubc=1.23)
├── (a=8, N=21, Q_v=0.49, best=0.76, ubc=0.83)
├── (a=3, N=4, Q_v=0.60, best=0.73, ubc=1.21)
├── (a=4, N=1, Q_v=0.33, best=0.33, ubc=1.16)
├── (a=9, N=1, Q_v=0.62, best=0.62, ubc=1.45)
└── (a=29, N=1, Q_v=0.71, best=0.71, ubc=1.54)
├── (a=9, N=3, Q_v=0.44, best=0.56, ubc=1.15)
├── (a=3, N=1, Q_v=0.42, best=0.42, ubc=1.16)
└── (a=10, N=1, Q_v=0.35, best=0.35, ubc=1.09)
├── (a=15, N=4, Q_v=0.59, best=0.76, ubc=1.21)
├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=9, N=1, Q_v=0.62, best=0.62, ubc=1.45)
└── (a=29, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=23, N=3, Q_v=0.41, best=0.45, ubc=1.12)
├── (a=3, N=1, Q_v=0.45, best=0.45, ubc=1.20)
└── (a=9, N=1, Q_v=0.42, best=0.42, ubc=1.16)
├── (a=29, N=3, Q_v=0.52, best=0.65, ubc=1.23)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=9, N=1, Q_v=0.49, best=0.49, ubc=1.23)
└── (a=32, N=3, Q_v=0.40, best=0.60, ubc=1.11)
    ├── (a=3, N=1, Q_v=0.25, best=0.25, ubc=1.00)
    └── (a=15, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=15, N=30, Q_v=0.54, best=0.75, ubc=0.83)
├── (a=3, N=5, Q_v=0.59, best=0.64, ubc=1.18)
├── (a=4, N=1, Q_v=0.56, best=0.56, ubc=1.46)
├── (a=8, N=1, Q_v=0.60, best=0.60, ubc=1.50)
├── (a=16, N=1, Q_v=0.60, best=0.60, ubc=1.50)
└── (a=23, N=1, Q_v=0.64, best=0.64, ubc=1.53)
├── (a=8, N=5, Q_v=0.58, best=0.65, ubc=1.16)
├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.50)
├── (a=9, N=1, Q_v=0.65, best=0.65, ubc=1.55)
├── (a=16, N=1, Q_v=0.60, best=0.60, ubc=1.50)
└── (a=23, N=1, Q_v=0.62, best=0.62, ubc=1.52)
├── (a=16, N=6, Q_v=0.54, best=0.71, ubc=1.07)
├── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.51)
├── (a=8, N=1, Q_v=0.60, best=0.60, ubc=1.55)
├── (a=17, N=1, Q_v=0.65, best=0.65, ubc=1.60)
├── (a=23, N=1, Q_v=0.71, best=0.71, ubc=1.66)
└── (a=29, N=1, Q_v=0.05, best=0.05, ubc=1.00)
├── (a=23, N=3, Q_v=0.41, best=0.60, ubc=1.16)
├── (a=3, N=1, Q_v=0.02, best=0.02, ubc=0.76)
└── (a=24, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=29, N=5, Q_v=0.54, best=0.62, ubc=1.12)
├── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.46)
├── (a=8, N=1, Q_v=0.62, best=0.62, ubc=1.52)
├── (a=16, N=1, Q_v=0.51, best=0.51, ubc=1.41)
└── (a=23, N=1, Q_v=0.47, best=0.47, ubc=1.37)
└── (a=32, N=5, Q_v=0.55, best=0.75, ubc=1.13)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=8, N=1, Q_v=0.35, best=0.35, ubc=1.24)
    ├── (a=16, N=1, Q_v=0.60, best=0.60, ubc=1.50)
    └── (a=23, N=1, Q_v=0.47, best=0.47, ubc=1.37)
├── (a=23, N=18, Q_v=0.46, best=0.65, ubc=0.83)
├── (a=3, N=3, Q_v=0.53, best=0.60, ubc=1.22)
├── (a=4, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=15, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=8, N=3, Q_v=0.42, best=0.56, ubc=1.11)
├── (a=3, N=1, Q_v=0.36, best=0.36, ubc=1.10)
└── (a=29, N=1, Q_v=0.33, best=0.33, ubc=1.07)
├── (a=15, N=4, Q_v=0.57, best=0.65, ubc=1.17)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=8, N=1, Q_v=0.60, best=0.60, ubc=1.43)
└── (a=32, N=1, Q_v=0.44, best=0.44, ubc=1.27)
├── (a=24, N=2, Q_v=0.24, best=0.33, ubc=1.09)
└── (a=3, N=1, Q_v=0.15, best=0.15, ubc=0.73)
├── (a=29, N=3, Q_v=0.49, best=0.60, ubc=1.18)
├── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=24, N=1, Q_v=0.31, best=0.31, ubc=1.05)
└── (a=32, N=2, Q_v=0.40, best=0.65, ubc=1.25)
    └── (a=15, N=1, Q_v=0.65, best=0.65, ubc=1.24)
├── (a=29, N=22, Q_v=0.50, best=0.75, ubc=0.83)
├── (a=3, N=4, Q_v=0.49, best=0.60, ubc=1.11)
├── (a=4, N=1, Q_v=0.60, best=0.60, ubc=1.43)
├── (a=8, N=1, Q_v=0.40, best=0.40, ubc=1.23)
└── (a=30, N=1, Q_v=0.40, best=0.40, ubc=1.23)
├── (a=8, N=3, Q_v=0.47, best=0.65, ubc=1.19)
├── (a=3, N=1, Q_v=0.44, best=0.44, ubc=1.18)
└── (a=32, N=1, Q_v=0.33, best=0.33, ubc=1.07)
├── (a=15, N=4, Q_v=0.52, best=0.60, ubc=1.14)
├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.43)
├── (a=8, N=1, Q_v=0.42, best=0.42, ubc=1.25)
└── (a=16, N=1, Q_v=0.55, best=0.55, ubc=1.38)
├── (a=23, N=4, Q_v=0.52, best=0.60, ubc=1.14)
├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.43)
├── (a=8, N=1, Q_v=0.42, best=0.42, ubc=1.25)
└── (a=32, N=1, Q_v=0.45, best=0.45, ubc=1.29)
├── (a=30, N=3, Q_v=0.47, best=0.53, ubc=1.18)
├── (a=3, N=1, Q_v=0.53, best=0.53, ubc=1.27)
└── (a=32, N=1, Q_v=0.36, best=0.36, ubc=1.10)
└── (a=32, N=3, Q_v=0.49, best=0.75, ubc=1.21)
    ├── (a=3, N=1, Q_v=0.13, best=0.13, ubc=0.87)
    └── (a=33, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=32, N=14, Q_v=0.41, best=0.65, ubc=0.82)
    ├── (a=3, N=2, Q_v=0.13, best=0.20, ubc=0.94)
    └── (a=33, N=1, Q_v=0.05, best=0.05, ubc=0.64)
    ├── (a=8, N=2, Q_v=0.46, best=0.47, ubc=1.28)
    └── (a=29, N=1, Q_v=0.47, best=0.47, ubc=1.06)
    ├── (a=15, N=3, Q_v=0.60, best=0.65, ubc=1.26)
    ├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
    └── (a=33, N=1, Q_v=0.60, best=0.60, ubc=1.34)
    ├── (a=23, N=2, Q_v=0.37, best=0.60, ubc=1.18)
    └── (a=8, N=1, Q_v=0.15, best=0.15, ubc=0.73)
    ├── (a=29, N=2, Q_v=0.48, best=0.55, ubc=1.29)
    └── (a=8, N=1, Q_v=0.42, best=0.42, ubc=1.01)
    └── (a=33, N=2, Q_v=0.42, best=0.60, ubc=1.23)
        └── (a=34, N=1, Q_v=0.24, best=0.24, ubc=0.82)
[16:54:05] INFO     selected action 15 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15]
(N=125, Q_v=0.55, best=0.82)
├── (a=3, N=19, Q_v=0.54, best=0.71, ubc=0.90)
├── (a=4, N=3, Q_v=0.56, best=0.56, ubc=1.26)
├── (a=5, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=16, N=1, Q_v=0.55, best=0.55, ubc=1.29)
├── (a=8, N=3, Q_v=0.55, best=0.71, ubc=1.25)
├── (a=4, N=1, Q_v=0.36, best=0.36, ubc=1.10)
└── (a=32, N=1, Q_v=0.58, best=0.58, ubc=1.32)
├── (a=16, N=4, Q_v=0.63, best=0.71, ubc=1.24)
├── (a=4, N=1, Q_v=0.62, best=0.62, ubc=1.45)
├── (a=8, N=1, Q_v=0.51, best=0.51, ubc=1.34)
└── (a=32, N=1, Q_v=0.69, best=0.69, ubc=1.52)
├── (a=23, N=3, Q_v=0.50, best=0.60, ubc=1.20)
├── (a=4, N=1, Q_v=0.60, best=0.60, ubc=1.34)
└── (a=32, N=1, Q_v=0.51, best=0.51, ubc=1.25)
├── (a=29, N=3, Q_v=0.61, best=0.62, ubc=1.31)
├── (a=4, N=1, Q_v=0.60, best=0.60, ubc=1.34)
└── (a=23, N=1, Q_v=0.60, best=0.60, ubc=1.34)
└── (a=32, N=2, Q_v=0.37, best=0.60, ubc=1.23)
    └── (a=4, N=1, Q_v=0.15, best=0.15, ubc=0.73)
├── (a=8, N=27, Q_v=0.60, best=0.82, ubc=0.90)
├── (a=3, N=5, Q_v=0.64, best=0.82, ubc=1.22)
├── (a=4, N=1, Q_v=0.55, best=0.55, ubc=1.44)
├── (a=9, N=1, Q_v=0.82, best=0.82, ubc=1.72)
├── (a=16, N=1, Q_v=0.60, best=0.60, ubc=1.50)
└── (a=23, N=1, Q_v=0.65, best=0.65, ubc=1.55)
├── (a=9, N=4, Q_v=0.55, best=0.75, ubc=1.19)
├── (a=3, N=1, Q_v=0.51, best=0.51, ubc=1.34)
├── (a=10, N=1, Q_v=0.42, best=0.42, ubc=1.25)
└── (a=16, N=1, Q_v=0.51, best=0.51, ubc=1.34)
├── (a=16, N=4, Q_v=0.55, best=0.65, ubc=1.19)
├── (a=3, N=1, Q_v=0.51, best=0.51, ubc=1.34)
├── (a=9, N=1, Q_v=0.56, best=0.56, ubc=1.40)
└── (a=23, N=1, Q_v=0.47, best=0.47, ubc=1.31)
├── (a=23, N=4, Q_v=0.58, best=0.60, ubc=1.22)
├── (a=3, N=1, Q_v=0.58, best=0.58, ubc=1.41)
├── (a=9, N=1, Q_v=0.56, best=0.56, ubc=1.40)
└── (a=29, N=1, Q_v=0.58, best=0.58, ubc=1.41)
├── (a=29, N=4, Q_v=0.63, best=0.69, ubc=1.27)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=9, N=1, Q_v=0.69, best=0.69, ubc=1.52)
└── (a=16, N=1, Q_v=0.62, best=0.62, ubc=1.45)
└── (a=32, N=5, Q_v=0.63, best=0.71, ubc=1.20)
    ├── (a=3, N=1, Q_v=0.58, best=0.58, ubc=1.48)
    ├── (a=9, N=1, Q_v=0.71, best=0.71, ubc=1.61)
    ├── (a=16, N=1, Q_v=0.60, best=0.60, ubc=1.50)
    └── (a=33, N=1, Q_v=0.58, best=0.58, ubc=1.48)
├── (a=16, N=22, Q_v=0.57, best=0.69, ubc=0.90)
├── (a=3, N=3, Q_v=0.56, best=0.62, ubc=1.28)
├── (a=4, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=8, N=1, Q_v=0.62, best=0.62, ubc=1.36)
├── (a=8, N=4, Q_v=0.59, best=0.69, ubc=1.21)
├── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.40)
├── (a=9, N=1, Q_v=0.49, best=0.49, ubc=1.32)
└── (a=23, N=1, Q_v=0.60, best=0.60, ubc=1.43)
├── (a=17, N=3, Q_v=0.55, best=0.65, ubc=1.27)
├── (a=3, N=1, Q_v=0.49, best=0.49, ubc=1.23)
└── (a=8, N=1, Q_v=0.51, best=0.51, ubc=1.25)
├── (a=23, N=4, Q_v=0.58, best=0.65, ubc=1.20)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=8, N=1, Q_v=0.42, best=0.42, ubc=1.25)
└── (a=29, N=1, Q_v=0.60, best=0.60, ubc=1.43)
├── (a=29, N=3, Q_v=0.47, best=0.56, ubc=1.19)
├── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=30, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=32, N=4, Q_v=0.63, best=0.65, ubc=1.25)
    ├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.43)
    ├── (a=8, N=1, Q_v=0.60, best=0.60, ubc=1.43)
    └── (a=17, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=23, N=21, Q_v=0.56, best=0.71, ubc=0.90)
├── (a=3, N=3, Q_v=0.44, best=0.55, ubc=1.15)
├── (a=4, N=1, Q_v=0.31, best=0.31, ubc=1.05)
└── (a=8, N=1, Q_v=0.45, best=0.45, ubc=1.20)
├── (a=8, N=3, Q_v=0.59, best=0.65, ubc=1.31)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=32, N=1, Q_v=0.53, best=0.53, ubc=1.27)
├── (a=16, N=4, Q_v=0.64, best=0.71, ubc=1.25)
├── (a=3, N=1, Q_v=0.71, best=0.71, ubc=1.54)
├── (a=8, N=1, Q_v=0.64, best=0.64, ubc=1.47)
└── (a=17, N=1, Q_v=0.60, best=0.60, ubc=1.43)
├── (a=24, N=4, Q_v=0.55, best=0.62, ubc=1.17)
├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.43)
├── (a=8, N=1, Q_v=0.40, best=0.40, ubc=1.23)
└── (a=16, N=1, Q_v=0.62, best=0.62, ubc=1.45)
├── (a=29, N=3, Q_v=0.58, best=0.60, ubc=1.29)
├── (a=3, N=1, Q_v=0.55, best=0.55, ubc=1.29)
└── (a=30, N=1, Q_v=0.60, best=0.60, ubc=1.34)
└── (a=32, N=3, Q_v=0.52, best=0.60, ubc=1.23)
    ├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.34)
    └── (a=8, N=1, Q_v=0.35, best=0.35, ubc=1.09)
├── (a=29, N=19, Q_v=0.52, best=0.76, ubc=0.88)
├── (a=3, N=1, Q_v=-0.11, best=-0.11, ubc=1.10)
├── (a=8, N=3, Q_v=0.59, best=0.73, ubc=1.29)
├── (a=3, N=1, Q_v=0.73, best=0.73, ubc=1.47)
└── (a=23, N=1, Q_v=0.47, best=0.47, ubc=1.21)
├── (a=16, N=3, Q_v=0.59, best=0.65, ubc=1.29)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=30, N=1, Q_v=0.56, best=0.56, ubc=1.30)
├── (a=23, N=3, Q_v=0.52, best=0.60, ubc=1.22)
├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.34)
└── (a=8, N=1, Q_v=0.35, best=0.35, ubc=1.09)
├── (a=30, N=3, Q_v=0.33, best=0.53, ubc=1.03)
├── (a=3, N=1, Q_v=0.09, best=0.09, ubc=0.83)
└── (a=8, N=1, Q_v=0.36, best=0.36, ubc=1.10)
└── (a=32, N=5, Q_v=0.69, best=0.76, ubc=1.24)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=8, N=1, Q_v=0.76, best=0.76, ubc=1.66)
    ├── (a=16, N=1, Q_v=0.76, best=0.76, ubc=1.66)
    └── (a=23, N=1, Q_v=0.60, best=0.60, ubc=1.50)
└── (a=32, N=16, Q_v=0.50, best=0.65, ubc=0.89)
    ├── (a=3, N=3, Q_v=0.58, best=0.60, ubc=1.26)
    ├── (a=4, N=1, Q_v=0.53, best=0.53, ubc=1.27)
    └── (a=33, N=1, Q_v=0.60, best=0.60, ubc=1.34)
    ├── (a=8, N=3, Q_v=0.50, best=0.56, ubc=1.18)
    ├── (a=3, N=1, Q_v=0.42, best=0.42, ubc=1.16)
    └── (a=9, N=1, Q_v=0.53, best=0.53, ubc=1.27)
    ├── (a=16, N=2, Q_v=0.37, best=0.53, ubc=1.21)
    └── (a=3, N=1, Q_v=0.53, best=0.53, ubc=1.12)
    ├── (a=23, N=2, Q_v=0.51, best=0.60, ubc=1.34)
    └── (a=3, N=1, Q_v=0.42, best=0.42, ubc=1.01)
    ├── (a=29, N=3, Q_v=0.55, best=0.65, ubc=1.23)
    ├── (a=3, N=1, Q_v=0.38, best=0.38, ubc=1.12)
    └── (a=33, N=1, Q_v=0.60, best=0.60, ubc=1.34)
    └── (a=33, N=2, Q_v=0.41, best=0.60, ubc=1.24)
        └── (a=16, N=1, Q_v=0.22, best=0.22, ubc=0.81)
[16:54:07] INFO     selected action 8 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8]
(N=125, Q_v=0.53, best=0.76)
├── (a=3, N=18, Q_v=0.51, best=0.65, ubc=0.87)
├── (a=4, N=3, Q_v=0.52, best=0.56, ubc=1.21)
├── (a=5, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=9, N=1, Q_v=0.42, best=0.42, ubc=1.16)
├── (a=9, N=3, Q_v=0.48, best=0.56, ubc=1.18)
├── (a=4, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=10, N=1, Q_v=0.49, best=0.49, ubc=1.23)
├── (a=16, N=3, Q_v=0.55, best=0.65, ubc=1.24)
├── (a=4, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=29, N=1, Q_v=0.49, best=0.49, ubc=1.23)
├── (a=23, N=2, Q_v=0.45, best=0.58, ubc=1.30)
└── (a=9, N=1, Q_v=0.33, best=0.33, ubc=0.92)
├── (a=29, N=3, Q_v=0.48, best=0.60, ubc=1.17)
├── (a=4, N=1, Q_v=0.38, best=0.38, ubc=1.12)
└── (a=30, N=1, Q_v=0.60, best=0.60, ubc=1.34)
└── (a=32, N=3, Q_v=0.52, best=0.60, ubc=1.22)
    ├── (a=4, N=1, Q_v=0.56, best=0.56, ubc=1.30)
    └── (a=23, N=1, Q_v=0.40, best=0.40, ubc=1.14)
├── (a=9, N=20, Q_v=0.52, best=0.65, ubc=0.87)
├── (a=3, N=2, Q_v=0.38, best=0.38, ubc=1.25)
└── (a=10, N=1, Q_v=0.38, best=0.38, ubc=0.97)
├── (a=10, N=3, Q_v=0.45, best=0.62, ubc=1.15)
├── (a=3, N=1, Q_v=0.45, best=0.45, ubc=1.20)
└── (a=32, N=1, Q_v=0.62, best=0.62, ubc=1.36)
├── (a=16, N=4, Q_v=0.59, best=0.65, ubc=1.20)
├── (a=3, N=1, Q_v=0.58, best=0.58, ubc=1.41)
├── (a=10, N=1, Q_v=0.62, best=0.62, ubc=1.45)
└── (a=17, N=1, Q_v=0.49, best=0.49, ubc=1.32)
├── (a=23, N=3, Q_v=0.56, best=0.65, ubc=1.27)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=10, N=1, Q_v=0.42, best=0.42, ubc=1.16)
├── (a=29, N=3, Q_v=0.49, best=0.62, ubc=1.20)
├── (a=3, N=1, Q_v=0.62, best=0.62, ubc=1.36)
└── (a=30, N=1, Q_v=0.35, best=0.35, ubc=1.09)
└── (a=32, N=4, Q_v=0.55, best=0.64, ubc=1.16)
    ├── (a=3, N=1, Q_v=0.53, best=0.53, ubc=1.36)
    ├── (a=10, N=1, Q_v=0.45, best=0.45, ubc=1.29)
    └── (a=29, N=1, Q_v=0.56, best=0.56, ubc=1.40)
├── (a=16, N=27, Q_v=0.57, best=0.76, ubc=0.87)
├── (a=3, N=5, Q_v=0.58, best=0.71, ubc=1.16)
├── (a=4, N=1, Q_v=0.45, best=0.45, ubc=1.35)
├── (a=9, N=1, Q_v=0.71, best=0.71, ubc=1.61)
├── (a=17, N=1, Q_v=0.53, best=0.53, ubc=1.42)
└── (a=32, N=1, Q_v=0.56, best=0.56, ubc=1.46)
├── (a=9, N=4, Q_v=0.57, best=0.75, ubc=1.21)
├── (a=3, N=1, Q_v=0.53, best=0.53, ubc=1.36)
├── (a=10, N=1, Q_v=0.51, best=0.51, ubc=1.34)
└── (a=17, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=17, N=3, Q_v=0.42, best=0.51, ubc=1.16)
├── (a=3, N=1, Q_v=0.51, best=0.51, ubc=1.25)
└── (a=29, N=1, Q_v=0.49, best=0.49, ubc=1.23)
├── (a=23, N=4, Q_v=0.54, best=0.60, ubc=1.18)
├── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.40)
├── (a=9, N=1, Q_v=0.51, best=0.51, ubc=1.34)
└── (a=29, N=1, Q_v=0.60, best=0.60, ubc=1.43)
├── (a=29, N=5, Q_v=0.64, best=0.73, ubc=1.21)
├── (a=3, N=1, Q_v=0.55, best=0.55, ubc=1.44)
├── (a=9, N=1, Q_v=0.60, best=0.60, ubc=1.50)
├── (a=17, N=1, Q_v=0.73, best=0.73, ubc=1.62)
└── (a=23, N=1, Q_v=0.71, best=0.71, ubc=1.61)
└── (a=32, N=5, Q_v=0.59, best=0.76, ubc=1.17)
    ├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.50)
    ├── (a=9, N=1, Q_v=0.49, best=0.49, ubc=1.39)
    ├── (a=17, N=1, Q_v=0.76, best=0.76, ubc=1.66)
    └── (a=23, N=1, Q_v=0.51, best=0.51, ubc=1.41)
├── (a=23, N=18, Q_v=0.50, best=0.65, ubc=0.87)
├── (a=3, N=3, Q_v=0.47, best=0.60, ubc=1.16)
├── (a=4, N=1, Q_v=0.29, best=0.29, ubc=1.03)
└── (a=24, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=9, N=3, Q_v=0.42, best=0.65, ubc=1.12)
├── (a=3, N=1, Q_v=0.35, best=0.35, ubc=1.09)
└── (a=10, N=1, Q_v=0.27, best=0.27, ubc=1.01)
├── (a=16, N=3, Q_v=0.56, best=0.60, ubc=1.25)
├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.34)
└── (a=9, N=1, Q_v=0.47, best=0.47, ubc=1.21)
├── (a=24, N=2, Q_v=0.44, best=0.45, ubc=1.29)
└── (a=3, N=1, Q_v=0.42, best=0.42, ubc=1.01)
├── (a=29, N=3, Q_v=0.59, best=0.65, ubc=1.29)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=16, N=1, Q_v=0.62, best=0.62, ubc=1.36)
└── (a=32, N=3, Q_v=0.61, best=0.62, ubc=1.31)
    ├── (a=3, N=1, Q_v=0.62, best=0.62, ubc=1.36)
    └── (a=33, N=1, Q_v=0.62, best=0.62, ubc=1.36)
├── (a=29, N=20, Q_v=0.53, best=0.76, ubc=0.87)
├── (a=3, N=3, Q_v=0.56, best=0.76, ubc=1.26)
├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.50)
└── (a=32, N=1, Q_v=0.36, best=0.36, ubc=1.10)
├── (a=9, N=3, Q_v=0.46, best=0.53, ubc=1.17)
├── (a=3, N=1, Q_v=0.51, best=0.51, ubc=1.25)
└── (a=10, N=1, Q_v=0.35, best=0.35, ubc=1.09)
├── (a=16, N=4, Q_v=0.63, best=0.69, ubc=1.24)
├── (a=3, N=1, Q_v=0.69, best=0.69, ubc=1.52)
├── (a=9, N=1, Q_v=0.60, best=0.60, ubc=1.43)
└── (a=17, N=1, Q_v=0.58, best=0.58, ubc=1.41)
├── (a=23, N=3, Q_v=0.48, best=0.60, ubc=1.19)
├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.34)
└── (a=9, N=1, Q_v=0.35, best=0.35, ubc=1.09)
├── (a=30, N=3, Q_v=0.57, best=0.76, ubc=1.28)
├── (a=3, N=1, Q_v=0.47, best=0.47, ubc=1.21)
└── (a=9, N=1, Q_v=0.47, best=0.47, ubc=1.21)
└── (a=32, N=3, Q_v=0.41, best=0.49, ubc=1.11)
    ├── (a=3, N=1, Q_v=0.24, best=0.24, ubc=0.98)
    └── (a=16, N=1, Q_v=0.49, best=0.49, ubc=1.23)
└── (a=32, N=21, Q_v=0.52, best=0.71, ubc=0.86)
    ├── (a=3, N=4, Q_v=0.49, best=0.62, ubc=1.11)
    ├── (a=4, N=1, Q_v=0.60, best=0.60, ubc=1.43)
    ├── (a=9, N=1, Q_v=0.27, best=0.27, ubc=1.11)
    └── (a=29, N=1, Q_v=0.47, best=0.47, ubc=1.31)
    ├── (a=9, N=3, Q_v=0.53, best=0.56, ubc=1.25)
    ├── (a=3, N=1, Q_v=0.49, best=0.49, ubc=1.23)
    └── (a=33, N=1, Q_v=0.55, best=0.55, ubc=1.29)
    ├── (a=16, N=4, Q_v=0.61, best=0.71, ubc=1.23)
    ├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.43)
    ├── (a=9, N=1, Q_v=0.71, best=0.71, ubc=1.54)
    └── (a=33, N=1, Q_v=0.65, best=0.65, ubc=1.49)
    ├── (a=23, N=3, Q_v=0.53, best=0.60, ubc=1.24)
    ├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.34)
    └── (a=9, N=1, Q_v=0.40, best=0.40, ubc=1.14)
    ├── (a=29, N=3, Q_v=0.42, best=0.65, ubc=1.13)
    ├── (a=3, N=1, Q_v=0.40, best=0.40, ubc=1.14)
    └── (a=30, N=1, Q_v=0.20, best=0.20, ubc=0.94)
    └── (a=33, N=3, Q_v=0.51, best=0.60, ubc=1.22)
        ├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.34)
        └── (a=23, N=1, Q_v=0.53, best=0.53, ubc=1.27)
[16:54:10] INFO     selected action 16 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16]
(N=125, Q_v=0.58, best=0.80)
├── (a=3, N=20, Q_v=0.57, best=0.76, ubc=0.92)
├── (a=4, N=3, Q_v=0.52, best=0.60, ubc=1.23)
├── (a=5, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=23, N=1, Q_v=0.40, best=0.40, ubc=1.14)
├── (a=9, N=4, Q_v=0.58, best=0.62, ubc=1.19)
├── (a=4, N=1, Q_v=0.55, best=0.55, ubc=1.38)
├── (a=10, N=1, Q_v=0.62, best=0.62, ubc=1.45)
└── (a=17, N=1, Q_v=0.56, best=0.56, ubc=1.40)
├── (a=17, N=3, Q_v=0.58, best=0.60, ubc=1.29)
├── (a=4, N=1, Q_v=0.55, best=0.55, ubc=1.29)
└── (a=23, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=23, N=3, Q_v=0.56, best=0.58, ubc=1.27)
├── (a=4, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=24, N=1, Q_v=0.58, best=0.58, ubc=1.32)
├── (a=29, N=3, Q_v=0.56, best=0.60, ubc=1.27)
├── (a=4, N=1, Q_v=0.53, best=0.53, ubc=1.27)
└── (a=32, N=1, Q_v=0.60, best=0.60, ubc=1.34)
└── (a=32, N=3, Q_v=0.59, best=0.76, ubc=1.29)
    ├── (a=4, N=1, Q_v=0.38, best=0.38, ubc=1.12)
    └── (a=9, N=1, Q_v=0.76, best=0.76, ubc=1.50)
├── (a=9, N=16, Q_v=0.52, best=0.75, ubc=0.91)
├── (a=3, N=3, Q_v=0.47, best=0.53, ubc=1.15)
├── (a=4, N=1, Q_v=0.38, best=0.38, ubc=1.12)
└── (a=32, N=1, Q_v=0.53, best=0.53, ubc=1.27)
├── (a=10, N=2, Q_v=0.50, best=0.51, ubc=1.33)
└── (a=32, N=1, Q_v=0.49, best=0.49, ubc=1.08)
├── (a=17, N=2, Q_v=0.51, best=0.62, ubc=1.34)
└── (a=10, N=1, Q_v=0.40, best=0.40, ubc=0.99)
├── (a=23, N=3, Q_v=0.57, best=0.62, ubc=1.25)
├── (a=3, N=1, Q_v=0.62, best=0.62, ubc=1.36)
└── (a=10, N=1, Q_v=0.47, best=0.47, ubc=1.21)
├── (a=29, N=2, Q_v=0.40, best=0.45, ubc=1.23)
└── (a=3, N=1, Q_v=0.45, best=0.45, ubc=1.04)
└── (a=32, N=3, Q_v=0.67, best=0.75, ubc=1.35)
    ├── (a=3, N=1, Q_v=0.69, best=0.69, ubc=1.43)
    └── (a=10, N=1, Q_v=0.56, best=0.56, ubc=1.30)
├── (a=17, N=20, Q_v=0.56, best=0.67, ubc=0.91)
├── (a=3, N=3, Q_v=0.53, best=0.67, ubc=1.24)
├── (a=4, N=1, Q_v=0.67, best=0.67, ubc=1.41)
└── (a=23, N=1, Q_v=0.53, best=0.53, ubc=1.27)
├── (a=9, N=4, Q_v=0.57, best=0.67, ubc=1.18)
├── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.40)
├── (a=10, N=1, Q_v=0.67, best=0.67, ubc=1.51)
└── (a=18, N=1, Q_v=0.47, best=0.47, ubc=1.31)
├── (a=18, N=3, Q_v=0.57, best=0.62, ubc=1.28)
├── (a=3, N=1, Q_v=0.62, best=0.62, ubc=1.36)
└── (a=23, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=23, N=3, Q_v=0.58, best=0.60, ubc=1.29)
├── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=24, N=1, Q_v=0.58, best=0.58, ubc=1.32)
├── (a=29, N=3, Q_v=0.58, best=0.65, ubc=1.28)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=30, N=1, Q_v=0.51, best=0.51, ubc=1.25)
└── (a=32, N=3, Q_v=0.52, best=0.56, ubc=1.23)
    ├── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.30)
    └── (a=9, N=1, Q_v=0.51, best=0.51, ubc=1.25)
├── (a=23, N=20, Q_v=0.57, best=0.67, ubc=0.92)
├── (a=3, N=3, Q_v=0.55, best=0.58, ubc=1.26)
├── (a=4, N=1, Q_v=0.51, best=0.51, ubc=1.25)
└── (a=17, N=1, Q_v=0.56, best=0.56, ubc=1.30)
├── (a=9, N=3, Q_v=0.46, best=0.62, ubc=1.17)
├── (a=3, N=1, Q_v=0.29, best=0.29, ubc=1.03)
└── (a=10, N=1, Q_v=0.62, best=0.62, ubc=1.36)
├── (a=17, N=3, Q_v=0.56, best=0.60, ubc=1.27)
├── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=29, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=24, N=3, Q_v=0.59, best=0.60, ubc=1.30)
├── (a=3, N=1, Q_v=0.58, best=0.58, ubc=1.32)
└── (a=29, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=29, N=3, Q_v=0.62, best=0.67, ubc=1.32)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=30, N=1, Q_v=0.67, best=0.67, ubc=1.41)
└── (a=32, N=4, Q_v=0.62, best=0.65, ubc=1.23)
    ├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.43)
    ├── (a=9, N=1, Q_v=0.56, best=0.56, ubc=1.40)
    └── (a=29, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=29, N=23, Q_v=0.59, best=0.76, ubc=0.92)
├── (a=3, N=4, Q_v=0.60, best=0.62, ubc=1.23)
├── (a=4, N=1, Q_v=0.58, best=0.58, ubc=1.41)
├── (a=9, N=1, Q_v=0.62, best=0.62, ubc=1.45)
└── (a=23, N=1, Q_v=0.60, best=0.60, ubc=1.43)
├── (a=9, N=3, Q_v=0.55, best=0.71, ubc=1.27)
├── (a=3, N=1, Q_v=0.45, best=0.45, ubc=1.20)
└── (a=10, N=1, Q_v=0.47, best=0.47, ubc=1.21)
├── (a=17, N=4, Q_v=0.65, best=0.73, ubc=1.28)
├── (a=3, N=1, Q_v=0.71, best=0.71, ubc=1.54)
├── (a=9, N=1, Q_v=0.73, best=0.73, ubc=1.56)
└── (a=30, N=1, Q_v=0.53, best=0.53, ubc=1.36)
├── (a=23, N=3, Q_v=0.51, best=0.60, ubc=1.23)
├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.34)
└── (a=32, N=1, Q_v=0.45, best=0.45, ubc=1.20)
├── (a=30, N=3, Q_v=0.52, best=0.60, ubc=1.24)
├── (a=3, N=1, Q_v=0.51, best=0.51, ubc=1.25)
└── (a=9, N=1, Q_v=0.45, best=0.45, ubc=1.20)
└── (a=32, N=5, Q_v=0.68, best=0.76, ubc=1.24)
    ├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.50)
    ├── (a=9, N=1, Q_v=0.65, best=0.65, ubc=1.55)
    ├── (a=17, N=1, Q_v=0.65, best=0.65, ubc=1.55)
    └── (a=30, N=1, Q_v=0.76, best=0.76, ubc=1.66)
└── (a=32, N=25, Q_v=0.61, best=0.80, ubc=0.92)
    ├── (a=3, N=3, Q_v=0.49, best=0.51, ubc=1.22)
    ├── (a=4, N=1, Q_v=0.47, best=0.47, ubc=1.21)
    └── (a=17, N=1, Q_v=0.49, best=0.49, ubc=1.23)
    ├── (a=9, N=5, Q_v=0.67, best=0.75, ubc=1.24)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=10, N=1, Q_v=0.51, best=0.51, ubc=1.41)
    ├── (a=17, N=1, Q_v=0.60, best=0.60, ubc=1.50)
    └── (a=33, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=17, N=4, Q_v=0.58, best=0.75, ubc=1.21)
    ├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.49)
    ├── (a=9, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    └── (a=18, N=1, Q_v=0.49, best=0.49, ubc=1.32)
    ├── (a=23, N=4, Q_v=0.63, best=0.80, ubc=1.26)
    ├── (a=3, N=1, Q_v=0.45, best=0.45, ubc=1.29)
    ├── (a=9, N=1, Q_v=0.80, best=0.80, ubc=1.63)
    └── (a=17, N=1, Q_v=0.60, best=0.60, ubc=1.43)
    ├── (a=29, N=4, Q_v=0.57, best=0.71, ubc=1.21)
    ├── (a=3, N=1, Q_v=0.40, best=0.40, ubc=1.23)
    ├── (a=9, N=1, Q_v=0.53, best=0.53, ubc=1.36)
    └── (a=17, N=1, Q_v=0.71, best=0.71, ubc=1.54)
    └── (a=33, N=4, Q_v=0.66, best=0.75, ubc=1.30)
        ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
        ├── (a=9, N=1, Q_v=0.60, best=0.60, ubc=1.43)
        └── (a=23, N=1, Q_v=0.65, best=0.65, ubc=1.49)
[16:54:12] INFO     selected action 32 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16, 32]
(N=125, Q_v=0.59, best=0.76)
├── (a=3, N=20, Q_v=0.59, best=0.76, ubc=0.93)
├── (a=4, N=3, Q_v=0.52, best=0.60, ubc=1.23)
├── (a=5, N=1, Q_v=0.40, best=0.40, ubc=1.14)
└── (a=29, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=9, N=3, Q_v=0.56, best=0.62, ubc=1.26)
├── (a=4, N=1, Q_v=0.60, best=0.60, ubc=1.34)
└── (a=29, N=1, Q_v=0.62, best=0.62, ubc=1.36)
├── (a=17, N=3, Q_v=0.59, best=0.62, ubc=1.29)
├── (a=4, N=1, Q_v=0.58, best=0.58, ubc=1.32)
└── (a=9, N=1, Q_v=0.62, best=0.62, ubc=1.36)
├── (a=23, N=3, Q_v=0.58, best=0.60, ubc=1.28)
├── (a=4, N=1, Q_v=0.53, best=0.53, ubc=1.27)
└── (a=33, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=29, N=3, Q_v=0.58, best=0.76, ubc=1.28)
├── (a=4, N=1, Q_v=0.36, best=0.36, ubc=1.10)
└── (a=30, N=1, Q_v=0.60, best=0.60, ubc=1.34)
└── (a=33, N=4, Q_v=0.66, best=0.76, ubc=1.28)
    ├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.60)
    ├── (a=9, N=1, Q_v=0.71, best=0.71, ubc=1.54)
    └── (a=17, N=1, Q_v=0.49, best=0.49, ubc=1.32)
├── (a=9, N=22, Q_v=0.61, best=0.76, ubc=0.94)
├── (a=3, N=3, Q_v=0.53, best=0.76, ubc=1.24)
├── (a=4, N=1, Q_v=0.47, best=0.47, ubc=1.21)
└── (a=10, N=1, Q_v=0.35, best=0.35, ubc=1.09)
├── (a=10, N=3, Q_v=0.61, best=0.71, ubc=1.33)
├── (a=3, N=1, Q_v=0.71, best=0.71, ubc=1.45)
└── (a=33, N=1, Q_v=0.51, best=0.51, ubc=1.25)
├── (a=17, N=3, Q_v=0.55, best=0.56, ubc=1.27)
├── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=29, N=1, Q_v=0.56, best=0.56, ubc=1.30)
├── (a=23, N=4, Q_v=0.64, best=0.71, ubc=1.26)
├── (a=3, N=1, Q_v=0.64, best=0.64, ubc=1.47)
├── (a=10, N=1, Q_v=0.62, best=0.62, ubc=1.45)
└── (a=17, N=1, Q_v=0.71, best=0.71, ubc=1.54)
├── (a=29, N=4, Q_v=0.64, best=0.71, ubc=1.26)
├── (a=3, N=1, Q_v=0.62, best=0.62, ubc=1.45)
├── (a=10, N=1, Q_v=0.56, best=0.56, ubc=1.40)
└── (a=17, N=1, Q_v=0.65, best=0.65, ubc=1.49)
└── (a=33, N=4, Q_v=0.65, best=0.76, ubc=1.28)
    ├── (a=3, N=1, Q_v=0.58, best=0.58, ubc=1.41)
    ├── (a=10, N=1, Q_v=0.76, best=0.76, ubc=1.60)
    └── (a=17, N=1, Q_v=0.62, best=0.62, ubc=1.45)
├── (a=17, N=20, Q_v=0.58, best=0.76, ubc=0.93)
├── (a=3, N=3, Q_v=0.52, best=0.56, ubc=1.22)
├── (a=4, N=1, Q_v=0.51, best=0.51, ubc=1.25)
└── (a=29, N=1, Q_v=0.47, best=0.47, ubc=1.21)
├── (a=9, N=4, Q_v=0.67, best=0.71, ubc=1.28)
├── (a=3, N=1, Q_v=0.71, best=0.71, ubc=1.54)
├── (a=10, N=1, Q_v=0.71, best=0.71, ubc=1.54)
└── (a=18, N=1, Q_v=0.62, best=0.62, ubc=1.45)
├── (a=18, N=3, Q_v=0.52, best=0.56, ubc=1.22)
├── (a=3, N=1, Q_v=0.49, best=0.49, ubc=1.23)
└── (a=9, N=1, Q_v=0.49, best=0.49, ubc=1.23)
├── (a=23, N=3, Q_v=0.57, best=0.65, ubc=1.28)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=24, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=29, N=3, Q_v=0.53, best=0.56, ubc=1.23)
├── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=18, N=1, Q_v=0.49, best=0.49, ubc=1.23)
└── (a=33, N=3, Q_v=0.65, best=0.76, ubc=1.35)
    ├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
    └── (a=9, N=1, Q_v=0.53, best=0.53, ubc=1.27)
├── (a=23, N=18, Q_v=0.55, best=0.71, ubc=0.92)
├── (a=3, N=3, Q_v=0.53, best=0.71, ubc=1.22)
├── (a=4, N=1, Q_v=0.71, best=0.71, ubc=1.45)
└── (a=9, N=1, Q_v=0.40, best=0.40, ubc=1.14)
├── (a=9, N=2, Q_v=0.44, best=0.53, ubc=1.29)
└── (a=10, N=1, Q_v=0.35, best=0.35, ubc=0.93)
├── (a=17, N=3, Q_v=0.48, best=0.60, ubc=1.18)
├── (a=3, N=1, Q_v=0.40, best=0.40, ubc=1.14)
└── (a=29, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=24, N=3, Q_v=0.60, best=0.60, ubc=1.29)
├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.34)
└── (a=17, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=29, N=3, Q_v=0.59, best=0.65, ubc=1.29)
├── (a=3, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=9, N=1, Q_v=0.56, best=0.56, ubc=1.30)
└── (a=33, N=3, Q_v=0.62, best=0.64, ubc=1.31)
    ├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.34)
    └── (a=24, N=1, Q_v=0.64, best=0.64, ubc=1.38)
├── (a=29, N=15, Q_v=0.53, best=0.75, ubc=0.94)
├── (a=3, N=2, Q_v=0.50, best=0.60, ubc=1.32)
└── (a=23, N=1, Q_v=0.40, best=0.40, ubc=0.99)
├── (a=9, N=2, Q_v=0.45, best=0.51, ubc=1.28)
└── (a=30, N=1, Q_v=0.40, best=0.40, ubc=0.99)
├── (a=17, N=3, Q_v=0.62, best=0.75, ubc=1.29)
├── (a=3, N=1, Q_v=0.49, best=0.49, ubc=1.23)
└── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=23, N=2, Q_v=0.53, best=0.60, ubc=1.35)
└── (a=33, N=1, Q_v=0.60, best=0.60, ubc=1.19)
├── (a=30, N=3, Q_v=0.54, best=0.60, ubc=1.21)
├── (a=3, N=1, Q_v=0.49, best=0.49, ubc=1.23)
└── (a=23, N=1, Q_v=0.60, best=0.60, ubc=1.34)
└── (a=33, N=2, Q_v=0.49, best=0.65, ubc=1.31)
    └── (a=34, N=1, Q_v=0.33, best=0.33, ubc=0.92)
└── (a=33, N=29, Q_v=0.65, best=0.76, ubc=0.93)
    ├── (a=3, N=6, Q_v=0.72, best=0.76, ubc=1.25)
    ├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    ├── (a=9, N=1, Q_v=0.64, best=0.64, ubc=1.58)
    ├── (a=17, N=1, Q_v=0.65, best=0.65, ubc=1.60)
    ├── (a=23, N=1, Q_v=0.76, best=0.76, ubc=1.71)
    └── (a=29, N=1, Q_v=0.76, best=0.76, ubc=1.71)
    ├── (a=9, N=5, Q_v=0.70, best=0.76, ubc=1.28)
    ├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.66)
    ├── (a=10, N=1, Q_v=0.62, best=0.62, ubc=1.52)
    ├── (a=17, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=23, N=1, Q_v=0.62, best=0.62, ubc=1.52)
    ├── (a=17, N=4, Q_v=0.59, best=0.76, ubc=1.24)
    ├── (a=3, N=1, Q_v=0.49, best=0.49, ubc=1.32)
    ├── (a=9, N=1, Q_v=0.76, best=0.76, ubc=1.60)
    └── (a=18, N=1, Q_v=0.49, best=0.49, ubc=1.32)
    ├── (a=23, N=5, Q_v=0.63, best=0.65, ubc=1.21)
    ├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.50)
    ├── (a=9, N=1, Q_v=0.65, best=0.65, ubc=1.55)
    ├── (a=17, N=1, Q_v=0.60, best=0.60, ubc=1.50)
    └── (a=29, N=1, Q_v=0.65, best=0.65, ubc=1.55)
    ├── (a=29, N=3, Q_v=0.42, best=0.60, ubc=1.17)
    ├── (a=3, N=1, Q_v=0.33, best=0.33, ubc=1.07)
    └── (a=34, N=1, Q_v=0.33, best=0.33, ubc=1.07)
    └── (a=34, N=5, Q_v=0.68, best=0.76, ubc=1.26)
        ├── (a=3, N=1, Q_v=0.38, best=0.38, ubc=1.28)
        ├── (a=9, N=1, Q_v=0.76, best=0.76, ubc=1.66)
        ├── (a=17, N=1, Q_v=0.75, best=0.75, ubc=1.64)
        └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
[16:54:14] INFO     selected action 33 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16, 32, 33]
(N=125, Q_v=0.63, best=0.80)
├── (a=3, N=17, Q_v=0.58, best=0.76, ubc=0.96)
├── (a=4, N=3, Q_v=0.53, best=0.65, ubc=1.22)
├── (a=5, N=1, Q_v=0.35, best=0.35, ubc=1.09)
└── (a=34, N=1, Q_v=0.65, best=0.65, ubc=1.40)
├── (a=9, N=2, Q_v=0.63, best=0.65, ubc=1.47)
└── (a=29, N=1, Q_v=0.65, best=0.65, ubc=1.24)
├── (a=17, N=3, Q_v=0.67, best=0.75, ubc=1.35)
├── (a=4, N=1, Q_v=0.60, best=0.60, ubc=1.34)
└── (a=9, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=23, N=2, Q_v=0.53, best=0.65, ubc=1.37)
└── (a=24, N=1, Q_v=0.65, best=0.65, ubc=1.24)
├── (a=29, N=3, Q_v=0.64, best=0.76, ubc=1.32)
├── (a=4, N=1, Q_v=0.49, best=0.49, ubc=1.23)
└── (a=9, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=34, N=3, Q_v=0.59, best=0.76, ubc=1.28)
    ├── (a=4, N=1, Q_v=0.25, best=0.25, ubc=1.00)
    └── (a=9, N=1, Q_v=0.76, best=0.76, ubc=1.50)
├── (a=9, N=24, Q_v=0.66, best=0.80, ubc=0.98)
├── (a=3, N=4, Q_v=0.65, best=0.80, ubc=1.28)
├── (a=4, N=1, Q_v=0.71, best=0.71, ubc=1.54)
├── (a=10, N=1, Q_v=0.40, best=0.40, ubc=1.23)
└── (a=34, N=1, Q_v=0.80, best=0.80, ubc=1.63)
├── (a=10, N=3, Q_v=0.56, best=0.75, ubc=1.29)
├── (a=3, N=1, Q_v=0.40, best=0.40, ubc=1.14)
└── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=17, N=3, Q_v=0.60, best=0.65, ubc=1.33)
├── (a=3, N=1, Q_v=0.62, best=0.62, ubc=1.36)
└── (a=10, N=1, Q_v=0.53, best=0.53, ubc=1.27)
├── (a=23, N=4, Q_v=0.66, best=0.75, ubc=1.29)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=10, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=17, N=1, Q_v=0.53, best=0.53, ubc=1.36)
├── (a=29, N=4, Q_v=0.71, best=0.71, ubc=1.34)
├── (a=3, N=1, Q_v=0.71, best=0.71, ubc=1.54)
├── (a=10, N=1, Q_v=0.71, best=0.71, ubc=1.54)
└── (a=30, N=1, Q_v=0.71, best=0.71, ubc=1.54)
└── (a=34, N=5, Q_v=0.73, best=0.76, ubc=1.29)
    ├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.66)
    ├── (a=10, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=17, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=23, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=17, N=20, Q_v=0.63, best=0.76, ubc=0.98)
├── (a=3, N=3, Q_v=0.62, best=0.76, ubc=1.32)
├── (a=4, N=1, Q_v=0.49, best=0.49, ubc=1.23)
└── (a=29, N=1, Q_v=0.76, best=0.76, ubc=1.50)
├── (a=9, N=4, Q_v=0.70, best=0.75, ubc=1.31)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=10, N=1, Q_v=0.65, best=0.65, ubc=1.49)
└── (a=18, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=18, N=3, Q_v=0.58, best=0.65, ubc=1.29)
├── (a=3, N=1, Q_v=0.49, best=0.49, ubc=1.23)
└── (a=23, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=23, N=3, Q_v=0.67, best=0.75, ubc=1.37)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=29, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=29, N=3, Q_v=0.67, best=0.76, ubc=1.38)
├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.50)
└── (a=23, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=34, N=3, Q_v=0.58, best=0.76, ubc=1.29)
    ├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.34)
    └── (a=29, N=1, Q_v=0.38, best=0.38, ubc=1.12)
├── (a=23, N=24, Q_v=0.66, best=0.76, ubc=0.97)
├── (a=3, N=3, Q_v=0.62, best=0.65, ubc=1.35)
├── (a=4, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=29, N=1, Q_v=0.60, best=0.60, ubc=1.34)
├── (a=9, N=4, Q_v=0.65, best=0.76, ubc=1.28)
├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=10, N=1, Q_v=0.53, best=0.53, ubc=1.36)
└── (a=29, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=17, N=4, Q_v=0.70, best=0.75, ubc=1.33)
├── (a=3, N=1, Q_v=0.64, best=0.64, ubc=1.47)
├── (a=9, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=18, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=24, N=4, Q_v=0.64, best=0.65, ubc=1.27)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=9, N=1, Q_v=0.60, best=0.60, ubc=1.43)
└── (a=29, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=29, N=4, Q_v=0.65, best=0.65, ubc=1.28)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=9, N=1, Q_v=0.62, best=0.62, ubc=1.45)
└── (a=30, N=1, Q_v=0.65, best=0.65, ubc=1.49)
└── (a=34, N=4, Q_v=0.68, best=0.76, ubc=1.31)
    ├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.49)
    ├── (a=9, N=1, Q_v=0.76, best=0.76, ubc=1.60)
    └── (a=17, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=29, N=21, Q_v=0.64, best=0.76, ubc=0.98)
├── (a=3, N=3, Q_v=0.56, best=0.62, ubc=1.28)
├── (a=4, N=1, Q_v=0.58, best=0.58, ubc=1.32)
└── (a=17, N=1, Q_v=0.49, best=0.49, ubc=1.23)
├── (a=9, N=3, Q_v=0.64, best=0.71, ubc=1.35)
├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.34)
└── (a=23, N=1, Q_v=0.71, best=0.71, ubc=1.45)
├── (a=17, N=4, Q_v=0.67, best=0.76, ubc=1.29)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=9, N=1, Q_v=0.53, best=0.53, ubc=1.36)
└── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=23, N=3, Q_v=0.64, best=0.71, ubc=1.35)
├── (a=3, N=1, Q_v=0.62, best=0.62, ubc=1.36)
└── (a=9, N=1, Q_v=0.71, best=0.71, ubc=1.45)
├── (a=30, N=4, Q_v=0.68, best=0.71, ubc=1.30)
├── (a=3, N=1, Q_v=0.71, best=0.71, ubc=1.54)
├── (a=9, N=1, Q_v=0.60, best=0.60, ubc=1.43)
└── (a=34, N=1, Q_v=0.71, best=0.71, ubc=1.54)
└── (a=34, N=3, Q_v=0.58, best=0.71, ubc=1.29)
    ├── (a=3, N=1, Q_v=0.71, best=0.71, ubc=1.45)
    └── (a=30, N=1, Q_v=0.33, best=0.33, ubc=1.07)
└── (a=34, N=18, Q_v=0.61, best=0.76, ubc=0.98)
    ├── (a=3, N=3, Q_v=0.51, best=0.76, ubc=1.20)
    ├── (a=4, N=1, Q_v=0.38, best=0.38, ubc=1.12)
    └── (a=35, N=1, Q_v=0.38, best=0.38, ubc=1.12)
    ├── (a=9, N=3, Q_v=0.72, best=0.75, ubc=1.41)
    ├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    ├── (a=17, N=3, Q_v=0.67, best=0.75, ubc=1.36)
    ├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.34)
    └── (a=18, N=1, Q_v=0.65, best=0.65, ubc=1.40)
    ├── (a=23, N=3, Q_v=0.61, best=0.64, ubc=1.31)
    ├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.34)
    └── (a=24, N=1, Q_v=0.64, best=0.64, ubc=1.38)
    ├── (a=29, N=3, Q_v=0.65, best=0.76, ubc=1.34)
    ├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.50)
    └── (a=30, N=1, Q_v=0.65, best=0.65, ubc=1.40)
    └── (a=35, N=2, Q_v=0.38, best=0.38, ubc=1.23)
        └── (a=3, N=1, Q_v=0.38, best=0.38, ubc=0.97)
[16:54:16] INFO     selected action 9 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16, 32, 33,
                    9]
(N=125, Q_v=0.68, best=0.80)
├── (a=3, N=22, Q_v=0.68, best=0.76, ubc=1.02)
├── (a=4, N=4, Q_v=0.72, best=0.76, ubc=1.34)
├── (a=5, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=10, N=1, Q_v=0.76, best=0.76, ubc=1.60)
└── (a=34, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=10, N=4, Q_v=0.66, best=0.76, ubc=1.29)
├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=11, N=1, Q_v=0.53, best=0.53, ubc=1.36)
└── (a=17, N=1, Q_v=0.62, best=0.62, ubc=1.45)
├── (a=17, N=4, Q_v=0.69, best=0.76, ubc=1.31)
├── (a=4, N=1, Q_v=0.60, best=0.60, ubc=1.43)
├── (a=10, N=1, Q_v=0.65, best=0.65, ubc=1.49)
└── (a=34, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=23, N=3, Q_v=0.66, best=0.76, ubc=1.38)
├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.50)
└── (a=29, N=1, Q_v=0.62, best=0.62, ubc=1.36)
├── (a=29, N=2, Q_v=0.51, best=0.62, ubc=1.39)
└── (a=10, N=1, Q_v=0.40, best=0.40, ubc=0.99)
└── (a=34, N=4, Q_v=0.75, best=0.76, ubc=1.38)
    ├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.60)
    ├── (a=10, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    └── (a=35, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=10, N=17, Q_v=0.64, best=0.80, ubc=1.01)
├── (a=3, N=3, Q_v=0.64, best=0.76, ubc=1.32)
├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.50)
└── (a=11, N=1, Q_v=0.62, best=0.62, ubc=1.36)
├── (a=11, N=2, Q_v=0.55, best=0.71, ubc=1.40)
└── (a=3, N=1, Q_v=0.71, best=0.71, ubc=1.30)
├── (a=17, N=3, Q_v=0.63, best=0.75, ubc=1.32)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=11, N=1, Q_v=0.40, best=0.40, ubc=1.14)
├── (a=23, N=3, Q_v=0.69, best=0.80, ubc=1.38)
├── (a=3, N=1, Q_v=0.53, best=0.53, ubc=1.27)
└── (a=17, N=1, Q_v=0.80, best=0.80, ubc=1.54)
├── (a=29, N=2, Q_v=0.46, best=0.53, ubc=1.31)
└── (a=3, N=1, Q_v=0.53, best=0.53, ubc=1.12)
└── (a=34, N=3, Q_v=0.76, best=0.76, ubc=1.44)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=17, N=1, Q_v=0.76, best=0.76, ubc=1.50)
├── (a=17, N=19, Q_v=0.66, best=0.75, ubc=1.01)
├── (a=3, N=3, Q_v=0.66, best=0.75, ubc=1.36)
├── (a=4, N=1, Q_v=0.62, best=0.62, ubc=1.36)
└── (a=10, N=1, Q_v=0.62, best=0.62, ubc=1.36)
├── (a=10, N=3, Q_v=0.70, best=0.75, ubc=1.40)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=29, N=1, Q_v=0.62, best=0.62, ubc=1.36)
├── (a=18, N=3, Q_v=0.62, best=0.75, ubc=1.32)
├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.34)
└── (a=34, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=23, N=3, Q_v=0.60, best=0.64, ubc=1.30)
├── (a=3, N=1, Q_v=0.64, best=0.64, ubc=1.38)
└── (a=18, N=1, Q_v=0.53, best=0.53, ubc=1.27)
├── (a=29, N=3, Q_v=0.68, best=0.71, ubc=1.38)
├── (a=3, N=1, Q_v=0.71, best=0.71, ubc=1.45)
└── (a=10, N=1, Q_v=0.62, best=0.62, ubc=1.36)
└── (a=34, N=3, Q_v=0.69, best=0.75, ubc=1.39)
    ├── (a=3, N=1, Q_v=0.58, best=0.58, ubc=1.32)
    └── (a=10, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=23, N=19, Q_v=0.66, best=0.76, ubc=1.02)
├── (a=3, N=3, Q_v=0.63, best=0.71, ubc=1.33)
├── (a=4, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=10, N=1, Q_v=0.53, best=0.53, ubc=1.27)
├── (a=10, N=3, Q_v=0.67, best=0.75, ubc=1.37)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=11, N=1, Q_v=0.53, best=0.53, ubc=1.27)
├── (a=17, N=3, Q_v=0.68, best=0.75, ubc=1.39)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=34, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=24, N=3, Q_v=0.63, best=0.65, ubc=1.33)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=10, N=1, Q_v=0.64, best=0.64, ubc=1.38)
├── (a=29, N=3, Q_v=0.63, best=0.65, ubc=1.33)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=30, N=1, Q_v=0.62, best=0.62, ubc=1.36)
└── (a=34, N=3, Q_v=0.70, best=0.76, ubc=1.40)
    ├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.50)
    └── (a=10, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=29, N=17, Q_v=0.64, best=0.76, ubc=1.02)
├── (a=3, N=3, Q_v=0.68, best=0.76, ubc=1.37)
├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.50)
└── (a=23, N=1, Q_v=0.53, best=0.53, ubc=1.27)
├── (a=10, N=2, Q_v=0.55, best=0.69, ubc=1.39)
└── (a=3, N=1, Q_v=0.69, best=0.69, ubc=1.28)
├── (a=17, N=3, Q_v=0.65, best=0.76, ubc=1.34)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=23, N=1, Q_v=0.53, best=0.53, ubc=1.27)
├── (a=23, N=3, Q_v=0.67, best=0.71, ubc=1.36)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=10, N=1, Q_v=0.71, best=0.71, ubc=1.45)
├── (a=30, N=2, Q_v=0.61, best=0.62, ubc=1.45)
└── (a=10, N=1, Q_v=0.62, best=0.62, ubc=1.21)
└── (a=34, N=3, Q_v=0.70, best=0.76, ubc=1.38)
    ├── (a=3, N=1, Q_v=0.62, best=0.62, ubc=1.36)
    └── (a=17, N=1, Q_v=0.71, best=0.71, ubc=1.45)
└── (a=34, N=30, Q_v=0.73, best=0.76, ubc=1.02)
    ├── (a=3, N=5, Q_v=0.75, best=0.76, ubc=1.33)
    ├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=10, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=17, N=1, Q_v=0.76, best=0.76, ubc=1.66)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=10, N=5, Q_v=0.76, best=0.76, ubc=1.34)
    ├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.66)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=17, N=1, Q_v=0.76, best=0.76, ubc=1.66)
    └── (a=29, N=1, Q_v=0.76, best=0.76, ubc=1.66)
    ├── (a=17, N=5, Q_v=0.75, best=0.76, ubc=1.34)
    ├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.66)
    ├── (a=10, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=18, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=29, N=1, Q_v=0.76, best=0.76, ubc=1.66)
    ├── (a=23, N=4, Q_v=0.71, best=0.75, ubc=1.36)
    ├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.43)
    ├── (a=10, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    └── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    ├── (a=29, N=5, Q_v=0.71, best=0.75, ubc=1.29)
    ├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.55)
    ├── (a=10, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=17, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=23, N=1, Q_v=0.65, best=0.65, ubc=1.55)
    └── (a=35, N=5, Q_v=0.72, best=0.76, ubc=1.30)
        ├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.55)
        ├── (a=10, N=1, Q_v=0.76, best=0.76, ubc=1.66)
        ├── (a=17, N=1, Q_v=0.76, best=0.76, ubc=1.66)
        └── (a=23, N=1, Q_v=0.75, best=0.75, ubc=1.64)
[16:54:17] INFO     selected action 34 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16, 32, 33,
                    9, 34]
(N=125, Q_v=0.73, best=0.80)
├── (a=3, N=20, Q_v=0.72, best=0.76, ubc=1.07)
├── (a=4, N=3, Q_v=0.70, best=0.76, ubc=1.41)
├── (a=5, N=1, Q_v=0.60, best=0.60, ubc=1.34)
└── (a=10, N=1, Q_v=0.76, best=0.76, ubc=1.50)
├── (a=10, N=3, Q_v=0.74, best=0.76, ubc=1.45)
├── (a=4, N=1, Q_v=0.71, best=0.71, ubc=1.45)
└── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=17, N=3, Q_v=0.70, best=0.76, ubc=1.41)
├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.50)
└── (a=18, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=23, N=3, Q_v=0.69, best=0.75, ubc=1.40)
├── (a=4, N=1, Q_v=0.58, best=0.58, ubc=1.32)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=29, N=4, Q_v=0.75, best=0.76, ubc=1.37)
├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=10, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=35, N=1, Q_v=0.76, best=0.76, ubc=1.60)
└── (a=35, N=3, Q_v=0.72, best=0.76, ubc=1.42)
    ├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.50)
    └── (a=23, N=1, Q_v=0.64, best=0.64, ubc=1.38)
├── (a=10, N=24, Q_v=0.75, best=0.80, ubc=1.07)
├── (a=3, N=4, Q_v=0.76, best=0.80, ubc=1.39)
├── (a=4, N=1, Q_v=0.80, best=0.80, ubc=1.63)
├── (a=11, N=1, Q_v=0.76, best=0.76, ubc=1.60)
└── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=4, Q_v=0.77, best=0.80, ubc=1.40)
├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=29, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=17, N=4, Q_v=0.75, best=0.75, ubc=1.38)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=23, N=3, Q_v=0.73, best=0.75, ubc=1.46)
├── (a=3, N=1, Q_v=0.71, best=0.71, ubc=1.45)
└── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=29, N=4, Q_v=0.75, best=0.76, ubc=1.38)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=35, N=4, Q_v=0.75, best=0.76, ubc=1.38)
    ├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.60)
    ├── (a=11, N=1, Q_v=0.76, best=0.76, ubc=1.60)
    └── (a=23, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=17, N=21, Q_v=0.73, best=0.76, ubc=1.07)
├── (a=3, N=3, Q_v=0.72, best=0.75, ubc=1.43)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=29, N=1, Q_v=0.65, best=0.65, ubc=1.40)
├── (a=10, N=4, Q_v=0.75, best=0.75, ubc=1.36)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=18, N=3, Q_v=0.75, best=0.75, ubc=1.46)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=10, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=23, N=3, Q_v=0.68, best=0.76, ubc=1.40)
├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.50)
└── (a=35, N=1, Q_v=0.65, best=0.65, ubc=1.40)
├── (a=29, N=3, Q_v=0.72, best=0.76, ubc=1.43)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=35, N=4, Q_v=0.76, best=0.76, ubc=1.38)
    ├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.60)
    ├── (a=10, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    └── (a=29, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=23, N=17, Q_v=0.69, best=0.75, ubc=1.07)
├── (a=3, N=3, Q_v=0.69, best=0.75, ubc=1.38)
├── (a=4, N=1, Q_v=0.69, best=0.69, ubc=1.43)
└── (a=24, N=1, Q_v=0.64, best=0.64, ubc=1.38)
├── (a=10, N=3, Q_v=0.75, best=0.75, ubc=1.43)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=17, N=3, Q_v=0.68, best=0.75, ubc=1.37)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=24, N=2, Q_v=0.65, best=0.65, ubc=1.50)
└── (a=35, N=1, Q_v=0.65, best=0.65, ubc=1.24)
├── (a=29, N=3, Q_v=0.68, best=0.75, ubc=1.37)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=24, N=1, Q_v=0.64, best=0.64, ubc=1.38)
└── (a=35, N=2, Q_v=0.64, best=0.64, ubc=1.48)
    └── (a=17, N=1, Q_v=0.64, best=0.64, ubc=1.22)
├── (a=29, N=21, Q_v=0.73, best=0.76, ubc=1.07)
├── (a=3, N=4, Q_v=0.76, best=0.76, ubc=1.38)
├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=10, N=1, Q_v=0.76, best=0.76, ubc=1.60)
└── (a=17, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=10, N=3, Q_v=0.75, best=0.75, ubc=1.46)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=17, N=3, Q_v=0.70, best=0.76, ubc=1.41)
├── (a=3, N=1, Q_v=0.58, best=0.58, ubc=1.32)
└── (a=35, N=1, Q_v=0.76, best=0.76, ubc=1.50)
├── (a=23, N=3, Q_v=0.68, best=0.75, ubc=1.40)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=24, N=1, Q_v=0.65, best=0.65, ubc=1.40)
├── (a=30, N=4, Q_v=0.75, best=0.76, ubc=1.37)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=10, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=17, N=1, Q_v=0.76, best=0.76, ubc=1.60)
└── (a=35, N=3, Q_v=0.72, best=0.76, ubc=1.43)
    ├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.50)
    └── (a=23, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=21, Q_v=0.72, best=0.76, ubc=1.06)
    ├── (a=3, N=4, Q_v=0.76, best=0.76, ubc=1.38)
    ├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.60)
    ├── (a=10, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    └── (a=29, N=1, Q_v=0.76, best=0.76, ubc=1.60)
    ├── (a=10, N=4, Q_v=0.75, best=0.76, ubc=1.37)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    └── (a=17, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    ├── (a=17, N=3, Q_v=0.75, best=0.75, ubc=1.46)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=10, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    ├── (a=23, N=3, Q_v=0.64, best=0.65, ubc=1.35)
    ├── (a=3, N=1, Q_v=0.60, best=0.60, ubc=1.34)
    └── (a=36, N=1, Q_v=0.65, best=0.65, ubc=1.40)
    ├── (a=29, N=3, Q_v=0.72, best=0.75, ubc=1.43)
    ├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
    └── (a=17, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=36, N=3, Q_v=0.72, best=0.76, ubc=1.43)
        ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
        └── (a=17, N=1, Q_v=0.64, best=0.64, ubc=1.38)
[16:54:19] INFO     selected action 10 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16, 32, 33,
                    9, 34, 10]
(N=125, Q_v=0.75, best=0.80)
├── (a=3, N=20, Q_v=0.74, best=0.76, ubc=1.08)
├── (a=4, N=3, Q_v=0.75, best=0.76, ubc=1.46)
├── (a=5, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=11, N=4, Q_v=0.76, best=0.76, ubc=1.37)
├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=12, N=1, Q_v=0.76, best=0.76, ubc=1.60)
└── (a=23, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=17, N=3, Q_v=0.76, best=0.76, ubc=1.46)
├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.50)
└── (a=11, N=1, Q_v=0.76, best=0.76, ubc=1.50)
├── (a=23, N=3, Q_v=0.68, best=0.76, ubc=1.39)
├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.50)
└── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=29, N=3, Q_v=0.72, best=0.75, ubc=1.42)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=17, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=3, Q_v=0.75, best=0.76, ubc=1.46)
    ├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=11, N=20, Q_v=0.74, best=0.80, ubc=1.09)
├── (a=3, N=3, Q_v=0.75, best=0.76, ubc=1.46)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=12, N=1, Q_v=0.76, best=0.76, ubc=1.50)
├── (a=12, N=4, Q_v=0.76, best=0.80, ubc=1.37)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=17, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=23, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=17, N=3, Q_v=0.73, best=0.75, ubc=1.43)
├── (a=3, N=1, Q_v=0.69, best=0.69, ubc=1.43)
└── (a=23, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=23, N=3, Q_v=0.68, best=0.76, ubc=1.39)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=12, N=1, Q_v=0.76, best=0.76, ubc=1.50)
├── (a=29, N=3, Q_v=0.75, best=0.75, ubc=1.45)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=17, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=3, Q_v=0.76, best=0.76, ubc=1.46)
    ├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.50)
    └── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=17, N=21, Q_v=0.75, best=0.80, ubc=1.09)
├── (a=3, N=4, Q_v=0.76, best=0.80, ubc=1.38)
├── (a=4, N=1, Q_v=0.80, best=0.80, ubc=1.63)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=18, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=4, Q_v=0.75, best=0.76, ubc=1.37)
├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=18, N=3, Q_v=0.75, best=0.76, ubc=1.46)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=23, N=3, Q_v=0.73, best=0.80, ubc=1.45)
├── (a=3, N=1, Q_v=0.80, best=0.80, ubc=1.54)
└── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=29, N=3, Q_v=0.75, best=0.76, ubc=1.46)
├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.50)
└── (a=23, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=3, Q_v=0.75, best=0.75, ubc=1.46)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=23, N=21, Q_v=0.75, best=0.80, ubc=1.09)
├── (a=3, N=4, Q_v=0.75, best=0.76, ubc=1.37)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=17, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=3, Q_v=0.75, best=0.75, ubc=1.46)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=17, N=4, Q_v=0.76, best=0.80, ubc=1.38)
├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=11, N=1, Q_v=0.80, best=0.80, ubc=1.63)
└── (a=18, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=24, N=3, Q_v=0.75, best=0.75, ubc=1.46)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=29, N=3, Q_v=0.75, best=0.75, ubc=1.46)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=3, Q_v=0.75, best=0.76, ubc=1.46)
    ├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.50)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=29, N=21, Q_v=0.74, best=0.76, ubc=1.08)
├── (a=3, N=3, Q_v=0.73, best=0.75, ubc=1.44)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=30, N=1, Q_v=0.69, best=0.69, ubc=1.43)
├── (a=11, N=3, Q_v=0.75, best=0.75, ubc=1.46)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=17, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=17, N=4, Q_v=0.75, best=0.76, ubc=1.37)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=18, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=23, N=4, Q_v=0.75, best=0.76, ubc=1.37)
├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=17, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=30, N=3, Q_v=0.73, best=0.75, ubc=1.44)
├── (a=3, N=1, Q_v=0.69, best=0.69, ubc=1.43)
└── (a=23, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=3, Q_v=0.75, best=0.76, ubc=1.46)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=11, N=1, Q_v=0.76, best=0.76, ubc=1.50)
└── (a=35, N=21, Q_v=0.75, best=0.76, ubc=1.09)
    ├── (a=3, N=4, Q_v=0.76, best=0.76, ubc=1.38)
    ├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.60)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    └── (a=23, N=1, Q_v=0.76, best=0.76, ubc=1.60)
    ├── (a=11, N=3, Q_v=0.75, best=0.75, ubc=1.46)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=17, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    ├── (a=17, N=4, Q_v=0.75, best=0.76, ubc=1.37)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    ├── (a=11, N=1, Q_v=0.76, best=0.76, ubc=1.60)
    └── (a=18, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    ├── (a=23, N=3, Q_v=0.75, best=0.75, ubc=1.46)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    ├── (a=29, N=3, Q_v=0.75, best=0.76, ubc=1.46)
    ├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.50)
    └── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=36, N=3, Q_v=0.75, best=0.75, ubc=1.46)
        ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
        └── (a=17, N=1, Q_v=0.75, best=0.75, ubc=1.49)
[16:54:20] INFO     selected action 23 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16, 32, 33,
                    9, 34, 10, 23]
(N=125, Q_v=0.75, best=0.80)
├── (a=3, N=21, Q_v=0.75, best=0.80, ubc=1.08)
├── (a=4, N=3, Q_v=0.74, best=0.76, ubc=1.45)
├── (a=5, N=1, Q_v=0.76, best=0.76, ubc=1.50)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=11, N=4, Q_v=0.75, best=0.76, ubc=1.37)
├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=12, N=1, Q_v=0.76, best=0.76, ubc=1.60)
└── (a=17, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=17, N=4, Q_v=0.76, best=0.80, ubc=1.38)
├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=11, N=1, Q_v=0.80, best=0.80, ubc=1.63)
└── (a=18, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=24, N=3, Q_v=0.72, best=0.75, ubc=1.43)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=29, N=3, Q_v=0.75, best=0.75, ubc=1.46)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=3, Q_v=0.75, best=0.75, ubc=1.46)
    ├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=11, N=21, Q_v=0.75, best=0.80, ubc=1.09)
├── (a=3, N=4, Q_v=0.75, best=0.76, ubc=1.37)
├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=12, N=1, Q_v=0.76, best=0.76, ubc=1.60)
└── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=12, N=3, Q_v=0.75, best=0.76, ubc=1.46)
├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.50)
└── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=17, N=3, Q_v=0.75, best=0.75, ubc=1.46)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=24, N=3, Q_v=0.75, best=0.75, ubc=1.46)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=29, N=4, Q_v=0.76, best=0.80, ubc=1.38)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=35, N=3, Q_v=0.75, best=0.75, ubc=1.46)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=17, N=21, Q_v=0.75, best=0.80, ubc=1.09)
├── (a=3, N=4, Q_v=0.76, best=0.80, ubc=1.38)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=18, N=1, Q_v=0.80, best=0.80, ubc=1.63)
├── (a=11, N=4, Q_v=0.76, best=0.80, ubc=1.38)
├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=29, N=1, Q_v=0.80, best=0.80, ubc=1.63)
├── (a=18, N=3, Q_v=0.75, best=0.76, ubc=1.46)
├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.50)
└── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=24, N=3, Q_v=0.75, best=0.75, ubc=1.46)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=29, N=3, Q_v=0.75, best=0.75, ubc=1.46)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=3, Q_v=0.75, best=0.75, ubc=1.46)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=24, N=19, Q_v=0.73, best=0.75, ubc=1.09)
├── (a=3, N=4, Q_v=0.75, best=0.75, ubc=1.35)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=17, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=4, Q_v=0.72, best=0.75, ubc=1.33)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=17, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=17, N=4, Q_v=0.75, best=0.75, ubc=1.35)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=29, N=3, Q_v=0.68, best=0.75, ubc=1.39)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.40)
└── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=3, Q_v=0.75, best=0.75, ubc=1.45)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=29, N=21, Q_v=0.75, best=0.76, ubc=1.09)
├── (a=3, N=3, Q_v=0.75, best=0.75, ubc=1.46)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=17, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=11, N=4, Q_v=0.75, best=0.76, ubc=1.37)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=30, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=17, N=3, Q_v=0.75, best=0.75, ubc=1.46)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=18, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=24, N=3, Q_v=0.75, best=0.75, ubc=1.46)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=30, N=4, Q_v=0.75, best=0.76, ubc=1.37)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=35, N=3, Q_v=0.75, best=0.75, ubc=1.46)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=21, Q_v=0.75, best=0.76, ubc=1.09)
    ├── (a=3, N=4, Q_v=0.75, best=0.76, ubc=1.37)
    ├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.60)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    └── (a=17, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    ├── (a=11, N=4, Q_v=0.75, best=0.75, ubc=1.36)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    ├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    ├── (a=17, N=3, Q_v=0.75, best=0.75, ubc=1.46)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    ├── (a=24, N=3, Q_v=0.75, best=0.75, ubc=1.46)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    ├── (a=29, N=3, Q_v=0.75, best=0.75, ubc=1.46)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=36, N=3, Q_v=0.75, best=0.75, ubc=1.46)
        ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
        └── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.49)
[16:54:22] INFO     selected action 17 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16, 32, 33,
                    9, 34, 10, 23, 17]
(N=125, Q_v=0.74, best=0.80)
├── (a=3, N=20, Q_v=0.74, best=0.76, ubc=1.08)
├── (a=4, N=3, Q_v=0.73, best=0.76, ubc=1.44)
├── (a=5, N=1, Q_v=0.69, best=0.69, ubc=1.43)
└── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=11, N=3, Q_v=0.75, best=0.75, ubc=1.45)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=18, N=3, Q_v=0.72, best=0.76, ubc=1.43)
├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.50)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=24, N=3, Q_v=0.75, best=0.75, ubc=1.45)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=29, N=3, Q_v=0.72, best=0.75, ubc=1.42)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=4, Q_v=0.75, best=0.76, ubc=1.36)
    ├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.60)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    └── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=21, Q_v=0.75, best=0.80, ubc=1.09)
├── (a=3, N=3, Q_v=0.72, best=0.76, ubc=1.43)
├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.50)
└── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=12, N=4, Q_v=0.76, best=0.80, ubc=1.38)
├── (a=3, N=1, Q_v=0.80, best=0.80, ubc=1.63)
├── (a=18, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=18, N=4, Q_v=0.76, best=0.80, ubc=1.38)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=24, N=3, Q_v=0.75, best=0.75, ubc=1.46)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=29, N=3, Q_v=0.75, best=0.75, ubc=1.46)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=3, Q_v=0.75, best=0.75, ubc=1.46)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=18, N=22, Q_v=0.75, best=0.80, ubc=1.08)
├── (a=3, N=5, Q_v=0.77, best=0.80, ubc=1.33)
├── (a=4, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=29, N=1, Q_v=0.76, best=0.76, ubc=1.66)
├── (a=11, N=4, Q_v=0.75, best=0.75, ubc=1.37)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=24, N=4, Q_v=0.75, best=0.75, ubc=1.37)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=29, N=4, Q_v=0.76, best=0.76, ubc=1.38)
├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=11, N=1, Q_v=0.76, best=0.76, ubc=1.60)
└── (a=35, N=1, Q_v=0.76, best=0.76, ubc=1.60)
└── (a=35, N=4, Q_v=0.75, best=0.75, ubc=1.37)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    └── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=24, N=19, Q_v=0.73, best=0.75, ubc=1.09)
├── (a=3, N=3, Q_v=0.67, best=0.75, ubc=1.37)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=11, N=4, Q_v=0.75, best=0.75, ubc=1.35)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=18, N=3, Q_v=0.72, best=0.75, ubc=1.42)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=29, N=1, Q_v=0.65, best=0.65, ubc=1.40)
├── (a=29, N=4, Q_v=0.75, best=0.75, ubc=1.35)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=18, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=35, N=4, Q_v=0.75, best=0.75, ubc=1.35)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    └── (a=18, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=29, N=21, Q_v=0.75, best=0.76, ubc=1.09)
├── (a=3, N=4, Q_v=0.75, best=0.75, ubc=1.36)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=18, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=3, Q_v=0.75, best=0.75, ubc=1.46)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=18, N=4, Q_v=0.75, best=0.76, ubc=1.37)
├── (a=3, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=24, N=3, Q_v=0.75, best=0.75, ubc=1.46)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=18, N=1, Q_v=0.75, best=0.75, ubc=1.49)
├── (a=30, N=3, Q_v=0.75, best=0.75, ubc=1.46)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=18, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=3, Q_v=0.75, best=0.75, ubc=1.46)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.49)
└── (a=35, N=21, Q_v=0.75, best=0.76, ubc=1.09)
    ├── (a=3, N=4, Q_v=0.75, best=0.76, ubc=1.37)
    ├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.60)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    └── (a=18, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    ├── (a=11, N=4, Q_v=0.75, best=0.76, ubc=1.37)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    ├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    └── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    ├── (a=18, N=3, Q_v=0.75, best=0.76, ubc=1.46)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=36, N=1, Q_v=0.76, best=0.76, ubc=1.50)
    ├── (a=24, N=3, Q_v=0.75, best=0.75, ubc=1.46)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=18, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    ├── (a=29, N=3, Q_v=0.75, best=0.75, ubc=1.46)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.49)
    └── (a=36, N=3, Q_v=0.75, best=0.75, ubc=1.46)
        ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.49)
        └── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.49)
[16:54:23] INFO     selected action 18 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16, 32, 33,
                    9, 34, 10, 23, 17, 18]
(N=125, Q_v=0.74, best=0.80)
├── (a=3, N=25, Q_v=0.75, best=0.80, ubc=1.06)
├── (a=4, N=5, Q_v=0.75, best=0.80, ubc=1.32)
├── (a=5, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=11, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=24, N=1, Q_v=0.65, best=0.65, ubc=1.55)
└── (a=29, N=1, Q_v=0.76, best=0.76, ubc=1.66)
├── (a=11, N=5, Q_v=0.77, best=0.80, ubc=1.33)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=12, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=29, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=24, N=4, Q_v=0.72, best=0.75, ubc=1.36)
├── (a=4, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=29, N=5, Q_v=0.75, best=0.76, ubc=1.32)
├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.66)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=35, N=5, Q_v=0.75, best=0.75, ubc=1.31)
    ├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=11, N=25, Q_v=0.75, best=0.80, ubc=1.06)
├── (a=3, N=4, Q_v=0.74, best=0.80, ubc=1.37)
├── (a=4, N=1, Q_v=0.80, best=0.80, ubc=1.63)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=12, N=5, Q_v=0.75, best=0.75, ubc=1.31)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=5, Q_v=0.75, best=0.75, ubc=1.31)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=29, N=5, Q_v=0.75, best=0.75, ubc=1.31)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=35, N=5, Q_v=0.75, best=0.75, ubc=1.31)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=24, Q_v=0.74, best=0.75, ubc=1.05)
├── (a=3, N=6, Q_v=0.75, best=0.75, ubc=1.26)
├── (a=4, N=2, Q_v=0.75, best=0.75, ubc=1.41)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=11, N=6, Q_v=0.73, best=0.75, ubc=1.24)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.60)
├── (a=12, N=2, Q_v=0.75, best=0.75, ubc=1.41)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=29, N=5, Q_v=0.73, best=0.75, ubc=1.29)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.55)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=35, N=6, Q_v=0.75, best=0.75, ubc=1.26)
    ├── (a=3, N=2, Q_v=0.75, best=0.75, ubc=1.41)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    ├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    └── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=29, N=24, Q_v=0.74, best=0.76, ubc=1.06)
├── (a=3, N=4, Q_v=0.73, best=0.76, ubc=1.36)
├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=30, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=11, N=5, Q_v=0.75, best=0.75, ubc=1.31)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=5, Q_v=0.75, best=0.75, ubc=1.31)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=30, N=4, Q_v=0.72, best=0.75, ubc=1.35)
├── (a=3, N=1, Q_v=0.65, best=0.65, ubc=1.49)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=35, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=35, N=5, Q_v=0.75, best=0.76, ubc=1.31)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=30, N=1, Q_v=0.76, best=0.76, ubc=1.66)
└── (a=35, N=26, Q_v=0.75, best=0.80, ubc=1.05)
    ├── (a=3, N=5, Q_v=0.76, best=0.80, ubc=1.33)
    ├── (a=4, N=1, Q_v=0.80, best=0.80, ubc=1.70)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=11, N=5, Q_v=0.76, best=0.80, ubc=1.33)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=29, N=1, Q_v=0.80, best=0.80, ubc=1.70)
    ├── (a=24, N=5, Q_v=0.75, best=0.75, ubc=1.32)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=29, N=5, Q_v=0.75, best=0.75, ubc=1.32)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=36, N=5, Q_v=0.75, best=0.75, ubc=1.32)
        ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.64)
        ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
        ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
        └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
[16:54:24] INFO     selected action 35 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16, 32, 33,
                    9, 34, 10, 23, 17, 18, 35]
(N=125, Q_v=0.75, best=0.80)
├── (a=3, N=26, Q_v=0.76, best=0.80, ubc=1.06)
├── (a=4, N=5, Q_v=0.76, best=0.80, ubc=1.33)
├── (a=5, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=11, N=5, Q_v=0.77, best=0.80, ubc=1.34)
├── (a=4, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=12, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=5, Q_v=0.75, best=0.75, ubc=1.32)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=29, N=5, Q_v=0.75, best=0.76, ubc=1.32)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=30, N=1, Q_v=0.76, best=0.76, ubc=1.66)
└── (a=36, N=5, Q_v=0.76, best=0.80, ubc=1.33)
    ├── (a=4, N=1, Q_v=0.80, best=0.80, ubc=1.70)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=11, N=25, Q_v=0.75, best=0.80, ubc=1.06)
├── (a=3, N=5, Q_v=0.76, best=0.80, ubc=1.32)
├── (a=4, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=12, N=5, Q_v=0.75, best=0.75, ubc=1.31)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=4, Q_v=0.75, best=0.75, ubc=1.38)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=29, N=5, Q_v=0.76, best=0.80, ubc=1.32)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=5, Q_v=0.76, best=0.80, ubc=1.32)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=24, Q_v=0.75, best=0.75, ubc=1.06)
├── (a=3, N=6, Q_v=0.75, best=0.75, ubc=1.26)
├── (a=4, N=2, Q_v=0.75, best=0.75, ubc=1.41)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=11, N=6, Q_v=0.75, best=0.75, ubc=1.26)
├── (a=3, N=2, Q_v=0.75, best=0.75, ubc=1.41)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=29, N=6, Q_v=0.75, best=0.75, ubc=1.26)
├── (a=3, N=2, Q_v=0.75, best=0.75, ubc=1.41)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.69)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.69)
└── (a=36, N=5, Q_v=0.75, best=0.75, ubc=1.31)
    ├── (a=3, N=2, Q_v=0.75, best=0.75, ubc=1.38)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=29, N=24, Q_v=0.75, best=0.76, ubc=1.06)
├── (a=3, N=5, Q_v=0.75, best=0.75, ubc=1.31)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=11, N=5, Q_v=0.75, best=0.75, ubc=1.31)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=4, Q_v=0.75, best=0.75, ubc=1.38)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=30, N=5, Q_v=0.75, best=0.76, ubc=1.31)
├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=4, Q_v=0.75, best=0.75, ubc=1.38)
    ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    └── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=36, N=25, Q_v=0.75, best=0.80, ubc=1.06)
    ├── (a=3, N=6, Q_v=0.75, best=0.76, ubc=1.27)
    ├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    └── (a=29, N=2, Q_v=0.75, best=0.76, ubc=1.42)
    ├── (a=11, N=6, Q_v=0.76, best=0.80, ubc=1.28)
    ├── (a=3, N=2, Q_v=0.80, best=0.80, ubc=1.47)
    ├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    ├── (a=24, N=6, Q_v=0.75, best=0.75, ubc=1.26)
    ├── (a=3, N=2, Q_v=0.75, best=0.75, ubc=1.41)
    ├── (a=11, N=2, Q_v=0.75, best=0.75, ubc=1.41)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    └── (a=29, N=6, Q_v=0.75, best=0.76, ubc=1.27)
        ├── (a=3, N=1, Q_v=0.75, best=0.75, ubc=1.69)
        ├── (a=11, N=2, Q_v=0.75, best=0.76, ubc=1.42)
        ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.69)
        └── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.69)
[16:54:25] INFO     selected action 3 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16, 32, 33,
                    9, 34, 10, 23, 17, 18, 35, 3]
(N=125, Q_v=0.75, best=0.80)
├── (a=4, N=27, Q_v=0.76, best=0.80, ubc=1.06)
├── (a=5, N=6, Q_v=0.78, best=0.80, ubc=1.31)
├── (a=6, N=1, Q_v=0.80, best=0.80, ubc=1.75)
├── (a=11, N=1, Q_v=0.80, best=0.80, ubc=1.75)
├── (a=24, N=1, Q_v=0.80, best=0.80, ubc=1.75)
├── (a=29, N=1, Q_v=0.76, best=0.76, ubc=1.71)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=11, N=5, Q_v=0.77, best=0.80, ubc=1.34)
├── (a=5, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=5, Q_v=0.75, best=0.75, ubc=1.32)
├── (a=5, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=29, N=5, Q_v=0.75, best=0.76, ubc=1.32)
├── (a=5, N=1, Q_v=0.76, best=0.76, ubc=1.66)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=5, Q_v=0.78, best=0.80, ubc=1.35)
    ├── (a=5, N=1, Q_v=0.80, best=0.80, ubc=1.70)
    ├── (a=11, N=1, Q_v=0.80, best=0.80, ubc=1.70)
    ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=11, N=25, Q_v=0.75, best=0.80, ubc=1.06)
├── (a=4, N=5, Q_v=0.77, best=0.80, ubc=1.33)
├── (a=5, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=29, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=12, N=5, Q_v=0.76, best=0.80, ubc=1.32)
├── (a=4, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=5, Q_v=0.75, best=0.75, ubc=1.31)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=29, N=5, Q_v=0.76, best=0.80, ubc=1.32)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=12, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=4, Q_v=0.75, best=0.75, ubc=1.38)
    ├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    ├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=24, N=23, Q_v=0.75, best=0.75, ubc=1.07)
├── (a=4, N=6, Q_v=0.75, best=0.75, ubc=1.26)
├── (a=5, N=2, Q_v=0.75, best=0.75, ubc=1.41)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=11, N=6, Q_v=0.75, best=0.75, ubc=1.26)
├── (a=4, N=2, Q_v=0.75, best=0.75, ubc=1.41)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=29, N=5, Q_v=0.75, best=0.75, ubc=1.31)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=5, Q_v=0.75, best=0.75, ubc=1.31)
    ├── (a=4, N=2, Q_v=0.75, best=0.75, ubc=1.38)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=29, N=24, Q_v=0.75, best=0.76, ubc=1.06)
├── (a=4, N=5, Q_v=0.75, best=0.76, ubc=1.31)
├── (a=5, N=1, Q_v=0.76, best=0.76, ubc=1.66)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=11, N=5, Q_v=0.75, best=0.76, ubc=1.31)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=30, N=1, Q_v=0.76, best=0.76, ubc=1.66)
├── (a=24, N=4, Q_v=0.75, best=0.75, ubc=1.38)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=30, N=4, Q_v=0.75, best=0.75, ubc=1.38)
├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=36, N=5, Q_v=0.75, best=0.76, ubc=1.31)
    ├── (a=4, N=1, Q_v=0.76, best=0.76, ubc=1.66)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=25, Q_v=0.75, best=0.80, ubc=1.06)
    ├── (a=4, N=6, Q_v=0.76, best=0.80, ubc=1.28)
    ├── (a=5, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    └── (a=29, N=2, Q_v=0.75, best=0.76, ubc=1.42)
    ├── (a=11, N=6, Q_v=0.76, best=0.80, ubc=1.28)
    ├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    ├── (a=12, N=2, Q_v=0.77, best=0.80, ubc=1.44)
    ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    ├── (a=24, N=6, Q_v=0.75, best=0.75, ubc=1.26)
    ├── (a=4, N=2, Q_v=0.75, best=0.75, ubc=1.41)
    ├── (a=11, N=2, Q_v=0.75, best=0.75, ubc=1.41)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    └── (a=29, N=6, Q_v=0.75, best=0.76, ubc=1.27)
        ├── (a=4, N=1, Q_v=0.75, best=0.75, ubc=1.69)
        ├── (a=11, N=2, Q_v=0.75, best=0.76, ubc=1.42)
        ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.69)
        └── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.69)
[16:54:26] INFO     selected action 4 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16, 32, 33,
                    9, 34, 10, 23, 17, 18, 35, 3, 4]
(N=125, Q_v=0.76, best=0.80)
├── (a=5, N=27, Q_v=0.78, best=0.80, ubc=1.07)
├── (a=6, N=5, Q_v=0.76, best=0.80, ubc=1.34)
├── (a=11, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=29, N=1, Q_v=0.76, best=0.76, ubc=1.66)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=11, N=6, Q_v=0.80, best=0.80, ubc=1.32)
├── (a=6, N=1, Q_v=0.80, best=0.80, ubc=1.75)
├── (a=12, N=1, Q_v=0.80, best=0.80, ubc=1.75)
├── (a=24, N=1, Q_v=0.80, best=0.80, ubc=1.75)
├── (a=29, N=1, Q_v=0.80, best=0.80, ubc=1.75)
└── (a=36, N=1, Q_v=0.80, best=0.80, ubc=1.75)
├── (a=24, N=5, Q_v=0.78, best=0.80, ubc=1.35)
├── (a=6, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=11, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=29, N=1, Q_v=0.76, best=0.76, ubc=1.66)
└── (a=36, N=1, Q_v=0.76, best=0.76, ubc=1.66)
├── (a=29, N=5, Q_v=0.75, best=0.76, ubc=1.33)
├── (a=6, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=11, N=1, Q_v=0.76, best=0.76, ubc=1.66)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=30, N=1, Q_v=0.76, best=0.76, ubc=1.66)
└── (a=36, N=5, Q_v=0.77, best=0.80, ubc=1.35)
    ├── (a=6, N=1, Q_v=0.80, best=0.80, ubc=1.70)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=24, N=1, Q_v=0.76, best=0.76, ubc=1.66)
    └── (a=29, N=1, Q_v=0.76, best=0.76, ubc=1.66)
├── (a=11, N=25, Q_v=0.76, best=0.80, ubc=1.07)
├── (a=5, N=5, Q_v=0.79, best=0.80, ubc=1.36)
├── (a=6, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=12, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=24, N=1, Q_v=0.80, best=0.80, ubc=1.70)
└── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=12, N=5, Q_v=0.77, best=0.80, ubc=1.33)
├── (a=5, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=24, N=4, Q_v=0.75, best=0.75, ubc=1.38)
├── (a=5, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=29, N=5, Q_v=0.76, best=0.80, ubc=1.32)
├── (a=5, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=5, Q_v=0.76, best=0.80, ubc=1.32)
    ├── (a=5, N=1, Q_v=0.80, best=0.80, ubc=1.70)
    ├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=23, Q_v=0.75, best=0.75, ubc=1.07)
├── (a=5, N=6, Q_v=0.75, best=0.75, ubc=1.26)
├── (a=6, N=2, Q_v=0.75, best=0.75, ubc=1.41)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=11, N=6, Q_v=0.75, best=0.75, ubc=1.26)
├── (a=5, N=2, Q_v=0.75, best=0.75, ubc=1.41)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=29, N=5, Q_v=0.75, best=0.75, ubc=1.31)
├── (a=5, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=5, Q_v=0.75, best=0.75, ubc=1.31)
    ├── (a=5, N=2, Q_v=0.75, best=0.75, ubc=1.38)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=29, N=24, Q_v=0.75, best=0.76, ubc=1.07)
├── (a=5, N=5, Q_v=0.76, best=0.76, ubc=1.32)
├── (a=6, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=11, N=1, Q_v=0.76, best=0.76, ubc=1.66)
├── (a=24, N=1, Q_v=0.76, best=0.76, ubc=1.66)
└── (a=30, N=1, Q_v=0.76, best=0.76, ubc=1.66)
├── (a=11, N=4, Q_v=0.75, best=0.76, ubc=1.38)
├── (a=5, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=24, N=4, Q_v=0.75, best=0.75, ubc=1.38)
├── (a=5, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=30, N=5, Q_v=0.76, best=0.76, ubc=1.32)
├── (a=5, N=1, Q_v=0.76, best=0.76, ubc=1.66)
├── (a=11, N=1, Q_v=0.76, best=0.76, ubc=1.66)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=1, Q_v=0.76, best=0.76, ubc=1.66)
└── (a=36, N=5, Q_v=0.75, best=0.76, ubc=1.32)
    ├── (a=5, N=1, Q_v=0.76, best=0.76, ubc=1.66)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=25, Q_v=0.76, best=0.80, ubc=1.07)
    ├── (a=5, N=6, Q_v=0.77, best=0.80, ubc=1.29)
    ├── (a=6, N=1, Q_v=0.76, best=0.76, ubc=1.71)
    ├── (a=11, N=2, Q_v=0.80, best=0.80, ubc=1.47)
    ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    └── (a=29, N=1, Q_v=0.76, best=0.76, ubc=1.71)
    ├── (a=11, N=6, Q_v=0.75, best=0.80, ubc=1.27)
    ├── (a=5, N=2, Q_v=0.77, best=0.80, ubc=1.44)
    ├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    ├── (a=24, N=6, Q_v=0.75, best=0.75, ubc=1.26)
    ├── (a=5, N=2, Q_v=0.75, best=0.75, ubc=1.41)
    ├── (a=11, N=2, Q_v=0.75, best=0.75, ubc=1.41)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    └── (a=29, N=6, Q_v=0.75, best=0.76, ubc=1.27)
        ├── (a=5, N=2, Q_v=0.75, best=0.76, ubc=1.42)
        ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.69)
        ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.69)
        └── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.69)
           INFO     selected action 5 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16, 32, 33,
                    9, 34, 10, 23, 17, 18, 35, 3, 4, 5]
(N=125, Q_v=0.77, best=0.80)
├── (a=6, N=25, Q_v=0.77, best=0.80, ubc=1.09)
├── (a=11, N=6, Q_v=0.79, best=0.80, ubc=1.31)
├── (a=12, N=2, Q_v=0.80, best=0.80, ubc=1.47)
├── (a=24, N=1, Q_v=0.80, best=0.80, ubc=1.75)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
└── (a=36, N=1, Q_v=0.80, best=0.80, ubc=1.75)
├── (a=24, N=6, Q_v=0.79, best=0.80, ubc=1.31)
├── (a=11, N=2, Q_v=0.80, best=0.80, ubc=1.47)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
└── (a=36, N=2, Q_v=0.80, best=0.80, ubc=1.47)
├── (a=29, N=6, Q_v=0.76, best=0.76, ubc=1.28)
├── (a=11, N=2, Q_v=0.75, best=0.76, ubc=1.42)
├── (a=24, N=1, Q_v=0.76, best=0.76, ubc=1.71)
├── (a=30, N=1, Q_v=0.76, best=0.76, ubc=1.71)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.69)
└── (a=36, N=6, Q_v=0.76, best=0.80, ubc=1.28)
    ├── (a=11, N=2, Q_v=0.77, best=0.80, ubc=1.44)
    ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    └── (a=29, N=2, Q_v=0.76, best=0.76, ubc=1.43)
├── (a=11, N=26, Q_v=0.78, best=0.80, ubc=1.09)
├── (a=6, N=5, Q_v=0.77, best=0.80, ubc=1.34)
├── (a=12, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=12, N=5, Q_v=0.80, best=0.80, ubc=1.37)
├── (a=6, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=24, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=29, N=1, Q_v=0.80, best=0.80, ubc=1.70)
└── (a=36, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=24, N=5, Q_v=0.79, best=0.80, ubc=1.36)
├── (a=6, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=12, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=29, N=5, Q_v=0.77, best=0.80, ubc=1.34)
├── (a=6, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=12, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=24, N=1, Q_v=0.80, best=0.80, ubc=1.70)
└── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=5, Q_v=0.78, best=0.80, ubc=1.35)
    ├── (a=6, N=1, Q_v=0.80, best=0.80, ubc=1.70)
    ├── (a=12, N=1, Q_v=0.80, best=0.80, ubc=1.70)
    ├── (a=24, N=1, Q_v=0.80, best=0.80, ubc=1.70)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=24, N=25, Q_v=0.77, best=0.80, ubc=1.08)
├── (a=6, N=6, Q_v=0.77, best=0.80, ubc=1.28)
├── (a=11, N=2, Q_v=0.77, best=0.80, ubc=1.44)
├── (a=29, N=1, Q_v=0.76, best=0.76, ubc=1.71)
└── (a=36, N=2, Q_v=0.77, best=0.80, ubc=1.44)
├── (a=11, N=6, Q_v=0.78, best=0.80, ubc=1.30)
├── (a=6, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=12, N=2, Q_v=0.80, best=0.80, ubc=1.47)
├── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
└── (a=36, N=1, Q_v=0.80, best=0.80, ubc=1.75)
├── (a=29, N=6, Q_v=0.76, best=0.76, ubc=1.28)
├── (a=6, N=2, Q_v=0.76, best=0.76, ubc=1.43)
├── (a=11, N=1, Q_v=0.76, best=0.76, ubc=1.71)
├── (a=30, N=1, Q_v=0.76, best=0.76, ubc=1.71)
└── (a=36, N=1, Q_v=0.76, best=0.76, ubc=1.71)
└── (a=36, N=6, Q_v=0.77, best=0.80, ubc=1.29)
    ├── (a=6, N=2, Q_v=0.75, best=0.76, ubc=1.42)
    ├── (a=11, N=2, Q_v=0.80, best=0.80, ubc=1.47)
    └── (a=29, N=1, Q_v=0.76, best=0.76, ubc=1.71)
├── (a=29, N=23, Q_v=0.76, best=0.76, ubc=1.08)
├── (a=6, N=4, Q_v=0.75, best=0.76, ubc=1.38)
├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=24, N=1, Q_v=0.76, best=0.76, ubc=1.60)
└── (a=30, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=11, N=4, Q_v=0.75, best=0.76, ubc=1.38)
├── (a=6, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=30, N=1, Q_v=0.76, best=0.76, ubc=1.60)
├── (a=24, N=5, Q_v=0.76, best=0.76, ubc=1.32)
├── (a=6, N=1, Q_v=0.76, best=0.76, ubc=1.66)
├── (a=11, N=1, Q_v=0.76, best=0.76, ubc=1.66)
├── (a=30, N=1, Q_v=0.76, best=0.76, ubc=1.66)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=30, N=5, Q_v=0.76, best=0.76, ubc=1.32)
├── (a=6, N=1, Q_v=0.76, best=0.76, ubc=1.66)
├── (a=11, N=1, Q_v=0.76, best=0.76, ubc=1.66)
├── (a=24, N=1, Q_v=0.76, best=0.76, ubc=1.66)
└── (a=36, N=1, Q_v=0.76, best=0.76, ubc=1.66)
└── (a=36, N=4, Q_v=0.76, best=0.76, ubc=1.39)
    ├── (a=6, N=1, Q_v=0.76, best=0.76, ubc=1.60)
    ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.58)
    └── (a=24, N=1, Q_v=0.76, best=0.76, ubc=1.60)
└── (a=36, N=25, Q_v=0.78, best=0.80, ubc=1.09)
    ├── (a=6, N=6, Q_v=0.78, best=0.80, ubc=1.30)
    ├── (a=11, N=2, Q_v=0.80, best=0.80, ubc=1.47)
    ├── (a=24, N=2, Q_v=0.78, best=0.80, ubc=1.45)
    └── (a=29, N=1, Q_v=0.76, best=0.76, ubc=1.71)
    ├── (a=11, N=6, Q_v=0.80, best=0.80, ubc=1.32)
    ├── (a=6, N=2, Q_v=0.80, best=0.80, ubc=1.47)
    ├── (a=12, N=1, Q_v=0.80, best=0.80, ubc=1.75)
    ├── (a=24, N=1, Q_v=0.80, best=0.80, ubc=1.75)
    └── (a=29, N=1, Q_v=0.80, best=0.80, ubc=1.75)
    ├── (a=24, N=6, Q_v=0.77, best=0.80, ubc=1.29)
    ├── (a=6, N=2, Q_v=0.80, best=0.80, ubc=1.47)
    ├── (a=11, N=2, Q_v=0.77, best=0.80, ubc=1.44)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    └── (a=29, N=6, Q_v=0.76, best=0.76, ubc=1.28)
        ├── (a=6, N=2, Q_v=0.76, best=0.76, ubc=1.43)
        ├── (a=11, N=1, Q_v=0.75, best=0.75, ubc=1.69)
        ├── (a=24, N=1, Q_v=0.76, best=0.76, ubc=1.71)
        └── (a=30, N=1, Q_v=0.76, best=0.76, ubc=1.71)
[16:54:27] INFO     selected action 11 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16, 32, 33,
                    9, 34, 10, 23, 17, 18, 35, 3, 4, 5, 11]
(N=125, Q_v=0.79, best=0.80)
├── (a=6, N=24, Q_v=0.79, best=0.80, ubc=1.10)
├── (a=12, N=6, Q_v=0.80, best=0.80, ubc=1.31)
├── (a=24, N=2, Q_v=0.80, best=0.80, ubc=1.47)
├── (a=29, N=2, Q_v=0.80, best=0.80, ubc=1.47)
└── (a=36, N=1, Q_v=0.80, best=0.80, ubc=1.75)
├── (a=24, N=6, Q_v=0.78, best=0.80, ubc=1.30)
├── (a=12, N=2, Q_v=0.80, best=0.80, ubc=1.47)
├── (a=29, N=2, Q_v=0.77, best=0.80, ubc=1.44)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=29, N=6, Q_v=0.78, best=0.80, ubc=1.30)
├── (a=12, N=2, Q_v=0.80, best=0.80, ubc=1.47)
├── (a=24, N=1, Q_v=0.80, best=0.80, ubc=1.75)
├── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.69)
└── (a=36, N=1, Q_v=0.80, best=0.80, ubc=1.75)
└── (a=36, N=5, Q_v=0.78, best=0.80, ubc=1.34)
    ├── (a=12, N=2, Q_v=0.80, best=0.80, ubc=1.43)
    ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.64)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.64)
├── (a=12, N=27, Q_v=0.80, best=0.80, ubc=1.10)
├── (a=6, N=7, Q_v=0.80, best=0.80, ubc=1.29)
├── (a=24, N=2, Q_v=0.80, best=0.80, ubc=1.50)
├── (a=29, N=2, Q_v=0.80, best=0.80, ubc=1.50)
└── (a=36, N=2, Q_v=0.80, best=0.80, ubc=1.50)
├── (a=24, N=7, Q_v=0.80, best=0.80, ubc=1.29)
├── (a=6, N=2, Q_v=0.80, best=0.80, ubc=1.50)
├── (a=29, N=2, Q_v=0.80, best=0.80, ubc=1.50)
└── (a=36, N=2, Q_v=0.80, best=0.80, ubc=1.50)
├── (a=29, N=6, Q_v=0.80, best=0.80, ubc=1.32)
├── (a=6, N=2, Q_v=0.80, best=0.80, ubc=1.47)
├── (a=24, N=1, Q_v=0.80, best=0.80, ubc=1.75)
├── (a=30, N=1, Q_v=0.80, best=0.80, ubc=1.75)
└── (a=36, N=1, Q_v=0.80, best=0.80, ubc=1.75)
└── (a=36, N=6, Q_v=0.80, best=0.80, ubc=1.32)
    ├── (a=6, N=2, Q_v=0.80, best=0.80, ubc=1.47)
    ├── (a=24, N=2, Q_v=0.80, best=0.80, ubc=1.47)
    └── (a=29, N=1, Q_v=0.80, best=0.80, ubc=1.75)
├── (a=24, N=25, Q_v=0.79, best=0.80, ubc=1.10)
├── (a=6, N=6, Q_v=0.79, best=0.80, ubc=1.31)
├── (a=12, N=2, Q_v=0.80, best=0.80, ubc=1.47)
├── (a=29, N=2, Q_v=0.77, best=0.80, ubc=1.44)
└── (a=36, N=1, Q_v=0.80, best=0.80, ubc=1.75)
├── (a=12, N=6, Q_v=0.80, best=0.80, ubc=1.32)
├── (a=6, N=2, Q_v=0.80, best=0.80, ubc=1.47)
├── (a=29, N=2, Q_v=0.80, best=0.80, ubc=1.47)
└── (a=36, N=1, Q_v=0.80, best=0.80, ubc=1.75)
├── (a=29, N=6, Q_v=0.78, best=0.80, ubc=1.30)
├── (a=6, N=2, Q_v=0.80, best=0.80, ubc=1.47)
├── (a=12, N=1, Q_v=0.80, best=0.80, ubc=1.75)
├── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.69)
└── (a=36, N=1, Q_v=0.75, best=0.75, ubc=1.69)
└── (a=36, N=6, Q_v=0.79, best=0.80, ubc=1.31)
    ├── (a=6, N=2, Q_v=0.80, best=0.80, ubc=1.47)
    ├── (a=12, N=2, Q_v=0.80, best=0.80, ubc=1.47)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
├── (a=29, N=23, Q_v=0.78, best=0.80, ubc=1.10)
├── (a=6, N=4, Q_v=0.79, best=0.80, ubc=1.41)
├── (a=12, N=1, Q_v=0.80, best=0.80, ubc=1.63)
├── (a=24, N=1, Q_v=0.80, best=0.80, ubc=1.63)
└── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=12, N=5, Q_v=0.80, best=0.80, ubc=1.36)
├── (a=6, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=24, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=30, N=1, Q_v=0.80, best=0.80, ubc=1.70)
└── (a=36, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=24, N=5, Q_v=0.79, best=0.80, ubc=1.35)
├── (a=6, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=12, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.64)
└── (a=36, N=1, Q_v=0.80, best=0.80, ubc=1.70)
├── (a=30, N=4, Q_v=0.75, best=0.75, ubc=1.37)
├── (a=6, N=1, Q_v=0.75, best=0.75, ubc=1.58)
├── (a=12, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=36, N=4, Q_v=0.77, best=0.80, ubc=1.40)
    ├── (a=6, N=1, Q_v=0.80, best=0.80, ubc=1.63)
    ├── (a=12, N=1, Q_v=0.80, best=0.80, ubc=1.63)
    └── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.58)
└── (a=36, N=25, Q_v=0.79, best=0.80, ubc=1.10)
    ├── (a=6, N=6, Q_v=0.79, best=0.80, ubc=1.31)
    ├── (a=12, N=2, Q_v=0.80, best=0.80, ubc=1.47)
    ├── (a=24, N=2, Q_v=0.77, best=0.80, ubc=1.44)
    └── (a=29, N=1, Q_v=0.80, best=0.80, ubc=1.75)
    ├── (a=12, N=6, Q_v=0.80, best=0.80, ubc=1.32)
    ├── (a=6, N=2, Q_v=0.80, best=0.80, ubc=1.47)
    ├── (a=24, N=2, Q_v=0.80, best=0.80, ubc=1.47)
    └── (a=29, N=1, Q_v=0.80, best=0.80, ubc=1.75)
    ├── (a=24, N=6, Q_v=0.79, best=0.80, ubc=1.31)
    ├── (a=6, N=2, Q_v=0.80, best=0.80, ubc=1.47)
    ├── (a=12, N=2, Q_v=0.80, best=0.80, ubc=1.47)
    └── (a=29, N=1, Q_v=0.75, best=0.75, ubc=1.69)
    └── (a=29, N=6, Q_v=0.77, best=0.80, ubc=1.29)
        ├── (a=6, N=1, Q_v=0.75, best=0.75, ubc=1.69)
        ├── (a=12, N=2, Q_v=0.80, best=0.80, ubc=1.47)
        ├── (a=24, N=1, Q_v=0.75, best=0.75, ubc=1.69)
        └── (a=30, N=1, Q_v=0.75, best=0.75, ubc=1.69)
           INFO     selected action 12 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16, 32, 33,
                    9, 34, 10, 23, 17, 18, 35, 3, 4, 5, 11, 12]
(N=125, Q_v=0.80, best=0.80)
├── (a=6, N=31, Q_v=0.80, best=0.80, ubc=1.08)
├── (a=24, N=10, Q_v=0.80, best=0.80, ubc=1.21)
├── (a=29, N=5, Q_v=0.80, best=0.80, ubc=1.28)
└── (a=36, N=4, Q_v=0.80, best=0.80, ubc=1.34)
├── (a=29, N=10, Q_v=0.80, best=0.80, ubc=1.21)
├── (a=24, N=3, Q_v=0.80, best=0.80, ubc=1.42)
├── (a=30, N=3, Q_v=0.80, best=0.80, ubc=1.42)
└── (a=36, N=3, Q_v=0.80, best=0.80, ubc=1.42)
└── (a=36, N=10, Q_v=0.80, best=0.80, ubc=1.21)
    ├── (a=24, N=5, Q_v=0.80, best=0.80, ubc=1.28)
    └── (a=29, N=4, Q_v=0.80, best=0.80, ubc=1.34)
├── (a=24, N=31, Q_v=0.80, best=0.80, ubc=1.08)
├── (a=6, N=10, Q_v=0.80, best=0.80, ubc=1.21)
├── (a=29, N=5, Q_v=0.80, best=0.80, ubc=1.28)
└── (a=36, N=4, Q_v=0.80, best=0.80, ubc=1.34)
├── (a=29, N=10, Q_v=0.80, best=0.80, ubc=1.21)
├── (a=6, N=3, Q_v=0.80, best=0.80, ubc=1.42)
├── (a=30, N=3, Q_v=0.80, best=0.80, ubc=1.42)
└── (a=36, N=3, Q_v=0.80, best=0.80, ubc=1.42)
└── (a=36, N=10, Q_v=0.80, best=0.80, ubc=1.21)
    ├── (a=6, N=5, Q_v=0.80, best=0.80, ubc=1.28)
    └── (a=29, N=4, Q_v=0.80, best=0.80, ubc=1.34)
├── (a=29, N=31, Q_v=0.80, best=0.80, ubc=1.08)
├── (a=6, N=8, Q_v=0.80, best=0.80, ubc=1.26)
├── (a=24, N=3, Q_v=0.80, best=0.80, ubc=1.39)
├── (a=30, N=2, Q_v=0.80, best=0.80, ubc=1.52)
└── (a=36, N=2, Q_v=0.80, best=0.80, ubc=1.52)
├── (a=24, N=8, Q_v=0.80, best=0.80, ubc=1.26)
├── (a=6, N=3, Q_v=0.80, best=0.80, ubc=1.39)
├── (a=30, N=2, Q_v=0.80, best=0.80, ubc=1.52)
└── (a=36, N=2, Q_v=0.80, best=0.80, ubc=1.52)
├── (a=30, N=7, Q_v=0.80, best=0.80, ubc=1.30)
├── (a=6, N=2, Q_v=0.80, best=0.80, ubc=1.50)
├── (a=24, N=2, Q_v=0.80, best=0.80, ubc=1.50)
└── (a=36, N=2, Q_v=0.80, best=0.80, ubc=1.50)
└── (a=36, N=7, Q_v=0.80, best=0.80, ubc=1.30)
    ├── (a=6, N=2, Q_v=0.80, best=0.80, ubc=1.50)
    ├── (a=24, N=2, Q_v=0.80, best=0.80, ubc=1.50)
    └── (a=30, N=2, Q_v=0.80, best=0.80, ubc=1.50)
└── (a=36, N=31, Q_v=0.80, best=0.80, ubc=1.08)
    ├── (a=6, N=10, Q_v=0.80, best=0.80, ubc=1.21)
    ├── (a=24, N=5, Q_v=0.80, best=0.80, ubc=1.28)
    └── (a=29, N=4, Q_v=0.80, best=0.80, ubc=1.34)
    ├── (a=24, N=10, Q_v=0.80, best=0.80, ubc=1.21)
    ├── (a=6, N=5, Q_v=0.80, best=0.80, ubc=1.28)
    └── (a=29, N=4, Q_v=0.80, best=0.80, ubc=1.34)
    └── (a=29, N=10, Q_v=0.80, best=0.80, ubc=1.21)
        ├── (a=6, N=3, Q_v=0.80, best=0.80, ubc=1.42)
        ├── (a=24, N=3, Q_v=0.80, best=0.80, ubc=1.42)
        └── (a=30, N=3, Q_v=0.80, best=0.80, ubc=1.42)
[16:54:28] INFO     selected action 6 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16, 32, 33,
                    9, 34, 10, 23, 17, 18, 35, 3, 4, 5, 11, 12, 6]
(N=125, Q_v=0.80, best=0.80)
├── (a=24, N=42, Q_v=0.80, best=0.80, ubc=1.04)
├── (a=29, N=21, Q_v=0.80, best=0.80, ubc=1.10)
├── (a=30, N=10, Q_v=0.80, best=0.80, ubc=1.19)
└── (a=36, N=10, Q_v=0.80, best=0.80, ubc=1.19)
└── (a=36, N=20, Q_v=0.80, best=0.80, ubc=1.11)
    └── (a=29, N=19, Q_v=0.80, best=0.80, ubc=1.08)
├── (a=29, N=41, Q_v=0.80, best=0.80, ubc=1.04)
├── (a=24, N=14, Q_v=0.80, best=0.80, ubc=1.16)
├── (a=30, N=7, Q_v=0.80, best=0.80, ubc=1.23)
└── (a=36, N=6, Q_v=0.80, best=0.80, ubc=1.27)
├── (a=30, N=13, Q_v=0.80, best=0.80, ubc=1.18)
├── (a=24, N=6, Q_v=0.80, best=0.80, ubc=1.26)
└── (a=36, N=6, Q_v=0.80, best=0.80, ubc=1.26)
└── (a=36, N=13, Q_v=0.80, best=0.80, ubc=1.18)
    ├── (a=24, N=6, Q_v=0.80, best=0.80, ubc=1.26)
    └── (a=30, N=6, Q_v=0.80, best=0.80, ubc=1.26)
└── (a=36, N=41, Q_v=0.80, best=0.80, ubc=1.04)
    ├── (a=24, N=20, Q_v=0.80, best=0.80, ubc=1.10)
    └── (a=29, N=19, Q_v=0.80, best=0.80, ubc=1.08)
    └── (a=29, N=20, Q_v=0.80, best=0.80, ubc=1.10)
        ├── (a=24, N=10, Q_v=0.80, best=0.80, ubc=1.19)
        └── (a=30, N=9, Q_v=0.80, best=0.80, ubc=1.21)
           INFO     selected action 24 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16, 32, 33,
                    9, 34, 10, 23, 17, 18, 35, 3, 4, 5, 11, 12, 6, 24]
(N=125, Q_v=0.80, best=0.80)
├── (a=29, N=62, Q_v=0.80, best=0.80, ubc=1.00)
├── (a=30, N=31, Q_v=0.80, best=0.80, ubc=1.06)
└── (a=36, N=30, Q_v=0.80, best=0.80, ubc=1.04)
└── (a=36, N=30, Q_v=0.80, best=0.80, ubc=1.06)
    └── (a=30, N=29, Q_v=0.80, best=0.80, ubc=1.04)
└── (a=36, N=62, Q_v=0.80, best=0.80, ubc=1.00)
    └── (a=29, N=61, Q_v=0.80, best=0.80, ubc=0.98)
        └── (a=30, N=60, Q_v=0.80, best=0.80, ubc=0.99)
           INFO     selected action 29 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16, 32, 33,
                    9, 34, 10, 23, 17, 18, 35, 3, 4, 5, 11, 12, 6, 24, 29]
(N=125, Q_v=0.80, best=0.80)
├── (a=30, N=62, Q_v=0.80, best=0.80, ubc=1.00)
└── (a=36, N=61, Q_v=0.80, best=0.80, ubc=0.98)
└── (a=36, N=62, Q_v=0.80, best=0.80, ubc=1.00)
    └── (a=30, N=61, Q_v=0.80, best=0.80, ubc=0.98)
           INFO     selected action 30 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16, 32, 33,
                    9, 34, 10, 23, 17, 18, 35, 3, 4, 5, 11, 12, 6, 24, 29, 30]
(N=125, Q_v=0.80, best=0.80)
└── (a=36, N=124, Q_v=0.80, best=0.80, ubc=0.94)
           INFO     selected action 36 after 125 simulations.
           INFO     current action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16, 32, 33,
                    9, 34, 10, 23, 17, 18, 35, 3, 4, 5, 11, 12, 6, 24, 29, 30, 36]
           INFO     Final action list: [1, 19, 20, 25, 21, 26, 27, 7, 28, 2, 13, 22, 14, 31, 15, 8, 16, 32, 33, 9,
                    34, 10, 23, 17, 18, 35, 3, 4, 5, 11, 12, 6, 24, 29, 30, 36]
         ╔═══════════════════════════════════════════════════════╗
Job 0    ║║ Machine 0   
Job 1    ║           ║ Machine 1   
Job 2    ║             ║ Machine 2   
Job 3    ║║ Machine 3   
Job 4    ║ ║ Machine 4   
Job 5    ║     ║ Machine 5   
         ╚╦════╤════╤════╤════╤════╦════╤════╤════╤════╤════╦════╝
          0.0                      30.5                     60.9
makespan: 66