diff --git a/src/mcts.jl b/src/mcts.jl index c4d8d47..3648ce9 100644 --- a/src/mcts.jl +++ b/src/mcts.jl @@ -126,7 +126,7 @@ julia> # TODO [] update docstring [] try loop should limit to 3 times. if not succeed, skip - + [] newNodeKey ∉ keys(node.children). A new state may have a semantic vector close enough to that of an existing child state, in which case they can be assumed to be the same state semantically. # Signature """ function expand(a::T1, node::MCTSNode, decisionMaker::Function, @@ -190,7 +190,7 @@ function simulate(a, node::MCTSNode, decisionMaker::Function, progressValueEstim node = selectChildNode(node) end end - + #BUG the newly expanded state has a reward, but it is not included because it is over the maximum depth by 1 state return simTrajectoryReward end