update

2025-03-14 12:31:41 +07:00
parent 097484675c
commit 7e160f2031
2 changed files with 36 additions and 113 deletions
--- a/src/interface.jl
+++ b/src/interface.jl
@@ -66,7 +66,8 @@ function runMCTS(
  maxiterations::Integer=10,
  explorationweight::Number=1.0,
  earlystop::Union{Function,Nothing}=nothing,
-  saveSimulatedNode::Bool=false) where {T<:Any}
+  saveSimulatedNode::Bool=false,
+  multithread=false) where {T<:Any}
 # )::NamedTuple{(:bestNextState, :bestFinalState),Tuple{T,T}} where {T<:Any}

  root = MCTSNode("root", initialstate, 0, 0, 0, 0, false, nothing, Dict{String,MCTSNode}(),
@@ -85,26 +86,26 @@ function runMCTS(
      # do nothing then go directly to backpropagation. It means the end of this iteration
      backpropagate(node, node.reward)
    else
-      println(111)
      _ = expand(node, transition, transitionargs;
-                horizontalSample=horizontalSampleExpansionPhase)
-
-      println(666)
-      
-      @sync for (leafNodeKey, leafNode) in node.children
-        @spawn simulateThenBackpropagate(leafNode, transition, transitionargs;
-                maxSimulationDepth=maxSimulationDepth, 
-                horizontalSampleSimulationPhase=horizontalSampleSimulationPhase,
-                saveSimulatedNode=saveSimulatedNode)
+                horizontalSample=horizontalSampleExpansionPhase,
+                multithread=multithread)
+      if multithread
+        @sync for (leafNodeKey, leafNode) in node.children
+          @spawn simulateThenBackpropagate(leafNode, transition, transitionargs;
+                  maxSimulationDepth=maxSimulationDepth, 
+                  horizontalSampleSimulationPhase=horizontalSampleSimulationPhase,
+                  saveSimulatedNode=saveSimulatedNode,
+                  multithread=multithread)
+        end
+      else
+        for (leafNodeKey, leafNode) in node.children
+          simulateThenBackpropagate(leafNode, transition, transitionargs;
+                  maxSimulationDepth=maxSimulationDepth, 
+                  horizontalSampleSimulationPhase=horizontalSampleSimulationPhase,
+                  saveSimulatedNode=saveSimulatedNode,
+                  multithread=multithread)
+        end
      end
-
-      #CHANGE for testing
-      # for (leafNodeKey, leafNode) in node.children
-      #   simulateThenBackpropagate(leafNode, transition, transitionargs;
-      #           maxSimulationDepth=maxSimulationDepth, 
-      #           horizontalSampleSimulationPhase=horizontalSampleSimulationPhase,
-      #           saveSimulatedNode=saveSimulatedNode)
-      # end
    end

    # stop if the early stop condition is met
@@ -123,10 +124,12 @@ end

 function simulateThenBackpropagate(node::MCTSNode, transition::Function, transitionargs::NamedTuple; 
                maxSimulationDepth::Integer=3, horizontalSampleSimulationPhase::Integer=3,
-                saveSimulatedNode::Bool=false)
+                saveSimulatedNode::Bool=false,
+                multithread=false)
  simTrajectoryReward, terminalstate = simulate(node, transition, transitionargs;
                                                maxSimulationDepth=maxSimulationDepth, 
-                                                horizontalSample=horizontalSampleSimulationPhase)
+                                                horizontalSample=horizontalSampleSimulationPhase,
+                                                multithread=multithread)
  backpropagate(node, simTrajectoryReward)

  # check if the user wants to keep the simulated node
@@ -137,58 +140,6 @@ end



-# function runMCTS(
-#   initialstate::T,
-#   transition::Function,
-#   transitionargs::NamedTuple,
-#   ;
-#   totalsample::Integer=3,
-#   maxdepth::Integer=3,
-#   maxiterations::Integer=10,
-#   explorationweight::Number=1.0,
-# )::NamedTuple{(:bestNextState, :bestFinalState),Tuple{T,T}} where {T<:Any}
-
-#   root = MCTSNode("root", initialstate, 0, 0, 0, 0, false, nothing, Dict{String,MCTSNode}())
-
-#   for nth in 1:maxiterations
-#     node = root
-#     node.visits += 1
-
-#     while !isleaf(node)
-#       node = UCTselect(node, explorationweight)
-#     end
-#     if node.isterminal
-#       # MCTS arrive at the leaf node that is also a terminal state,
-#       # do nothing then go directly to backpropagation. It means the end of this iteration
-#       backpropagate(leafNode, node.reward)
-#     else
-#       expand(node, transition, transitionargs;
-#         totalsample=totalsample)
-#       leafNode = selectChildNode(node)
-#       simTrajectoryReward, terminalstate = simulate(leafNode, transition, transitionargs;
-#         maxdepth=maxdepth, totalsample=totalsample)
-#       # if terminalstate !== nothing  #XXX not sure why I need this 
-#       #   terminalstate[:totalTrajectoryReward] = simTrajectoryReward
-#       # end
-
-#       #[] write best state to file if it has higher simTrajectoryReward. Use to improve evaluation
-#       # open("trajectory.json", "w") do io
-#       #   JSON3.pretty(io, terminalstate)
-#       # end
-
-#       backpropagate(leafNode, simTrajectoryReward)
-#     end
-#   end
-
-#   bestNextState = selectBestNextNode(root)
-#   besttrajectory = selectBestTrajectoryNode(root)
-
-#   return (bestNextState=bestNextState.state, bestFinalState=besttrajectory.state)
-# end
-
-
-
-