update

2024-08-22 10:59:26 +07:00
parent c33d69b00c
commit 856308555f
1 changed files with 55 additions and 58 deletions
--- a/src/mcts.jl
+++ b/src/mcts.jl
@@ -196,51 +196,22 @@ end
 # Return
  - None
 # TODO
  - [WORKING] implement multithreads
 # Signature
 """
 function expand(node::MCTSNode, transition::Function, transitionargs::NamedTuple; 
          totalsample::Integer=3)
  # not use Any[] because I want to preserve result order
  results = Vector{Any}(undef, totalsample) 
  @sync for i in 1:totalsample
      @spawn begin
        result = transition(deepcopy(node.state), deepcopy(transitionargs))
        results[i] = result
      end
  end
  for result in results
    newNodeKey::AbstractString = result[:newNodeKey]
    newstate::AbstractDict = result[:newstate]
    progressvalue::Integer = result[:progressvalue]
    """
    [] newNodeKey ∉ keys(node.children). 
          New state may have semantic vector close enought to 
        one of existing child state. Which can be assume that they are the same state 
        semantically-wise i.e. De javu. This could be used to recall lessons for this 
        similar situation to improve decisionMaker and evaluator. 
    """
    if newNodeKey ∉ keys(node.children)
      node.children[newNodeKey] = 
        MCTSNode(newNodeKey, newstate, 0, progressvalue, 0, newstate[:reward], 
          newstate[:isterminal], node, Dict{String, MCTSNode}())
    end
  end
 end
 # function expand(node::MCTSNode, transition::Function, transitionargs::NamedTuple; 
 #           totalsample::Integer=3)
-#   nthSample = 0
+#   # not use Any[] because I want to preserve result order
-#   while true
+#   results = Vector{Any}(undef, totalsample) 
-#     nthSample += 1
+
-#     if nthSample <= totalsample
+#   @sync for i in 1:totalsample
-#       result = transition(node.state, transitionargs)
+#       @spawn begin
 #         result = transition(deepcopy(node.state), deepcopy(transitionargs))
 #         results[i] = result
 #       end
 #   end
 #   for result in results
 #     newNodeKey::AbstractString = result[:newNodeKey]
 #     newstate::AbstractDict = result[:newstate]
 #     progressvalue::Integer = result[:progressvalue]
@@ -257,11 +228,37 @@ end
 #         MCTSNode(newNodeKey, newstate, 0, progressvalue, 0, newstate[:reward], 
 #           newstate[:isterminal], node, Dict{String, MCTSNode}())
 #     end
 #     else
 #       break
 #     end
 #   end
 # end
 function expand(node::MCTSNode,transition::Function, transitionargs::NamedTuple; 
          totalsample::Integer=3)
  nthSample = 0
  while true
    nthSample += 1
    if nthSample <= totalsample
      result = transition(node.state, transitionargs)
      newNodeKey::AbstractString = result[:newNodeKey]
      newstate::AbstractDict = result[:newstate]
      progressvalue::Integer = result[:progressvalue]
      """
      [] newNodeKey ∉ keys(node.children). 
            New state may have semantic vector close enought to 
          one of existing child state. Which can be assume that they are the same state 
          semantically-wise i.e. De javu. This could be used to recall lessons for this 
          similar situation to improve decisionMaker and evaluator. 
      """
      if newNodeKey ∉ keys(node.children)
        node.children[newNodeKey] = 
          MCTSNode(newNodeKey, newstate, 0, progressvalue, 0, newstate[:reward], 
            newstate[:isterminal], node, Dict{String, MCTSNode}())
      end
    else
      break
    end
  end
 end
 """ Simulate interactions between agent and environment