update
This commit is contained in:
@@ -439,7 +439,7 @@ function conversation(a::T, userinput::Dict) where {T<:agent}
|
|||||||
)
|
)
|
||||||
)
|
)
|
||||||
bestplan = runMCTS(a, initialState, decisionMaker, progressValueEstimator, reflector,
|
bestplan = runMCTS(a, initialState, decisionMaker, progressValueEstimator, reflector,
|
||||||
isterminal, 2, 3, 100, 1.0)
|
isterminal, 2, 3, 2, 1.0)
|
||||||
error("---> bestplan")
|
error("---> bestplan")
|
||||||
|
|
||||||
# actor loop(bestplan)
|
# actor loop(bestplan)
|
||||||
|
|||||||
20
src/mcts.jl
20
src/mcts.jl
@@ -163,7 +163,7 @@ julia>
|
|||||||
|
|
||||||
# TODO
|
# TODO
|
||||||
- [] update docstring
|
- [] update docstring
|
||||||
- [WORKING] implement the function
|
- [x] implement the function
|
||||||
- [] check for the terminal state (node.reward != 0), break if it is terminal state
|
- [] check for the terminal state (node.reward != 0), break if it is terminal state
|
||||||
|
|
||||||
# Signature
|
# Signature
|
||||||
@@ -185,24 +185,6 @@ function simulate(a, node::MCTSNode, decisionMaker::Function, progressValueEstim
|
|||||||
|
|
||||||
return simTrajectoryReward
|
return simTrajectoryReward
|
||||||
end
|
end
|
||||||
# function simulate(a, node::MCTSNode, decisionMaker::Function, progressValueEstimator::Function,
|
|
||||||
# isterminal::Function, max_depth::Int; n=3)::Number
|
|
||||||
|
|
||||||
# simTrajectoryReward = 0.0
|
|
||||||
|
|
||||||
# for _ in 1:max_depth
|
|
||||||
# node = selectChildNode(node)
|
|
||||||
# simTrajectoryReward += node.reward
|
|
||||||
|
|
||||||
# if node.isterminal
|
|
||||||
# break
|
|
||||||
# else
|
|
||||||
# expand(a, node, decisionMaker, progressValueEstimator, isterminal, n=n)
|
|
||||||
# end
|
|
||||||
# end
|
|
||||||
|
|
||||||
# return simTrajectoryReward
|
|
||||||
# end
|
|
||||||
|
|
||||||
"""
|
"""
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user