learnEpisode(episode,learner);
}
private void explore(RState state, Map<Agent,Episode> episodes)
{
RState current_state = state;
while(!current_state.isTerminal())
{
Map<Agent,RAction> actions = new HashMap<Agent,RAction>();
for(Agent role : episodes.keySet())
{
RAction action = decideExplore(current_state, role.legalActions(current_state));
actions.put(role,action);
}
RState start = current_state;
current_state = current_state.next(actions.values());
RState result = current_state;
if(result.isTerminal())
{
result = null;
}
for(Agent role : episodes.keySet())