First, initial_state=self.envoirment.sample_initial_state()  # this returns both the initial state and the solution
Then, root_node = TreeNode(state=initial_state)  # so root_node contains the solution too
Third, in path_to_string the solution leaks into the prompt, because {node.state} is interpolated for every node on the path (including the root):
f"{node.parent.index if node.parent else -1}{node.index}{node.state}{value_to_rating_token(node.value)}"
for node in path[::-1]
First, initial_state=self.envoirment.sample_initial_state()  # this returns both the initial state and the solution. Then, root_node = TreeNode(state=initial_state)  # so root_node contains the solution too. Third, in path_to_string the solution leaks into the prompt, because {node.state} is interpolated for every node on the path (including the root): f"{node.parent.index if node.parent else -1}{node.index}{node.state}{value_to_rating_token(node.value)}"
for node in path[::-1]