def _compute_gt_value(self, vertex, target_vertices):
    """Computes groundtruth value of all the actions at the vertex.

    The value of each action is the difference each action makes in the length
    of the shortest path to the goal. If an action takes the agent one step