utils.py

from collections import deque
import csv
import random
import config
from pprint import pprint

from matplotlib.artist import get

import config

def update_prey_belief_state(prey_belief_state, agent_curr_pos, agent_prev_pos, arena, found_prey, surveyed_node, checkpoint):
    """
    Updates prey belief state

    Parameters:
    prey_belief_state (dict): Stores prey's belief state
    agent_curr_pos (int): Stores Agent's current position
    agent_prev_pos (int): Stores Agent's previous position
    arena (dict): Contains the graph
    found_prey (bool): Contains prey is found status
    surveyed_node (int): Contains the node that was surveyed by the agent
    checkpoint (string): Describes which part of the function to run


    Returns:
    new_prey_belief_state (dict): The updated belief state
    """

    # Initializing the new prey belief states
    new_prey_belief_state = dict.fromkeys([i for i in range(50)], 999.0)
    new_prey_belief_state[agent_curr_pos] = 0.0

    # After surveying the node
    if checkpoint == 'after_survey':
        if found_prey:
            for i in range(50):
                new_prey_belief_state[i] = 0.0
            new_prey_belief_state[surveyed_node] = 1.0
            return new_prey_belief_state
        else:
            new_prey_belief_state[surveyed_node] = 0.0
            for i in range(50):
                if i not in (agent_curr_pos, surveyed_node):
                    new_prey_belief_state[i] = prey_belief_state[i] / ( sum(prey_belief_state.values()) - prey_belief_state[surveyed_node] - prey_belief_state[agent_curr_pos])

            return new_prey_belief_state
    
    elif checkpoint == 'after_agent_moves':
        if found_prey:
            return prey_belief_state
        else:
            # print(f'agent_curr_pos in func: {agent_curr_pos}')
            new_prey_belief_state[agent_prev_pos] = 0.0
            new_prey_belief_state[agent_curr_pos] = 0.0
            new_prey_belief_state[surveyed_node] = 0.0
            
            for i in range(50):
                if i not in (agent_curr_pos, agent_prev_pos, surveyed_node):
                    new_prey_belief_state[i] = prey_belief_state[i] / ( sum(prey_belief_state.values()) - prey_belief_state[agent_curr_pos] - prey_belief_state[surveyed_node])

            return new_prey_belief_state

    elif checkpoint == 'after_prey_moves':
        new_prey_belief_state[agent_curr_pos] = 0.0

        temp_prey_belief_state = dict.fromkeys([i for i in range(50)], 999.0)
        temp_prey_belief_state[agent_curr_pos] = 0.0


        # prey has moved
        for i in range(50):
            temp_sum = 0.0
            for j in arena[i]:
                temp_sum += prey_belief_state[j] / ( get_degree(arena, j) + 1 )
            temp_sum += prey_belief_state[i] / ( get_degree(arena, i) + 1 )
            temp_prey_belief_state[i] = temp_sum

        # pretend to survey node for agent curr pos
        new_prey_belief_state[agent_curr_pos] = 0.0
        for i in range(50):
            if i != agent_curr_pos:
                new_prey_belief_state[i] = temp_prey_belief_state[i] / ( sum(temp_prey_belief_state.values()) - temp_prey_belief_state[agent_curr_pos])
        return new_prey_belief_state

def update_predator_belief_state(predator_belief_state, agent_curr_pos, agent_prev_pos, arena, found_predator, surveyed_node, checkpoint):
    """
    Updates predator belief state

    Parameters:
    predator_belief_state (dict): Stores predator's belief state
    agent_curr_pos (int): Stores Agent's current position
    agent_prev_pos (int): Stores Agent's previous position
    arena (dict): Contains the graph
    found_predator (bool): Contains predator is found status
    surveyed_node (int): Contains the node that was surveyed by the agent
    checkpoint (string): Describes which part of the function to run


    Returns:
    new_prey_belief_state (dict): The updated belief state
    """
    
    # Initializing the new predator belief states
    new_predator_belief_state = dict.fromkeys([i for i in range(50)], 999.0)
    new_predator_belief_state[agent_curr_pos] = 0.0

    
    if checkpoint == 'after_survey':
        if found_predator:
            for i in range(50):
                new_predator_belief_state[i] = 0.0
            new_predator_belief_state[surveyed_node] = 1.0
        else:
            new_predator_belief_state[surveyed_node] = 0.0
            for i in range(50):
                if i not in (agent_curr_pos, surveyed_node):
                    try:
                        new_predator_belief_state[i] = predator_belief_state[i] / ( sum(predator_belief_state.values()) - predator_belief_state[surveyed_node])
                    except:
                        print('after_survey')
                        pprint(f'predator_belief_state: {predator_belief_state}')
                        print(f'predator_belief_state[surveyed_node]: {predator_belief_state[surveyed_node]}')
                        print(f'predator_belief_state[i]: {predator_belief_state[i]}')
                        exit(0)

        return new_predator_belief_state


    elif checkpoint == 'after_agent_moves':
        if found_predator:

            return predator_belief_state
            
        else:
            # print(f'agent_curr_pos in func: {agent_curr_pos}')
            new_predator_belief_state[agent_prev_pos] = 0.0
            new_predator_belief_state[agent_curr_pos] = 0.0
            new_predator_belief_state[surveyed_node] = 0.0
            
            for i in range(50):
                if i not in (agent_curr_pos, agent_prev_pos, surveyed_node):
                    try:
                        new_predator_belief_state[i] = predator_belief_state[i] / ( sum(predator_belief_state.values()) - predator_belief_state[agent_curr_pos] - predator_belief_state[surveyed_node])
                    except:
                        print('after_agent_moves')
                        pprint(f'predator_belief_state: {predator_belief_state}')
                        print(f'predator_belief_state[surveyed_node]: {predator_belief_state[surveyed_node]}')
                        print(f'predator_belief_state[agent_curr_pos]: {predator_belief_state[agent_curr_pos]}')
                        print(f'predator_belief_state[i]: {predator_belief_state[i]}')
                        exit(0)


            return new_predator_belief_state

    elif checkpoint == 'after_predator_moves':
        new_predator_belief_state[agent_curr_pos] = 0.0

        temp_predator_belief_state = dict.fromkeys([i for i in range(50)], 999.0)
        temp_predator_belief_state[agent_curr_pos] = 0.0


        # predator has moved

        for i in range(50):
            temp_sum = 0.0
            for j in arena[i]:
                neighbour_path_length = {}

                # Finds the length for the shortest path for each of neighbours
                for k in arena[j]:
                    path, path_length = get_shortest_path(k, agent_curr_pos, arena)
                    neighbour_path_length[k] = path_length

                # Finds all the neighbours that have minimum path length
                min_length = min(neighbour_path_length.values())
                neighbours_with_min_path_length = [key for key, value in neighbour_path_length.items() if
                                                value == min_length]
                shortest_length_nodes = len(neighbours_with_min_path_length)

                if i in neighbours_with_min_path_length:
                    temp_sum += predator_belief_state[j] * (( 0.4 / get_degree(arena, j) ) + ( 0.6 / shortest_length_nodes))
                else:
                    temp_sum += predator_belief_state[j] * ( 0.4/ get_degree(arena, j))

            temp_predator_belief_state[i] = temp_sum


        # pretend to survey node for agent curr pos
        new_predator_belief_state[agent_curr_pos] = 0.0
        for i in range(50):
            if i != agent_curr_pos:
                new_predator_belief_state[i] = temp_predator_belief_state[i] / ( sum(temp_predator_belief_state.values()) - temp_predator_belief_state[agent_curr_pos])

        return new_predator_belief_state

def get_degree(arena, node):
    """
    Gets the degree of the node

    Parameters:
    arena (dict): Arena for the game
    node (int): Node to get the degree for

    Returns:
    len(arena[node]) (int): Gets the degree of the node
    """
    return len(arena[node])

def survey_prey(agent, prey):
    """
    Surveys the node with the highest probability of the prey being there and updates the belief state accordingly

    Parameters:
    agent (object): Agent object
    prey (object): Prey object

    Returns:
    found_prey (Bool): Returns True if found prey else False
    node_to_survey (int): Returns the node surveyed
    """

    belief_state = agent.prey_belief_state

    # Selects all positions where the probability is max
    max_prob_of_prey = [pos for pos, prob in belief_state.items() if prob ==  max(belief_state.values())]

    node_to_survey = random.choice(max_prob_of_prey)


    if node_to_survey == prey.curr_pos:
        return True, node_to_survey
    else:
        return False, node_to_survey

def survey_predator(agent, predator):
    """
    Surveys the node with the highest probability of the predator being there and updates the belief state accordingly

    Parameters:
    agent (object): Agent object
    prey (object): Predator object

    Returns:
    found_predator (Bool): Returns True if found predator else False
    node_to_survey (int): Returns the node surveyed
    """

    belief_state = agent.predator_belief_state

    # Selects all positions where the probability is max
    max_prob_of_predator = [pos for pos, prob in belief_state.items() if prob == max(belief_state.values())]

    node_to_survey = random.choice(max_prob_of_predator)

    if node_to_survey == predator.curr_pos:
        return True, node_to_survey
    else:
        return False, node_to_survey


def store_data(data):
    """
    Stores the collected data toa a CSV file

    data: Data collected from all the agents
    """
    file_path_to_write = config.FILE_PATH + config.FILE_NAME
    # print(file_path_to_write)
    f = open(file_path_to_write, 'w')
    writer = csv.writer(f)
    writer.writerows(data)
    print("Data Collection Complete")
    f.close()


def FindPath(parent, start_pos, end_pos):
    """
    Backtracks and finds the path in the arena to the end position from the start position

    Parameters:
    parent (dict): Parent dictionary of each node
    start_pos (int): Start position of the path
    end_pos (int): End position of the path

    Returns:
    path (deque): Path from start to end position
    """
    path = deque()
    path.append(end_pos)
    while path[-1] != start_pos:
         path.append(parent[path[-1]])
    path.reverse()
    path.popleft()
    return path

def get_shortest_path(start_pos, end_pos, arena):
    """
    Uses Breath First Search to find the shortest path between the start and end position
    'neighbours' is used as the fringe (queue) to add surrounding nodes in the arena

    Parameters:
    start_pos (int): Start position of the path
    end_pos (int): End position of the path
    arena (dict): The arena used currently

    Returns:
    path (deque): Shortest path evaluated
    (len(path) - 1) (int): Length of the path
    """
    
    parent = {}
    visited = [False] * 50

    visited[start_pos] = True
    neighbours = deque()

    curr_pos = start_pos
    while curr_pos != end_pos:
        for surrounding_node in arena[curr_pos]:
            if not visited[surrounding_node] and surrounding_node not in neighbours:
                neighbours.append(surrounding_node)
                parent.update({surrounding_node: curr_pos})
                visited[surrounding_node] = True

        curr_pos = neighbours.popleft()

    path = FindPath(parent, start_pos, end_pos)

    return path, (len(path) - 1)

def return_max_prey_belief(belief_state, arena):
    """
    Returns a randomly chosen node for max belief of the prey

    Parameters:
    belief_state (dict): The belief state of the prey
    arena (dict): Arena for the game

    Returns:
    random.choice(max_belief_nodes) (int): Random value from max beliefs
    """

    max_belief = max(belief_state.values())
    max_belief_nodes = [key for key, value in belief_state.items() if value == max_belief ]

    return random.choice(max_belief_nodes)

def return_max_predator_belief(belief_state, arena):
    """
    Returns a randomly chosen node for max belief of the predator

    Parameters:
    belief_state (dict): The belief state of the predator
    arena (dict): Arena for the game

    Returns:
    random.choice(max_belief_nodes) (int): Random value from max beliefs
    """

    max_belief = max(belief_state.values())

    max_belief_nodes = [key for key, value in belief_state.items() if value == max_belief ]

    return random.choice(max_belief_nodes)


def best_node_v2(arena, curr_pos, prey_loc, predator_loc):
    """
    Returns a node closer to the prey while the agent is 'not scared'
    Always moves away from predator if the agent is 'scared'
    Agent is scared if it is within a specific distance from the prey

    Parameters:
    arena (dictionary): Adjacency list representing the graph
    prey_loc (int): Location of prey
    predator_loc (int): Location of Predator

    Returns:
    curr_pos (int): Position to move to

    """
    path_to_predator, distance_to_predator = get_shortest_path(curr_pos, predator_loc, arena)

    path_to_prey, distance_to_prey = get_shortest_path(curr_pos, prey_loc, arena)

    if distance_to_predator <= config.SCARED_THRESHOLD:
        neighbour_predator_path_length ={}

        for i in arena[curr_pos]:
            neghbour_path, neighbour_predator_path_length[i] = get_shortest_path(i, predator_loc, arena)

        curr_pos = max(neighbour_predator_path_length, key=neighbour_predator_path_length.get)

        return curr_pos

    else:
        neighbour_prey_path_length = {}

        for i in arena[curr_pos]:
            neghbour_path, neighbour_prey_path_length[i] = get_shortest_path(i, prey_loc, arena)

        curr_pos = min(neighbour_prey_path_length, key=neighbour_prey_path_length.get)

        return curr_pos


def best_node(arena, curr_pos, prey_loc, predator_loc):
    """
    Returns the node that the agent should move to according to the following rules:
    1. Neighbors that are closer to the Prey and farther from the Predator.
    2. Neighbors that are closer to the Prey and not closer to the Predator.
    3. Neighbors that are not farther from the Prey and farther from the Predator.
    4. Neighbors that are not farther from the Prey and not closer to the Predator.
    5. Neighbors that are farther from the Predator.
    6. Neighbors that are not closer to the Predator.
    7. Sit still and pray.

    Parameters:
    arena (dictionary): Adjacency list representing the graph
    prey_loc (int): Location of prey
    predator_loc (int): Location of Predator

    Returns:
    curr_pos (int): Position to move to
    """

    # Neighbours of the current node are extracted here
    neighbours = arena[curr_pos].copy()

    # Distances from prey and predator will be stored in the following dicts
    predator_dist = {}
    prey_dist = {}

    # Storing the distances of the agent location to the prey and predator
    path, curr_pos_prey_dist = get_shortest_path(curr_pos, prey_loc, arena)
    path, curr_pos_predator_dist = get_shortest_path(curr_pos, predator_loc, arena)

    # Find distance from all neighbours to the prey and the predator
    for i in neighbours:
        path, prey_dist[i] = get_shortest_path(i, prey_loc, arena)
        path, predator_dist[i] = get_shortest_path(i, predator_loc, arena)

    # Defining subsets of nodes
    closer_to_prey = {}
    not_farther_from_prey = {}
    farther_from_predator = {}
    not_closer_to_predator = {}

    # Adding nodes to the subsets
    for k in prey_dist.keys():
        if prey_dist[k] < curr_pos_prey_dist:
            closer_to_prey[k] = prey_dist[k]

    for k in prey_dist.keys():
        if prey_dist[k] == curr_pos_prey_dist:
            not_farther_from_prey[k] = prey_dist[k]

    for k in predator_dist.keys():
        if predator_dist[k] >= curr_pos_predator_dist:
            farther_from_predator[k] = predator_dist[k]

    for k in predator_dist.keys():
        if predator_dist[k] == curr_pos_predator_dist:
            not_closer_to_predator[k] = predator_dist[k]

    # Flag helps to avoid going through multiple ifs if one if condition is satisfied
    flag = 0

    min_length = min(closer_to_prey.values())
    focused_neighbours = [key for key, value in closer_to_prey.items() if value == min_length ]
    curr_pos = random.choice(focused_neighbours)

    # Assigning the position accorinding to the given priorrity
    if len(set(closer_to_prey).intersection(set(farther_from_predator))) != 0 and flag == 0:
        # curr_pos = min(closer_to_prey, key=closer_to_prey.get)
        min_length = min(closer_to_prey.values())
        focused_neighbours = [key for key, value in closer_to_prey.items() if value == min_length ]
        curr_pos = random.choice(focused_neighbours)
        #print("priority 1")
        flag = 1

    elif len(set(closer_to_prey).intersection(set(not_closer_to_predator))) != 0 and flag == 0:
        # curr_pos = min(closer_to_prey, key=closer_to_prey.get)
        min_length = min(closer_to_prey.values())
        focused_neighbours = [key for key, value in closer_to_prey.items() if value == min_length ]
        curr_pos = random.choice(focused_neighbours)
        #print("priority 2")
        flag = 1

    elif len(set(not_farther_from_prey).intersection(set(farther_from_predator))) != 0 and flag == 0:
        # curr_pos = min(not_farther_from_prey, key=not_farther_from_prey.get)
        min_length = min(not_farther_from_prey.values())
        focused_neighbours = [key for key, value in not_farther_from_prey.items() if value == min_length ]
        curr_pos = random.choice(focused_neighbours)
        #print("priority 3")
        flag = 1

    elif len(set(closer_to_prey).intersection(set(not_closer_to_predator))) != 0 and flag == 0:
        # curr_pos = min(closer_to_prey, key=closer_to_prey.get)
        min_length = min(closer_to_prey.values())
        focused_neighbours = [key for key, value in closer_to_prey.items() if value == min_length ]
        curr_pos = random.choice(focused_neighbours)
        #print("priority 4")
        flag = 1

    elif len(farther_from_predator) != 0 and flag == 0:
        # curr_pos = max(farther_from_predator, key=farther_from_predator.get)
        min_length = min(farther_from_predator.values())
        focused_neighbours = [key for key, value in farther_from_predator.items() if value == min_length ]
        curr_pos = random.choice(focused_neighbours)
        #print("priority 5")
        flag = 1

    elif len(not_closer_to_predator) != 0 and flag == 0:
        # curr_pos = min(not_closer_to_predator, key=not_closer_to_predator.get)
        min_length = min(not_closer_to_predator.values())
        focused_neighbours = [key for key, value in not_closer_to_predator.items() if value == min_length ]
        curr_pos = random.choice(focused_neighbours)
        #print("priority 6")

    else:
        #print("Sitting and Praying")
        return 999


    return curr_pos


def update_prey_belief_state_defective_drone(prey_belief_state, agent_curr_pos, agent_prev_pos, arena, found_prey, surveyed_node,
                             checkpoint):
    """
    Updates prey belief state

    Parameters:
    prey_belief_state (dict): Stores prey's belief state
    agent_curr_pos (int): Stores Agent's current position
    agent_prev_pos (int): Stores Agent's previous position
    arena (dict): Contains the graph
    found_prey (bool): Contains prey is found status
    surveyed_node (int): Contains the node that was surveyed by the agent
    checkpoint (string): Describes which part of th function to run


    Returns:
    new_prey_belief_state (dict): The updated belief state
    """

    # Initializing the new prey belief states
    new_prey_belief_state = dict.fromkeys([i for i in range(50)], 999.0)
    new_prey_belief_state[agent_curr_pos] = 0.0

    # After surveying the node
    if checkpoint == 'after_survey':
        if found_prey:
            for i in range(50):
                new_prey_belief_state[i] = 0.0
            new_prey_belief_state[surveyed_node] = 1.0
            return new_prey_belief_state
        else:
            new_prey_belief_state[surveyed_node] = 0.0
            for i in range(50):
                if i not in (agent_curr_pos, surveyed_node):
                    new_prey_belief_state[i] = prey_belief_state[i] / (
                                sum(prey_belief_state.values()) - 0.9*prey_belief_state[surveyed_node] - prey_belief_state[agent_curr_pos])
                elif i == surveyed_node:
                    new_prey_belief_state[i] = prey_belief_state[i]*0.1 / (
                            sum(prey_belief_state.values()) - (0.9 * prey_belief_state[surveyed_node]))
            return new_prey_belief_state

    elif checkpoint == 'after_agent_moves':
        if found_prey:
            return prey_belief_state
        else:

            new_prey_belief_state[agent_prev_pos] = 0.0
            new_prey_belief_state[agent_curr_pos] = 0.0
            for i in range(50):
                if i not in (agent_curr_pos, agent_prev_pos):

                    new_prey_belief_state[i] = prey_belief_state[i] / (sum(prey_belief_state.values()) - prey_belief_state[agent_curr_pos])
            return new_prey_belief_state

    elif checkpoint == 'after_prey_moves':
        new_prey_belief_state[agent_curr_pos] = 0.0

        temp_prey_belief_state = dict.fromkeys([i for i in range(50)], 999.0)
        temp_prey_belief_state[agent_curr_pos] = 0.0

        # prey has moved
        for i in range(50):
            temp_sum = 0.0
            for j in arena[i]:
                temp_sum += prey_belief_state[j] / (get_degree(arena, j) + 1)
            temp_sum += prey_belief_state[i] / (get_degree(arena, i) + 1)
            temp_prey_belief_state[i] = temp_sum

        # pretend to survey node for agent curr pos
        new_prey_belief_state[agent_curr_pos] = 0.0
        for i in range(50):
            if i != agent_curr_pos:
                new_prey_belief_state[i] = temp_prey_belief_state[i] / (
                            sum(temp_prey_belief_state.values()) - temp_prey_belief_state[agent_curr_pos])
        return new_prey_belief_state

def update_predator_belief_state_defective_drone(predator_belief_state, agent_curr_pos, agent_prev_pos, arena, found_predator,
                                 surveyed_node, checkpoint):
    """
    Updates predator belief state

    Parameters:
    predator_belief_state (dict): Stores predator's belief state
    agent_curr_pos (int): Stores Agent's current position
    agent_prev_pos (int): Stores Agent's previous position
    arena (dict): Contains the graph
    found_predator (bool): Contains predator is found status
    surveyed_node (int): Contains the node that was surveyed by the agent
    checkpoint (string): Describes which part of the function to run


    Returns:
    new_prey_belief_state (dict): The updated belief state
    """

    # Initializing the new predator belief states
    new_predator_belief_state = dict.fromkeys([i for i in range(50)], 999.0)
    new_predator_belief_state[agent_curr_pos] = 0.0
    # new_predator_belief_state = predator_belief_state

    if checkpoint == 'after_survey':
        if found_predator:
            for i in range(50):
                new_predator_belief_state[i] = 0.0
            new_predator_belief_state[surveyed_node] = 1.0
        else:
            new_predator_belief_state[surveyed_node] = 0.0
            for i in range(50):
                if i not in (agent_curr_pos, surveyed_node):
                    new_predator_belief_state[i] = predator_belief_state[i] / (
                                sum(predator_belief_state.values()) - (0.9*predator_belief_state[surveyed_node]))
                elif i == surveyed_node:
                    new_predator_belief_state[i] = predator_belief_state[i]*0.1 / (
                            sum(predator_belief_state.values()) - (0.9 * predator_belief_state[surveyed_node]))
        return new_predator_belief_state


    elif checkpoint == 'after_agent_moves':
        if found_predator:

            return predator_belief_state

        else:

            new_predator_belief_state[agent_prev_pos] = 0.0
            new_predator_belief_state[agent_curr_pos] = 0.0


            for i in range(50):

                if i not in (agent_curr_pos, agent_prev_pos):

                    new_predator_belief_state[i] = predator_belief_state[i] / (sum(predator_belief_state.values()) - predator_belief_state[agent_curr_pos])

            return new_predator_belief_state

    elif checkpoint == 'after_predator_moves':
        new_predator_belief_state[agent_curr_pos] = 0.0

        temp_predator_belief_state = dict.fromkeys([i for i in range(50)], 999.0)
        temp_predator_belief_state[agent_curr_pos] = 0.0

        # predator has moved
        for i in range(50):
            temp_sum = 0.0
            for j in arena[i]:
                neighbour_path_length = {}

                # Finds the length for the shortest path for each of neighbours
                for k in arena[j]:
                    path, path_length = get_shortest_path(k, agent_curr_pos, arena)
                    neighbour_path_length[k] = path_length

                # Finds all the neighbours that have minimum path length
                min_length = min(neighbour_path_length.values())
                neighbours_with_min_path_length = [key for key, value in neighbour_path_length.items() if
                                                   value == min_length]
                shortest_length_nodes = len(neighbours_with_min_path_length)

                if j in neighbours_with_min_path_length:
                    temp_sum += predator_belief_state[j] * (0.4 / get_degree(arena, j)) + (0.6 / shortest_length_nodes)
                else:
                    temp_sum += predator_belief_state[j] * (0.4 / get_degree(arena, j))

            temp_predator_belief_state[i] = temp_sum


        # pretend to survey node for agent curr pos
        new_predator_belief_state[agent_curr_pos] = 0.0
        for i in range(50):
            if i != agent_curr_pos:
                new_predator_belief_state[i] = temp_predator_belief_state[i] / (
                            sum(temp_predator_belief_state.values()) - temp_predator_belief_state[agent_curr_pos])

        return new_predator_belief_state