# Source code for or_suite.agents.ambulance.stable

import numpy as np

import sys
from .. import Agent


class stableAgent(Agent):
    """
    Agent that implements a stable heuristic algorithm for use with either ambulance environment.

    The policy is to leave things as they are: the action returned by
    ``pick_action`` is exactly the state it was given.

    Methods:
        reset() : clears data, the record of states observed so far
        update_obs(obs, action, reward, newObs, timestep, info) : appends newObs to data
        update_policy(k) : no-op; this agent has no policy to update
        pick_action(state, step) : the action chosen is the most recently observed state
            of the environment

    Attributes:
        epLen: (int) number of time steps to run the experiment for
        data: (int list list or float list list) a list of all the states of the environment observed so far

    """

    def __init__(self, epLen):
        '''
        Args:
            epLen: number of time steps
        '''
        self.epLen = epLen
        # History of observed states; filled by update_obs, emptied by reset.
        self.data = []

    def reset(self):
        '''Discard every state recorded so far.'''
        # Rebind to a fresh list rather than clearing in place, so any
        # outside reference to the previous history is left untouched.
        self.data = []

    def update_obs(self, obs, action, reward, newObs, timestep, info):
        '''Add observation to records.

        Appends newObs, the most recently observed state, to data.

        Args:
            obs: not used by this agent
            action: not used by this agent
            reward: not used by this agent
            newObs: the state to record
            timestep: not used by this agent
            info: not used by this agent
        '''
        # The unused parameters are kept so the signature stays unchanged
        # for callers (presumably the shared Agent interface -- confirm).
        self.data.append(newObs)

    def update_policy(self, k):
        '''Update internal policy based upon records.

        Not used: the stable heuristic has no policy to update, so this
        method does nothing and k is ignored.'''

    def pick_action(self, state, step):
        '''Return the action for the current step.

        Args:
            state: the current state of the environment
            step: not used by this agent

        Returns:
            state itself, unchanged (the same object, not a copy).
        '''
        return state