# Source: congested/run_functions.py (GitHub repository CCarissimo/congested, branch main)

import numpy as np
import scipy.cluster


def initialize_q_table(q_initial, n_agents, n_states, n_actions, qmin=0, qmax=1):
    """Build the initial Q-table for all agents.

    Parameters
    ----------
    q_initial : numpy.ndarray or str
        * ndarray whose shape is exactly ``(n_agents, n_states, n_actions)``:
          returned as-is (the very same object, no copy is made).
        * any other ndarray: its transpose is broadcast-multiplied against
          ``np.ones((n_agents, n_states, n_actions))``.
        * ``"UNIFORM"``: independent uniform samples scaled to
          ``[qmin, qmax)``.
        * ``"ALIGNED"`` / ``"MISALIGNED"``: a fixed pattern of -1 / -2 entries,
          available only for ``n_actions`` equal to 2 or 3.
    n_agents, n_states, n_actions : int
        Dimensions of the table.
    qmin, qmax : float
        Bounds used only by the ``"UNIFORM"`` initialisation.

    Returns
    -------
    numpy.ndarray
        The initial Q-table.

    Raises
    ------
    ValueError
        If ``q_initial`` is not a recognised option, or if a pattern
        initialisation is requested for an unsupported ``n_actions``.
        (Previously these cases hit an unbound local variable.)

    Notes
    -----
    The pattern matrices are ``(n_actions, n_actions)`` and are combined with
    the table shape through NumPy broadcasting, so they line up with the state
    axis when ``n_states == n_actions``.
    """
    shape = (n_agents, n_states, n_actions)

    if isinstance(q_initial, np.ndarray):
        if q_initial.shape == shape:
            return q_initial
        return q_initial.T * np.ones(shape)

    if q_initial == "UNIFORM":
        return (qmax - qmin) * np.random.random_sample(size=shape) + qmin

    if q_initial == "ALIGNED":
        # -1 on the diagonal, -2 elsewhere.
        patterns = {
            3: [[-1, -2, -2], [-2, -1, -2], [-2, -2, -1]],
            2: [[-1, -2], [-2, -1]],
        }
    elif q_initial == "MISALIGNED":
        # -1 shifted one position off the diagonal (cyclically), -2 elsewhere.
        patterns = {
            3: [[-2, -1, -2], [-2, -2, -1], [-1, -2, -2]],
            2: [[-2, -1], [-1, -2]],
        }
    else:
        raise ValueError(
            "unknown q_initial {!r}; expected an ndarray, 'UNIFORM', "
            "'ALIGNED' or 'MISALIGNED'".format(q_initial)
        )

    if n_actions not in patterns:
        raise ValueError(
            "q_initial={!r} is only defined for n_actions in (2, 3), "
            "got {!r}".format(q_initial, n_actions)
        )

    return np.array(patterns[n_actions]).T * np.ones(shape)


def initialize_learning_rates(alpha, n_agents):
    """Return the learning rate(s) to use.

    Parameters
    ----------
    alpha : str, float or numpy.ndarray
        ``"UNIFORM"`` draws one rate per agent uniformly from ``[0, 1)``.
        Any other value is returned unchanged (it is *not* expanded to
        ``n_agents`` entries).
    n_agents : int
        Number of rates to draw for the ``"UNIFORM"`` option.

    Returns
    -------
    numpy.ndarray or the original ``alpha``
    """
    # Only compare against the keyword when alpha really is a string: an
    # ndarray compared to a str yields an elementwise result on current NumPy,
    # whose truth value is ambiguous and makes `if` raise.
    if isinstance(alpha, str) and alpha == "UNIFORM":
        return np.random.random_sample(size=n_agents)
    return alpha


def initialize_exploration_rates(epsilon, n_agents, mask=1):  # default mask 1 leads to no change
    """Return one exploration rate per agent, multiplied by ``mask``.

    Parameters
    ----------
    epsilon : str, float or numpy.ndarray
        ``"UNIFORM"`` draws one rate per agent uniformly from ``[0, 1)``.
        Any other value is multiplied by ``np.ones(n_agents)``, so a scalar is
        repeated for every agent and an array must broadcast against length
        ``n_agents``.
    n_agents : int
        Number of agents.
    mask : scalar or array-like
        Multiplicative factor applied to the rates; the default of 1 leaves
        them unchanged.

    Returns
    -------
    numpy.ndarray
    """
    # Guard the keyword comparison with isinstance: comparing an ndarray to a
    # str is elementwise on current NumPy and cannot be used directly in `if`.
    if isinstance(epsilon, str) and epsilon == "UNIFORM":
        rates = np.random.random_sample(size=n_agents)
    else:
        rates = epsilon * np.ones(n_agents)
    return rates * mask


def welfare(R, N_AGENTS, welfareType="AVERAGE"):
    """Aggregate the rewards ``R`` into a single welfare value.

    Parameters
    ----------
    R : numpy.ndarray
        Rewards; must provide ``sum()``, ``min()`` and ``max()``.
    N_AGENTS : int
        Divisor used for the ``"AVERAGE"`` welfare.
    welfareType : str
        ``"AVERAGE"`` (``R.sum() / N_AGENTS``), ``"MIN"`` or ``"MAX"``.

    Raises
    ------
    ValueError
        If ``welfareType`` is not one of the supported options.
    """
    if welfareType == "AVERAGE":
        return R.sum() / N_AGENTS
    if welfareType == "MIN":
        return R.min()
    if welfareType == "MAX":
        return R.max()
    # Raising a bare string is itself a TypeError in Python 3, which hid the
    # intended message; raise a proper exception carrying it instead.
    raise ValueError("SPECIFY WELFARE TYPE")


def count_groups(q_values, dist):
    """Count the flat clusters found in ``q_values`` at distance ``dist``.

    The observations are linked with average-linkage hierarchical clustering
    and cut with ``fcluster(..., criterion='distance')``.

    Parameters
    ----------
    q_values : array-like
        Input passed to ``scipy.cluster.hierarchy.average``.
    dist : float
        Distance threshold passed to ``fcluster``.

    Returns
    -------
    int
        Number of distinct cluster labels.
    """
    linkage = scipy.cluster.hierarchy.average(q_values)
    labels = scipy.cluster.hierarchy.fcluster(linkage, dist, criterion='distance')
    # fcluster labels start at 1, so len(np.bincount(labels)) would include an
    # always-empty slot for label 0 and over-count by one. Count the distinct
    # labels instead.
    return len(np.unique(labels))


# def calculate_alignment(q_table):
#     argmax_q_table = np.argmax(q_table, axis=2)
#     return (argmax_q_table == np.broadcast_to(np.arange(q_table.shape[2]), (q_table.shape[0], q_table.shape[1]))).mean(axis=0)


def calculate_alignment(q_table, recommendation, actions):
    """Compute three alignment statistics from a Q-table.

    ``q_table`` is indexed as a 3-D array and reduced with ``argmax`` over its
    last axis (presumably agents x states x actions -- confirm with caller).

    Returns
    -------
    belief_alignment : numpy.ndarray
        For every index ``s`` along axis 1, the fraction of rows (axis 0)
        whose argmax over the last axis equals ``s``. The comparison grid is
        ``arange(q_table.shape[2])`` broadcast to the first two dimensions, so
        axes 1 and 2 need matching lengths.
    recommendation_alignment : float
        Fraction of rows ``i`` for which the argmax at
        ``[i, recommendation[i]]`` equals ``recommendation[i]``.
    action_alignment : float
        Fraction of entries where ``recommendation`` equals ``actions``.
    """
    greedy = np.argmax(q_table, axis=2)
    leading_shape = (q_table.shape[0], q_table.shape[1])

    # Grid whose entry [i, s] is simply s, to compare against the greedy choice.
    index_grid = np.broadcast_to(np.arange(q_table.shape[2]), leading_shape)
    belief_alignment = (greedy == index_grid).mean(axis=0)

    row_ids = np.arange(q_table.shape[0])
    greedy_at_recommendation = greedy[row_ids, recommendation]
    recommendation_alignment = (recommendation == greedy_at_recommendation).mean()

    action_alignment = (recommendation == actions).mean()

    return belief_alignment, recommendation_alignment, action_alignment