# Error-driven Payoff and Fairness

In [2]:
import sys
import warnings

# Make the project's source tree importable. The path is relative to the
# notebook's working directory. The membership check keeps the cell
# idempotent: re-running it no longer appends duplicate sys.path entries.
if "../src" not in sys.path:
    sys.path.append("../src")

# NOTE: this silences every warning category for the rest of the session.
warnings.filterwarnings("ignore")

In [3]:
from Classes.cognitive_model_agents import FairnessM1, FairnessM2, FairnessM3
from Utils.unit_tests import (
    test_bar_is_full, 
    test_bar_has_capacity,
    test_alternation
)

In [4]:
# Two-agent configuration used by the unit-test cells that follow.
fixed_parameters = dict(threshold=0.5, num_agents=2)

# Free (tunable) parameters handed to the agent constructors.
free_parameters = dict(
    learning_rate=0.2,
    bias=0.5,
    inverse_temperature=16,
)

In [5]:
from pathlib import Path

# Output folders for figures: one shared root plus one subfolder per model.
image_folder_all = Path('../images/Fairness')
image_folder_M1 = image_folder_all / 'M1'
image_folder_M2 = image_folder_all / 'M2'
image_folder_M3 = image_folder_all / 'M3'

# Create the folders (and any missing parents); existing ones are left alone.
for _folder in (image_folder_all, image_folder_M1, image_folder_M2, image_folder_M3):
    _folder.mkdir(parents=True, exist_ok=True)

1. [M1](#m1)
2. [M2](#m2)
3. [M3](#m3)

## M1 <a class="anchor" id="m1"></a>

In [5]:
# M1: run the "bar has capacity" unit test on a freshly built agent.
# Uses whichever fixed_parameters / free_parameters are currently in scope.
agent = FairnessM1(
    n=0,
    fixed_parameters=fixed_parameters,
    free_parameters=free_parameters,
)
agent.debug = True  # set the agent's debug flag before running the test
test_bar_has_capacity(agent)


------------------------------------------------------------
Test bar has capacity
------------------------------------------------------------
Initial state: [0, 0]
---------- Round 0 ----------
Action preferences in state [0, 0]: [0. 0.]
Action probabilities:
no go:0.5 ---- go:0.5
Chosen action: 0
State arrived: [0, 0]
Payoff action 0: 0
Average fairness: -0.5
Payoff: 0
G observed for action 0 in state (0, 0) is: -0.25
Learning rule:
Q[0] <- 0.0 + 0.2 * (-0.25 - 0.0)
Q[0] = -0.05
---------- Round 1 ----------
Action preferences in state [0, 0]: [-0.05  0.  ]
Action probabilities:
no go:0.31002551887238755 ---- go:0.6899744811276125
Chosen action: 0
State arrived: [0, 0]
Payoff action 0: 0
Average fairness: -0.5
Payoff: 0
G observed for action 0 in state [0, 0] is: -0.25
Learning rule:
Q[0] <- -0.05 + 0.2 * (-0.25 - -0.05)
Q[0] = -0.09000000000000001
---------- Round 2 ----------
Action preferences in state [0, 0]: [-0.09  0.  ]
Action probabilities:
no go:0.19154534856146746 ---- go

In [6]:
# M1: run the "bar is full" unit test on a freshly built agent.
agent = FairnessM1(
    n=0,
    fixed_parameters=fixed_parameters,
    free_parameters=free_parameters,
)
agent.debug = True  # set the agent's debug flag before running the test
test_bar_is_full(agent)


------------------------------------------------------------
Test bar is full
------------------------------------------------------------
Initial state: [1, 1]
---------- Round 0 ----------
Action preferences in state [1, 1]: [0. 0.]
Action probabilities:
no go:0.5 ---- go:0.5
Chosen action: 0
State arrived: [0, 1]
Payoff action 0: 0
Average fairness: 0.0
Payoff: 0
G observed for action 0 in state (1, 1) is: 0.0
Learning rule:
Q[0] <- 0.0 + 0.2 * (0.0 - 0.0)
Q[0] = 0.0
---------- Round 1 ----------
Action preferences in state [0, 1]: [0. 0.]
Action probabilities:
no go:0.5 ---- go:0.5
Chosen action: 1
State arrived: [1, 1]
Payoff action 1: -1
Average fairness: -0.16666666666666663
Payoff: -1
G observed for action 1 in state [0, 1] is: -0.5833333333333333
Learning rule:
Q[1] <- 0.0 + 0.2 * (-0.5833333333333333 - 0.0)
Q[1] = -0.11666666666666665
---------- Round 2 ----------
Action preferences in state [1, 1]: [ 0.         -0.11666667]
Action probabilities:
no go:0.8660721116759263 ---

In [7]:
# M1: run the alternation unit test on a freshly built agent.
agent = FairnessM1(
    n=0,
    fixed_parameters=fixed_parameters,
    free_parameters=free_parameters,
)
agent.debug = True  # set the agent's debug flag before running the test
test_alternation(agent)


------------------------------------------------------------
Test other player alternates
------------------------------------------------------------
Initial state: [0, 0]
---------- Round 0 ----------
Action preferences in state [0, 0]: [0. 0.]
Action probabilities:
no go:0.5 ---- go:0.5
Chosen action: 1
State arrived: [1, 1]
Payoff action 1: -1
Average fairness: -0.0
Payoff: -1
G observed for action 1 in state (0, 0) is: -0.5
Learning rule:
Q[1] <- 0.0 + 0.2 * (-0.5 - 0.0)
Q[1] = -0.1
---------- Round 1 ----------
Action preferences in state [1, 1]: [ 0.  -0.1]
Action probabilities:
no go:0.8320183851339245 ---- go:0.1679816148660755
Chosen action: 0
State arrived: [0, 0]
Payoff action 0: 0
Average fairness: -0.16666666666666669
Payoff: 0
G observed for action 0 in state [1, 1] is: -0.08333333333333334
Learning rule:
Q[0] <- 0.0 + 0.2 * (-0.08333333333333334 - 0.0)
Q[0] = -0.01666666666666667
---------- Round 2 ----------
Action preferences in state [0, 0]: [-0.01666667 -0.1       

In [8]:
# Six-agent configuration for the simulations below.
# This rebinds the two-agent settings used by the unit-test cells.
fixed_parameters = dict(threshold=0.5, num_agents=6)

free_parameters = dict(
    learning_rate=0.2,
    bias=0.5,
    inverse_temperature=16,
)

# Simulation size: number of episodes and rounds per episode, no verbose output.
simulation_parameters = dict(
    num_episodes=100,
    num_rounds=1000,
    verbose=False,
)

In [9]:
from Utils.interaction import Performer

# M1: sweep the `bias` free parameter over four values.
# The plots are saved into the M1 image folder.
LaTeX_string = Performer.sweep(
    agent_class=FairnessM1,
    sweep_parameter='bias',
    values=[0, 0.2, 0.4, 0.6],
    measures=[
        'conditional_entropy',
        'entropy',
        'efficiency',
        'inequality',
    ],
    fixed_parameters=fixed_parameters,
    free_parameters=free_parameters,
    simulation_parameters=simulation_parameters,
    image_folder=image_folder_M1,
)

Running models for each bias:   0%|          | 0/4 [00:00<?, ?it/s]

  0%|          | 0/100 [00:00<?, ?it/s]

  0%|          | 0/100 [00:00<?, ?it/s]

  0%|          | 0/100 [00:00<?, ?it/s]

  0%|          | 0/100 [00:00<?, ?it/s]

Plotting conditional_entropy...
Plot saved to ..\images\Fairness\M1\conditional_entropy_bias.png
Plotting entropy...
Plot saved to ..\images\Fairness\M1\entropy_bias.png
Plotting efficiency...
Plot saved to ..\images\Fairness\M1\efficiency_bias.png
Plotting inequality...
Plot saved to ..\images\Fairness\M1\inequality_bias.png


---

## M2 <a class="anchor" id="m2"></a>

In [10]:
# Back to the two-agent configuration for the M2 unit tests.
fixed_parameters = dict(threshold=0.5, num_agents=2)
free_parameters = dict(
    learning_rate=0.2,
    bias=0.5,
    inverse_temperature=16,
)

# M2: run the "bar has capacity" unit test on a freshly built agent.
agent = FairnessM2(
    n=0,
    fixed_parameters=fixed_parameters,
    free_parameters=free_parameters,
)
agent.debug = True  # set the agent's debug flag before running the test
test_bar_has_capacity(agent)


------------------------------------------------------------
Test bar has capacity
------------------------------------------------------------
Initial state: [0, 0]
---------- Round 0 ----------
Action preferences in state [0, 0]: [0. 0.]
Action probabilities:
no go:0.5 ---- go:0.5
Chosen action: 1
State arrived: [1, 0]
Payoff action 1: 1
Average fairness: -0.0
Payoff: 1
G observed for action 1 in state (0, 0) is: 0.5
Learning rule:
Q[(0, 0), 1] <- 0.0 + 0.2 * (0.5 - 0.0)
Q[(0, 0), 1] = 0.1
---------- Round 1 ----------
Action preferences in state [1, 0]: [0. 0.]
Action probabilities:
no go:0.5 ---- go:0.5
Chosen action: 1
State arrived: [1, 0]
Payoff action 1: 1
Average fairness: -0.16666666666666663
Payoff: 1
G observed for action 1 in state [1, 0] is: 0.4166666666666667
Learning rule:
Q[(1, 0), 1] <- 0.0 + 0.2 * (0.4166666666666667 - 0.0)
Q[(1, 0), 1] = 0.08333333333333334
---------- Round 2 ----------
Action preferences in state [1, 0]: [0.         0.08333333]
Action probabilitie

In [11]:
# M2: run the "bar is full" unit test on a freshly built agent.
agent = FairnessM2(
    n=0,
    fixed_parameters=fixed_parameters,
    free_parameters=free_parameters,
)
agent.debug = True  # set the agent's debug flag before running the test
test_bar_is_full(agent)


------------------------------------------------------------
Test bar is full
------------------------------------------------------------
Initial state: [1, 1]
---------- Round 0 ----------
Action preferences in state [1, 1]: [0. 0.]
Action probabilities:
no go:0.5 ---- go:0.5
Chosen action: 0
State arrived: [0, 1]
Payoff action 0: 0
Average fairness: 0.0
Payoff: 0
G observed for action 0 in state (1, 1) is: 0.0
Learning rule:
Q[(1, 1), 0] <- 0.0 + 0.2 * (0.0 - 0.0)
Q[(1, 1), 0] = 0.0
---------- Round 1 ----------
Action preferences in state [0, 1]: [0. 0.]
Action probabilities:
no go:0.5 ---- go:0.5
Chosen action: 1
State arrived: [1, 1]
Payoff action 1: -1
Average fairness: -0.16666666666666663
Payoff: -1
G observed for action 1 in state [0, 1] is: -0.5833333333333333
Learning rule:
Q[(0, 1), 1] <- 0.0 + 0.2 * (-0.5833333333333333 - 0.0)
Q[(0, 1), 1] = -0.11666666666666665
---------- Round 2 ----------
Action preferences in state [1, 1]: [0. 0.]
Action probabilities:
no go:0.5 ----

In [12]:
# M2: run the alternation unit test on a freshly built agent.
agent = FairnessM2(
    n=0,
    fixed_parameters=fixed_parameters,
    free_parameters=free_parameters,
)
agent.debug = True  # set the agent's debug flag before running the test
test_alternation(agent)


------------------------------------------------------------
Test other player alternates
------------------------------------------------------------
Initial state: [0, 0]
---------- Round 0 ----------
Action preferences in state [0, 0]: [0. 0.]
Action probabilities:
no go:0.5 ---- go:0.5
Chosen action: 1
State arrived: [1, 1]
Payoff action 1: -1
Average fairness: -0.0
Payoff: -1
G observed for action 1 in state (0, 0) is: -0.5
Learning rule:
Q[(0, 0), 1] <- 0.0 + 0.2 * (-0.5 - 0.0)
Q[(0, 0), 1] = -0.1
---------- Round 1 ----------
Action preferences in state [1, 1]: [0. 0.]
Action probabilities:
no go:0.5 ---- go:0.5
Chosen action: 0
State arrived: [0, 0]
Payoff action 0: 0
Average fairness: -0.16666666666666669
Payoff: 0
G observed for action 0 in state [1, 1] is: -0.08333333333333334
Learning rule:
Q[(1, 1), 0] <- 0.0 + 0.2 * (-0.08333333333333334 - 0.0)
Q[(1, 1), 0] = -0.01666666666666667
---------- Round 2 ----------
Action preferences in state [0, 0]: [ 0.  -0.1]
Action probabi

In [13]:
# Six-agent configuration for the M2 simulations below.
fixed_parameters = dict(threshold=0.5, num_agents=6)

free_parameters = dict(
    learning_rate=0.2,
    bias=0.5,
    inverse_temperature=16,
)

# Simulation size: number of episodes and rounds per episode, no verbose output.
simulation_parameters = dict(
    num_episodes=100,
    num_rounds=1000,
    verbose=False,
)

In [14]:
from Utils.interaction import Performer

# M2: sweep the `bias` free parameter over four values.
# The plots are saved into the M2 image folder.
LaTeX_string = Performer.sweep(
    agent_class=FairnessM2,
    sweep_parameter='bias',
    values=[0, 0.2, 0.4, 0.6],
    measures=[
        'efficiency',
        'inequality',
        'entropy',
        'conditional_entropy',
    ],
    fixed_parameters=fixed_parameters,
    free_parameters=free_parameters,
    simulation_parameters=simulation_parameters,
    image_folder=image_folder_M2,
)

Running models for each bias:   0%|          | 0/4 [00:00<?, ?it/s]

  0%|          | 0/100 [00:00<?, ?it/s]

  0%|          | 0/100 [00:00<?, ?it/s]

  0%|          | 0/100 [00:00<?, ?it/s]

  0%|          | 0/100 [00:00<?, ?it/s]

Plotting efficiency...
Plot saved to ..\images\Fairness\M2\efficiency_bias.png
Plotting inequality...
Plot saved to ..\images\Fairness\M2\inequality_bias.png
Plotting entropy...
Plot saved to ..\images\Fairness\M2\entropy_bias.png
Plotting conditional_entropy...
Plot saved to ..\images\Fairness\M2\conditional_entropy_bias.png


---

## M3 <a class="anchor" id="m3"></a>

In [15]:
# Back to the two-agent configuration for the M3 unit tests.
fixed_parameters = dict(threshold=0.5, num_agents=2)
free_parameters = dict(
    learning_rate=0.2,
    bias=0.5,
    inverse_temperature=16,
)

# M3: run the "bar has capacity" unit test on a freshly built agent.
agent = FairnessM3(
    n=0,
    fixed_parameters=fixed_parameters,
    free_parameters=free_parameters,
)
agent.debug = True  # set the agent's debug flag before running the test
test_bar_has_capacity(agent)


------------------------------------------------------------
Test bar has capacity
------------------------------------------------------------
Initial state: [0, 0]
---------- Round 0 ----------
Action preferences in state [0, 0]: [0. 0.]
Action probabilities:
no go:0.5 ---- go:0.5
Chosen action: 1
State arrived: [1, 0]
Payoff action 1: 1
Average fairness: -0.0
Payoff: 1
G observed for action 1 in state (0, 0) is: 0.5
Learning rule:
Q[(0, 0),1] <- 0.0 + 0.2 * (0.5 - 0.0)
Q[(0, 0),1] = 0.1
---------- Round 1 ----------
Action preferences in state [1, 0]: [0. 0.]
Action probabilities:
no go:0.5 ---- go:0.5
Chosen action: 1
State arrived: [1, 0]
Payoff action 1: 1
Average fairness: -0.16666666666666663
Payoff: 1
G observed for action 1 in state [1, 0] is: 0.4166666666666667
Learning rule:
Q[[1, 0],1] <- 0.0 + 0.2 * (0.4166666666666667 - 0.0)
Q[[1, 0],1] = 0.08333333333333334
---------- Round 2 ----------
Action preferences in state [1, 0]: [0.         0.08333333]
Action probabilities:
n

In [16]:
# M3: run the "bar is full" unit test on a freshly built agent.
agent = FairnessM3(
    n=0,
    fixed_parameters=fixed_parameters,
    free_parameters=free_parameters,
)
agent.debug = True  # set the agent's debug flag before running the test
test_bar_is_full(agent)


------------------------------------------------------------
Test bar is full
------------------------------------------------------------
Initial state: [1, 1]
---------- Round 0 ----------
Action preferences in state [1, 1]: [0. 0.]
Action probabilities:
no go:0.5 ---- go:0.5
Chosen action: 1
State arrived: [1, 1]
Payoff action 1: -1
Average fairness: -0.5
Payoff: -1
G observed for action 1 in state (1, 1) is: -0.75
Learning rule:
Q[(1, 1),1] <- 0.0 + 0.2 * (-0.75 - 0.0)
Q[(1, 1),1] = -0.15000000000000002
---------- Round 1 ----------
Action preferences in state [1, 1]: [ 0.   -0.15]
Action probabilities:
no go:0.9168273035060777 ---- go:0.08317269649392234
Chosen action: 0
State arrived: [0, 1]
Payoff action 0: 0
Average fairness: 0.16666666666666663
Payoff: 0
G observed for action 0 in state [1, 1] is: 0.08333333333333331
Learning rule:
Q[[1, 1],0] <- 0.0 + 0.2 * (0.08333333333333331 - 0.0)
Q[[1, 1],0] = 0.016666666666666663
---------- Round 2 ----------
Action preferences in stat

In [17]:
# M3: run the alternation unit test on a freshly built agent.
agent = FairnessM3(
    n=0,
    fixed_parameters=fixed_parameters,
    free_parameters=free_parameters,
)
agent.debug = True  # set the agent's debug flag before running the test
test_alternation(agent)


------------------------------------------------------------
Test other player alternates
------------------------------------------------------------
Initial state: [0, 0]
---------- Round 0 ----------
Action preferences in state [0, 0]: [0. 0.]
Action probabilities:
no go:0.5 ---- go:0.5
Chosen action: 1
State arrived: [1, 1]
Payoff action 1: -1
Average fairness: -0.0
Payoff: -1
G observed for action 1 in state (0, 0) is: -0.5
Learning rule:
Q[(0, 0),1] <- 0.0 + 0.2 * (-0.5 - 0.0)
Q[(0, 0),1] = -0.1
---------- Round 1 ----------
Action preferences in state [1, 1]: [0. 0.]
Action probabilities:
no go:0.5 ---- go:0.5
Chosen action: 0
State arrived: [0, 0]
Payoff action 0: 0
Average fairness: -0.16666666666666669
Payoff: 0
G observed for action 0 in state [1, 1] is: -0.08333333333333334
Learning rule:
Q[[1, 1],0] <- 0.0 + 0.2 * (-0.08333333333333334 - 0.0)
Q[[1, 1],0] = -0.01666666666666667
---------- Round 2 ----------
Action preferences in state [0, 0]: [ 0.  -0.1]
Action probabiliti

In [18]:
# Six-agent configuration for the M3 simulations below.
fixed_parameters = dict(threshold=0.5, num_agents=6)

free_parameters = dict(
    learning_rate=0.2,
    bias=0.5,
    inverse_temperature=16,
)

# Simulation size: number of episodes and rounds per episode, no verbose output.
simulation_parameters = dict(
    num_episodes=100,
    num_rounds=1000,
    verbose=False,
)

In [19]:
from Utils.interaction import Performer

# M3: sweep the `bias` free parameter over four values.
# The plots are saved into the M3 image folder.
LaTeX_string = Performer.sweep(
    agent_class=FairnessM3,
    sweep_parameter='bias',
    values=[0, 0.2, 0.4, 0.6],
    measures=[
        'efficiency',
        'inequality',
        'entropy',
        'conditional_entropy',
    ],
    fixed_parameters=fixed_parameters,
    free_parameters=free_parameters,
    simulation_parameters=simulation_parameters,
    image_folder=image_folder_M3,
)

Running models for each bias:   0%|          | 0/4 [00:00<?, ?it/s]

  0%|          | 0/100 [00:00<?, ?it/s]

  0%|          | 0/100 [00:00<?, ?it/s]

  0%|          | 0/100 [00:00<?, ?it/s]

  0%|          | 0/100 [00:00<?, ?it/s]

Plotting efficiency...
Plot saved to ..\images\Fairness\M3\efficiency_bias.png
Plotting inequality...
Plot saved to ..\images\Fairness\M3\inequality_bias.png
Plotting entropy...
Plot saved to ..\images\Fairness\M3\entropy_bias.png
Plotting conditional_entropy...
Plot saved to ..\images\Fairness\M3\conditional_entropy_bias.png


---

In [20]:
from Utils.interaction import Performer

# Shared configuration for the M1 / M2 / M3 comparison.
# Note that bias is 0.3 here, not the 0.5 used in earlier cells.
fixed_parameters = dict(threshold=0.5, num_agents=6)

free_parameters = dict(
    learning_rate=0.2,
    bias=0.3,
    inverse_temperature=16,
)

simulation_parameters = dict(
    num_episodes=100,
    num_rounds=1000,
    verbose=False,
)

# One run specification per model, each with its own seed.
# Every entry refers to the same three parameter dict objects.
list_dicts = [
    {
        'agent_class': model_class,
        'fixed_parameters': fixed_parameters,
        'free_parameters': free_parameters,
        'simulation_parameters': simulation_parameters,
        'seed': model_seed,
    }
    for model_class, model_seed in (
        (FairnessM1, 7),
        (FairnessM2, 9),
        (FairnessM3, 0),
    )
]

In [22]:
# ------------------------------------------------------------------
# Compare the three models and save the plots to the shared folder.
# ------------------------------------------------------------------
# NOTE(review): the 'model_names' keys use an 'Attendance-' prefix although
# the agents compared here are Fairness classes. Confirm that these keys
# match the model names Performer generates, otherwise the short labels
# may not be applied.
perf = Performer.simple_vs(
    list_dicts=list_dicts,
    image_folder=image_folder_all,
    measures=[
        'efficiency',
        'inequality',
        'entropy',
        'conditional_entropy',
    ],
    kwargs={
        'T': 20,
        'model_names': {
            'Attendance-M1-7': 'M1',
            'Attendance-M2-9': 'M2',
            'Attendance-M3-0': 'M3',
        },
        'figsize': (3.5, 3),
    },
)

  0%|          | 0/100 [00:00<?, ?it/s]

: 

---

In [6]:
from Utils.interaction import Performer

# Configuration for the single-episode runs rendered below.
fixed_parameters = dict(threshold=0.5, num_agents=6)

free_parameters = dict(
    learning_rate=0.2,
    bias=0.3,
    inverse_temperature=16,
)

# Only one episode per run here (earlier cells used 100).
simulation_parameters = dict(
    num_episodes=1,
    num_rounds=1000,
    verbose=False,
)

In [7]:
# M1: single-episode runs with the 'render' measure, saved to the M1 folder.
# NOTE(review): the printed output suggests simple_run picks its own seeds,
# so results may differ between runs. Confirm whether seeds can be fixed.
LaTeX_string = Performer.simple_run(
    agent_class=FairnessM1,
    measures=['render'],
    image_folder=image_folder_M1,
    fixed_parameters=fixed_parameters,
    free_parameters=free_parameters,
    simulation_parameters=simulation_parameters,
)

Seeds chosen for simple simulation: [18, 27, 3, 6]


Running seeds...:   0%|          | 0/4 [00:00<?, ?it/s]

  0%|          | 0/1 [00:00<?, ?it/s]

  0%|          | 0/1 [00:00<?, ?it/s]

  0%|          | 0/1 [00:00<?, ?it/s]

  0%|          | 0/1 [00:00<?, ?it/s]

In [8]:
# M2: single-episode runs with the 'render' measure, saved to the M2 folder.
# NOTE(review): the printed output suggests simple_run picks its own seeds,
# so results may differ between runs. Confirm whether seeds can be fixed.
LaTeX_string = Performer.simple_run(
    agent_class=FairnessM2,
    measures=['render'],
    image_folder=image_folder_M2,
    fixed_parameters=fixed_parameters,
    free_parameters=free_parameters,
    simulation_parameters=simulation_parameters,
)

Seeds chosen for simple simulation: [58, 96, 73, 31]


Running seeds...:   0%|          | 0/4 [00:00<?, ?it/s]

  0%|          | 0/1 [00:00<?, ?it/s]

  0%|          | 0/1 [00:00<?, ?it/s]

  0%|          | 0/1 [00:00<?, ?it/s]

  0%|          | 0/1 [00:00<?, ?it/s]

In [9]:
# M3: single-episode runs with the 'render' measure, saved to the M3 folder.
# NOTE(review): the printed output suggests simple_run picks its own seeds,
# so results may differ between runs. Confirm whether seeds can be fixed.
LaTeX_string = Performer.simple_run(
    agent_class=FairnessM3,
    measures=['render'],
    image_folder=image_folder_M3,
    fixed_parameters=fixed_parameters,
    free_parameters=free_parameters,
    simulation_parameters=simulation_parameters,
)

Seeds chosen for simple simulation: [11, 23, 75, 14]


Running seeds...:   0%|          | 0/4 [00:00<?, ?it/s]

  0%|          | 0/1 [00:00<?, ?it/s]

  0%|          | 0/1 [00:00<?, ?it/s]

  0%|          | 0/1 [00:00<?, ?it/s]

  0%|          | 0/1 [00:00<?, ?it/s]