Skip to content

Spruce up strategy utils module #1196

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Merged
merged 2 commits into from
Aug 19, 2018
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
136 changes: 110 additions & 26 deletions axelrod/_strategy_utils.py
Original file line number Diff line number Diff line change
@@ -1,5 +1,7 @@
"""Utilities used by various strategies"""
"""Utilities used by various strategies."""

import itertools

from functools import lru_cache

from axelrod.player import update_history
Expand All @@ -23,8 +25,14 @@ def detect_cycle(history, min_size=1, max_size=12, offset=0):
min_size: int, 1
The minimum length of the cycle
max_size: int, 12
The maximum length of the cycle
offset: int, 0
The amount of history to skip initially

Returns
-------
Tuple of C and D
The cycle detected in the input history
"""
history_tail = history[offset:]
new_max_size = min(len(history_tail) // 2, max_size)
Expand All @@ -41,31 +49,89 @@ def detect_cycle(history, min_size=1, max_size=12, offset=0):


def inspect_strategy(inspector, opponent):
"""Simulate one round vs opponent unless opponent has an inspection countermeasure."""
"""Inspects the strategy of an opponent.

Simulate one round of play with an opponent, unless the opponent has
an inspection countermeasure.

Parameters
----------
inspector: Player
The player doing the inspecting
oponnent: Player
The player being inspected

Returns
-------
Action
The action that would be taken by the opponent.
"""
if hasattr(opponent, 'foil_strategy_inspection'):
return opponent.foil_strategy_inspection()
else:
return opponent.strategy(inspector)


def limited_simulate_play(player_1, player_2, h1):
"""Here we want to replay player_1's history to player_2, allowing
player_2's strategy method to set any internal variables as needed. If you
need a more complete simulation, see `simulate_play` in player.py. This
function is specifically designed for the needs of MindReader."""
def _limited_simulate_play(player_1, player_2, h1):
"""Simulates a player's move.

After inspecting player_2's next move (allowing player_2's strategy
method to set any internal variables as needed), update histories
for both players. Note that player_1's move is an argument.

If you need a more complete simulation, see `simulate_play` in
player.py. This function is specifically designed for the needs
of MindReader.

Parameters
----------
player_1: Player
The player whose move is already known.
player_2: Player
The player the we want to inspect.
h1: Action
The next action for first player.
"""
h2 = inspect_strategy(player_1, player_2)
update_history(player_1, h1)
update_history(player_2, h2)


def simulate_match(player_1, player_2, strategy, rounds=10):
"""Simulates a number of matches."""
"""Simulates a number of rounds with a constant strategy.

Parameters
----------
player_1: Player
The player that will have a constant strategy.
player_2: Player
The player we want to simulate.
strategy: Action
The constant strategy to use for first player.
rounds: int
The number of rounds to play.
"""
for match in range(rounds):
limited_simulate_play(player_1, player_2, strategy)
_limited_simulate_play(player_1, player_2, strategy)


def calculate_scores(p1, p2, game):
"""Calculates the score for two players based their history"""
def _calculate_scores(p1, p2, game):
"""Calculates the scores for two players based their history.

Parameters
----------
p1: Player
The first player.
p2: Player
The second player.
game: Game
Game object used to score rounds in the players' histories.

Returns
-------
int, int
The scores for the two input players.
"""
s1, s2 = 0, 0
for pair in zip(p1.history, p2.history):
score = game.score(pair)
Expand All @@ -75,28 +141,46 @@ def calculate_scores(p1, p2, game):


def look_ahead(player_1, player_2, game, rounds=10):
"""Looks ahead for `rounds` and selects the next strategy appropriately."""
results = []
# Simulate plays for `rounds` rounds
players = {C: Cooperator(), D: Defector()}
strategies = [C, D]
for strategy in strategies:
# Instead of a deepcopy, create a new opponent and play out the history
"""Returns an constant action that maximizes score by looking ahead.

Parameters
----------
player_1: Player
The player that will look ahead.
player_2: Player
The oppponent that will be inspected.
game: Game
The Game object used to score rounds.
rounds: int
The number of rounds to look ahead.

Returns
-------
Action
The action that maximized score if it is played constantly.
"""
results = {}
possible_strategies = {C: Cooperator(), D: Defector()}
for action, player in possible_strategies.items():
# Instead of a deepcopy, create a new opponent and replay the history to it.
opponent_ = player_2.clone()
player_ = players[strategy]
for h1 in player_1.history:
limited_simulate_play(player_, opponent_, h1)
for h in player_1.history:
_limited_simulate_play(player, opponent_, h)

simulate_match(player_, opponent_, strategy, rounds)
results.append(calculate_scores(player_, opponent_, game))
# Now play forward with the constant strategy.
simulate_match(player, opponent_, action, rounds)
results[action] = _calculate_scores(player, opponent_, game)

return strategies[results.index(max(results))]
return C if results[C] > results[D] else D


@lru_cache()
def recursive_thue_morse(n):
"""The recursive definition of the Thue-Morse sequence. The first few terms
of the Thue-Morse sequence are: 0 1 1 0 1 0 0 1 1 0 0 1 0 1 1 0 . . ."""
"""The recursive definition of the Thue-Morse sequence.

The first few terms of the Thue-Morse sequence are:
0 1 1 0 1 0 0 1 1 0 0 1 0 1 1 0 . . .
"""

if n == 0:
return 0
Expand Down
79 changes: 74 additions & 5 deletions axelrod/tests/unit/test_strategy_utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,20 +7,24 @@
from hypothesis import given, settings
from hypothesis.strategies import sampled_from, lists, integers

from axelrod import Action
from axelrod._strategy_utils import detect_cycle, inspect_strategy
from axelrod import Action, Game, Player
from axelrod._strategy_utils import detect_cycle, inspect_strategy, look_ahead, \
recursive_thue_morse, simulate_match, thue_morse_generator

C, D = Action.C, Action.D


class TestDetectCycle(unittest.TestCase):
"""Test the detect cycle function"""

@given(cycle=lists(sampled_from([C, D]), min_size=2, max_size=10),
period=integers(min_value=3, max_value=10))
@settings(max_examples=5, max_iterations=20)
@settings(max_examples=5)
def test_finds_cycle(self, cycle, period):
history = cycle * period
self.assertIsNotNone(detect_cycle(history))
detected = detect_cycle(history)
self.assertIsNotNone(detected)
self.assertIn(''.join(map(str, detected)),
''.join(map(str, (cycle))))

def test_no_cycle(self):
history = [C, D, C, C]
Expand Down Expand Up @@ -74,3 +78,68 @@ def test_strategies_with_countermeasures_return_their_countermeasures(self):

self.assertEqual(inspect_strategy(inspector=inspector, opponent=d_geller), D)
self.assertEqual(d_geller.strategy(inspector), C)


class TestSimulateMatch(unittest.TestCase):

def test_tft_reacts_to_cooperation(self):
tft = axelrod.TitForTat()
inspector = axelrod.Alternator()

simulate_match(inspector, tft, C, 5)
self.assertEqual(inspector.history, [C, C, C, C, C])
self.assertEqual(tft.history, [C, C, C, C, C])

def test_tft_reacts_to_defection(self):
tft = axelrod.TitForTat()
inspector = axelrod.Alternator()

simulate_match(inspector, tft, D, 5)
self.assertEqual(inspector.history, [D, D, D, D, D])
self.assertEqual(tft.history, [C, D, D, D, D])


class TestLookAhead(unittest.TestCase):

def setUp(self):
self.inspector = Player()
self.game = Game()

def test_cooperator(self):
tft = axelrod.Cooperator()
# It always makes sense to defect here.
self.assertEqual(look_ahead(self.inspector, tft, self.game, 1), D)
self.assertEqual(look_ahead(self.inspector, tft, self.game, 2), D)
self.assertEqual(look_ahead(self.inspector, tft, self.game, 5), D)


def test_tit_for_tat(self):
tft = axelrod.TitForTat()
# Cooperation should be chosen if we look ahead further than one move.
self.assertEqual(look_ahead(self.inspector, tft, self.game, 1), D)
self.assertEqual(look_ahead(self.inspector, tft, self.game, 2), C)
self.assertEqual(look_ahead(self.inspector, tft, self.game, 5), C)


class TestRecursiveThueMorse(unittest.TestCase):

def test_initial_values(self):
self.assertEqual(recursive_thue_morse(0), 0)
self.assertEqual(recursive_thue_morse(1), 1)
self.assertEqual(recursive_thue_morse(2), 1)
self.assertEqual(recursive_thue_morse(3), 0)
self.assertEqual(recursive_thue_morse(4), 1)


class TestThueMorseGenerator(unittest.TestCase):

def test_initial_values(self):
generator = thue_morse_generator()
values = [next(generator) for i in range(5)]
self.assertEqual(values, [0, 1, 1, 0, 1])

def test_with_offset(self):
generator = thue_morse_generator(start=2)
values = [next(generator) for i in range(5)]
self.assertEqual(values, [1, 0, 1, 0, 0])