Axelrod-Python · meatballs · Mar 27, 2020 · Mar 17, 2020 · Mar 24, 2020 · Mar 25, 2020
diff --git a/axelrod/strategies/_strategies.py b/axelrod/strategies/_strategies.py
@@ -208,6 +208,7 @@
     Michaelos,
     NTitsForMTats,
     OmegaTFT,
+    OriginalGradual,
     RandomTitForTat,
     SlowTitForTwoTats2,
     SneakyTitForTat,

diff --git a/axelrod/strategies/titfortat.py b/axelrod/strategies/titfortat.py
@@ -384,18 +384,27 @@ def strategy(self, opponent: Player) -> Action:
         return move
 
 
-class Gradual(Player):
+class OriginalGradual(Player):
     """
     A player that punishes defections with a growing number of defections
-    but after punishing enters a calming state and cooperates no matter what
-    the opponent does for two rounds.
+    but after punishing for `punishment_limit` number of times enters a calming
+    state and cooperates no matter what the opponent does for two rounds.
+
+    The `punishment_limit` is incremented whenever the opponent defects and the
+    strategy is not in either calming or punishing state.
+
+    Note that `Gradual` appears in [CRISTAL-SMAC2018]_ however that version of
+    `Gradual` does not give the results reported in [Beaufils1997]_ which is the
+    paper that first introduced the strategy. For a longer discussion of this
+    see: https://github.com/Axelrod-Python/Axelrod/issues/1294. This is why this
+    strategy has been renamed to `OriginalGradual`.
 
     Names:
 
     - Gradual: [Beaufils1997]_
      """
 
-    name = "Gradual"
+    name = "Original Gradual"
     classifier = {
         "memory_depth": float("inf"),
         "stochastic": False,
@@ -438,6 +447,68 @@ def strategy(self, opponent: Player) -> Action:
 
         return C
 
+class Gradual(Player):
+    """
+    Similar to OriginalGradual, this is a player that punishes defections with a
+    growing number of defections but after punishing for `punishment_limit`
+    number of times enters a calming state and cooperates no matter what the
+    opponent does for two rounds.
+
+    This version of Gradual is an update of `OriginalGradual` and the difference
+    is that the `punishment_limit` is incremented whenever the opponent defects
+    (regardless of the state of the player).
+
+    Note that this version of `Gradual` appears in [CRISTAL-SMAC2018]_ however
+    this version of
+    `Gradual` does not give the results reported in [Beaufils1997]_ which is the
+    paper that first introduced the strategy. For a longer discussion of this
+    see: https://github.com/Axelrod-Python/Axelrod/issues/1294.
+
+    This version is based on  https://github.com/cristal-smac/ipd/blob/master/src/strategies.py#L224
+
+    Names:
+
+    - Gradual: [CRISTAL-SMAC2018]_
+    """
+
+    name = "Gradual"
+    classifier = {
+        "memory_depth": float("inf"),
+        "stochastic": False,
+        "makes_use_of": set(),
+        "long_run_time": False,
+        "inspects_source": False,
+        "manipulates_source": False,
+        "manipulates_state": False,
+    }
+
+    def __init__(self) -> None:
+
+        super().__init__()
+        self.calm_count = 0
+        self.punish_count = 0
+
+    def strategy(self, opponent: Player) -> Action:
+
+        if len(self.history) == 0:
+            return C
+
+
+        if self.punish_count > 0:
+            self.punish_count -= 1
+            return D
+
+        if self.calm_count > 0:
+            self.calm_count -= 1
+            return C
+
+        if opponent.history[-1] == D:
+            self.punish_count = opponent.defections - 1
+            self.calm_count = 2
+            return D
+        return C
+
+
 
 @TrackHistoryTransformer(name_prefix=None)
 class ContriteTitForTat(Player):

diff --git a/axelrod/tests/strategies/test_titfortat.py b/axelrod/tests/strategies/test_titfortat.py
@@ -336,6 +336,229 @@ class TestGradual(TestPlayer):
         "manipulates_state": False,
     }
 
+    def test_strategy(self):
+        # Punishes defection with a growing number of defections and calms
+        # the opponent with two cooperations in a row.
+        opponent = axelrod.MockPlayer(actions=[C])
+        actions = [(C, C)]
+        self.versus_test(
+            opponent,
+            expected_actions=actions,
+            attrs={
+                "calm_count": 0,
+                "punish_count": 0,
+            },
+        )
+
+        opponent = axelrod.MockPlayer(actions=[D])
+        actions = [(C, D)]
+        self.versus_test(
+            opponent,
+            expected_actions=actions,
+            attrs={
+                "calm_count": 0,
+                "punish_count": 0,
+            },
+        )
+
+        opponent = axelrod.MockPlayer(actions=[D, C])
+        actions = [(C, D), (D, C)]
+        self.versus_test(
+            opponent,
+            expected_actions=actions,
+            attrs={
+                "calm_count": 2,
+                "punish_count": 0,
+            },
+        )
+
+        opponent = axelrod.MockPlayer(actions=[D, C, C])
+        actions = [(C, D), (D, C), (C, C)]
+        self.versus_test(
+            opponent,
+            expected_actions=actions,
+            attrs={
+                "calm_count": 1,
+                "punish_count": 0,
+            },
+        )
+
+        opponent = axelrod.MockPlayer(actions=[D, C, D, C])
+        actions = [(C, D), (D, C), (C, D), (C, C)]
+        self.versus_test(
+            opponent,
+            expected_actions=actions,
+            attrs={
+                "calm_count": 0,
+                "punish_count": 0,
+            },
+        )
+
+        opponent = axelrod.MockPlayer(actions=[D, C, D, C, C])
+        actions = [(C, D), (D, C), (C, D), (C, C), (C, C)]
+        self.versus_test(
+            opponent,
+            expected_actions=actions,
+            attrs={
+                "calm_count": 0,
+                "punish_count": 0,
+            },
+        )
+
+        opponent = axelrod.MockPlayer(actions=[D, C, D, C, C, C])
+        actions = [(C, D), (D, C), (C, D), (C, C), (C, C), (C, C)]
+        self.versus_test(
+            opponent,
+            expected_actions=actions,
+            attrs={
+                "calm_count": 0,
+                "punish_count": 0,
+            },
+        )
+
+        opponent = axelrod.MockPlayer(actions=[D, C, D, C, C, C, D, C])
+        actions = [(C, D), (D, C), (C, D), (C, C), (C, C), (C, C), (C, D), (D, C)]
+        self.versus_test(
+            opponent,
+            expected_actions=actions,
+            attrs={
+                "calm_count": 2,
+                "punish_count": 2,
+            },
+        )
+
+        opponent = axelrod.MockPlayer(actions=[D, C, D, C, C, D, D, D])
+        actions = [(C, D), (D, C), (C, D), (C, C), (C, C), (C, D), (D, D), (D, D)]
+        self.versus_test(
+            opponent,
+            expected_actions=actions,
+            attrs={
+                "calm_count": 2,
+                "punish_count": 1,
+            },
+        )
+
+        opponent = axelrod.Defector()
+        actions = [
+                (C, D),
+                (D, D), # 1 defection as a response to the 1 defection by opponent
+                (C, D),
+                (C, D),
+                (D, D), # starts defecting after a total of 4 defections by the opponent
+                (D, D),
+                (D, D),
+                (D, D), # 4 defections
+                (C, D),
+                (C, D),
+                (D, D), # Start defecting after a total of 10 defections by the opponent
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),  # 10 defections
+                (C, D),
+                (C, D),
+                (D, D), # starts defecting after 22 defections by the opponent
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D), # 22 defections
+                (C, D),
+                (C, D),
+                (D, D),
+                (D, D),
+                (D, D),
+                (D, D),
+        ]
+        self.versus_test(
+            opponent,
+            expected_actions=actions,
+            attrs={
+                "calm_count": 2,
+                "punish_count": 42,
+            },
+        )
+
+    def test_specific_set_of_results(self):
+        """
+        This tests specific reported results as discussed in
+        https://github.com/Axelrod-Python/Axelrod/issues/1294
+
+        The results there used a version of mistrust with a bug that corresponds
+        to a memory one player that start by defecting and only cooperates if
+        both players cooperated in the previous round.
+        """
+        mistrust_with_bug = axelrod.MemoryOnePlayer(
+                initial=D,
+                four_vector=(1, 0, 0, 0),
+                )
+        players = [
+               self.player(),
+               axelrod.TitForTat(),
+               axelrod.GoByMajority(),
+               axelrod.Grudger(),
+               axelrod.WinStayLoseShift(),
+               axelrod.Prober(),
+               axelrod.Defector(),
+               mistrust_with_bug,
+               axelrod.Cooperator(),
+               axelrod.CyclerCCD(),
+               axelrod.CyclerDDC(),
+        ]
+        axelrod.seed(1)
+        tournament = axelrod.Tournament(players, turns=1000, repetitions=1)
+        results = tournament.play(progress_bar=False)
+        scores = [round(average_score_per_turn * 1000, 1)
+                  for average_score_per_turn in results.payoff_matrix[0]]
+        expected_scores = [
+                3000.0,
+                3000.0,
+                3000.0,
+                3000.0,
+                3000.0,
+                2999.0,
+                983.0,
+                983.0,
+                3000.0,
+                3596.0,
+                2302.0,
+                ]
+        self.assertEqual(scores, expected_scores)
+
+class TestOriginalGradual(TestPlayer):
+
+    name = "Original Gradual"
+    player = axelrod.OriginalGradual
+    expected_classifier = {
+        "memory_depth": float("inf"),
+        "stochastic": False,
+        "makes_use_of": set(),
+        "inspects_source": False,
+        "manipulates_source": False,
+        "manipulates_state": False,
+    }
+
     def test_strategy(self):
         # Punishes defection with a growing number of defections and calms
         # the opponent with two cooperations in a row.
@@ -466,6 +689,9 @@ def test_output_from_literature(self):
         Dilemma" Proc. Artif. Life 1996
 
         This test just ensures that the strategy is as was originally defined.
+
+        See https://github.com/Axelrod-Python/Axelrod/issues/1294 for another
+        discussion of this.
         """
         player = self.player()
 

diff --git a/docs/reference/bibliography.rst b/docs/reference/bibliography.rst
@@ -25,6 +25,7 @@ documentation.
 .. [Bendor1993] Bendor, Jonathan. "Uncertainty and the Evolution of Cooperation." The Journal of Conflict Resolution, 37(4), 709–734.
 .. [Beaufils1997] Beaufils, B. & Delahaye, J. & Mathieu, P. (1997). Our Meeting With Gradual: A Good Strategy For The Iterated Prisoner’s Dilemma. http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.42.4041
 .. [Berg2015] Berg, P. Van Den, & Weissing, F. J. (2015). The importance of mechanisms for the evolution of cooperation. Proceedings of the Royal Society B-Biological Sciences, 282.
+.. [CRISTAL-SMAC2018] CRISTAL Lab, SMAC Team, Lille University (2018). IPD : the Iterated Prisoner's Dilemma. https://github.com/cristal-smac/ipd
 .. [Downing1975] Downing, Leslie L. "The Prisoner's Dilemma game as a problem-solving phenomenon: An outcome maximization interpretation." Simulation & Games 6.4 (1975): 366-391.
 .. [Eckhart2015] Eckhart Arnold (2016) CoopSim v0.9.9 beta 6.  https://github.com/jecki/CoopSim/
 .. [Frean1994] Frean, Marcus R. "The Prisoner's Dilemma without Synchrony." Proceedings: Biological Sciences, vol. 257, no. 1348, 1994, pp. 75–79. www.jstor.org/stable/50253.