tests for max_regret/infoset regret on mixed behavior profiles

rahulsavani · rahulsavani · commit fef1ab144abe · 2025-12-16T18:55:36.000Z
diff --git a/tests/test_behav.py b/tests/test_behav.py
@@ -798,9 +798,11 @@ def test_action_value_by_label_reference(game: gbt.Game, label: str,
      (games.create_mixed_behav_game_efg(), True),
      (games.create_stripped_down_poker_efg(), False),
      (games.create_stripped_down_poker_efg(), True),
+     (games.create_kuhn_poker_efg(), False),
+     (games.create_kuhn_poker_efg(), True),
      ]
 )
-def test_regret_consistency(game: gbt.Game, rational_flag: bool):
+def test_action_regret_consistency(game: gbt.Game, rational_flag: bool):
     profile = game.mixed_behavior_profile(rational=rational_flag)
     for player in game.players:
         for infoset in player.infosets:
@@ -812,6 +814,60 @@ def test_regret_consistency(game: gbt.Game, rational_flag: bool):
                 )
 
 
+@pytest.mark.parametrize(
+    "game,rational_flag",
+    [(games.create_mixed_behav_game_efg(), False),
+     (games.create_mixed_behav_game_efg(), True),
+     (games.create_stripped_down_poker_efg(), False),
+     (games.create_stripped_down_poker_efg(), True),
+     (games.create_kuhn_poker_efg(), False),
+     (games.create_kuhn_poker_efg(), True),
+     ]
+)
+def test_infoset_regret_consistency(game: gbt.Game, rational_flag: bool):
+    """infoset_regret() must equal the best action_value() minus infoset_value()."""
+    profile = game.mixed_behavior_profile(rational=rational_flag)
+    for player in game.players:
+        for infoset in player.infosets:
+            regret = profile.infoset_regret(infoset)
+            best_value = max(profile.action_value(action) for action in infoset.actions)
+            value = profile.infoset_value(infoset)
+            assert regret == best_value - value
+
+
+@pytest.mark.parametrize(
+    "game,rational_flag",
+    [(games.create_mixed_behav_game_efg(), False),
+     (games.create_mixed_behav_game_efg(), True),
+     (games.create_stripped_down_poker_efg(), False),
+     (games.create_stripped_down_poker_efg(), True),
+     (games.create_kuhn_poker_efg(), False),
+     (games.create_kuhn_poker_efg(), True)],
+)
+def test_max_regret_consistency(game: gbt.Game, rational_flag: bool):
+    """max_regret() of a behavior profile must equal that of its as_strategy() conversion."""
+    behav_profile = game.mixed_behavior_profile(rational=rational_flag)
+    assert behav_profile.max_regret() == behav_profile.as_strategy().max_regret()
+
+
+@pytest.mark.parametrize(
+    "game,rational_flag",
+    [(games.create_mixed_behav_game_efg(), False),
+     (games.create_mixed_behav_game_efg(), True),
+     (games.create_stripped_down_poker_efg(), False),
+     (games.create_stripped_down_poker_efg(), True),
+     (games.create_kuhn_poker_efg(), False),
+     (games.create_kuhn_poker_efg(), True),
+     ]
+)
+def test_agent_max_regret_consistency(game: gbt.Game, rational_flag: bool):
+    """agent_max_regret() must equal the largest infoset_regret() over game.infosets."""
+    profile = game.mixed_behavior_profile(rational=rational_flag)
+    agent_regret = profile.agent_max_regret()
+    largest_infoset_regret = max(profile.infoset_regret(infoset) for infoset in game.infosets)
+    assert agent_regret == largest_infoset_regret
+
+
 @pytest.mark.parametrize(
     "game,player_idx,infoset_idx,action_idx,action_probs,rational_flag,tol,value",
     [
@@ -823,14 +879,14 @@ def test_regret_consistency(game: gbt.Game, rational_flag: bool):
      (games.create_mixed_behav_game_efg(), 2, 0, 0, None, False, TOL, 0),
      (games.create_mixed_behav_game_efg(), 2, 0, 1, None, False, TOL, 0.5),  # 3.5 - 3
      # U1 U2 U3
-     (games.create_mixed_behav_game_efg(), 0, 0, 0, [1.0, 0.0, 1.0, 0.0, 1.0, 0.0], False, TOL, 0),
-     (games.create_mixed_behav_game_efg(), 0, 0, 0, ["1", "0", "1", "0", "1", "0"], True, ZERO, 0),
-     (games.create_mixed_behav_game_efg(), 0, 0, 1, [1.0, 0.0, 1.0, 0.0, 1.0, 0.0], False, TOL, 9),
-     (games.create_mixed_behav_game_efg(), 0, 0, 1, ["1", "0", "1", "0", "1", "0"], True, ZERO, 9),
-     (games.create_mixed_behav_game_efg(), 1, 0, 0, [1.0, 0.0, 1.0, 0.0, 1.0, 0.0], False, TOL, 0),
-     (games.create_mixed_behav_game_efg(), 1, 0, 0, ["1", "0", "1", "0", "1", "0"], True, ZERO, 0),
-     (games.create_mixed_behav_game_efg(), 1, 0, 1, [1.0, 0.0, 1.0, 0.0, 1.0, 0.0], False, TOL, 8),
-     (games.create_mixed_behav_game_efg(), 1, 0, 1, ["1", "0", "1", "0", "1", "0"], True, ZERO, 8),
+     (games.create_mixed_behav_game_efg(), 0, 0, 0, [1, 0, 1, 0, 1, 0], False, TOL, 0),
+     (games.create_mixed_behav_game_efg(), 0, 0, 0, [1, 0, 1, 0, 1, 0], True, ZERO, 0),
+     (games.create_mixed_behav_game_efg(), 0, 0, 1, [1, 0, 1, 0, 1, 0], False, TOL, 9),
+     (games.create_mixed_behav_game_efg(), 0, 0, 1, [1, 0, 1, 0, 1, 0], True, ZERO, 9),
+     (games.create_mixed_behav_game_efg(), 1, 0, 0, [1, 0, 1, 0, 1, 0], False, TOL, 0),
+     (games.create_mixed_behav_game_efg(), 1, 0, 0, [1, 0, 1, 0, 1, 0], True, ZERO, 0),
+     (games.create_mixed_behav_game_efg(), 1, 0, 1, [1, 0, 1, 0, 1, 0], False, TOL, 8),
+     (games.create_mixed_behav_game_efg(), 1, 0, 1, [1, 0, 1, 0, 1, 0], True, ZERO, 8),
      # Mixed Nash equilibrium
      (games.create_mixed_behav_game_efg(), 0, 0, 0, ["2/5", "3/5", "1/2", "1/2", "1/3", "2/3"],
       True, ZERO, 0),
@@ -858,9 +914,9 @@ def test_regret_consistency(game: gbt.Game, rational_flag: bool):
       True, ZERO, "8/3"),  # (2/3*2 + 1/3*1) - (-1)
      ]
 )
-def test_regret_reference(game: gbt.Game, player_idx: int, infoset_idx: int, action_idx: int,
-                          action_probs: None | list, rational_flag: bool,
-                          tol: gbt.Rational | float, value: str | float):
+def test_action_regret_reference(game: gbt.Game, player_idx: int, infoset_idx: int,
+                                 action_idx: int, action_probs: None | list, rational_flag: bool,
+                                 tol: gbt.Rational | float, value: str | float):
     action = game.players[player_idx].infosets[infoset_idx].actions[action_idx]
     profile = game.mixed_behavior_profile(rational=rational_flag)
     if action_probs:
@@ -955,6 +1011,41 @@ def test_agent_liap_value_reference(game: gbt.Game, action_probs: None | list,
     )
 
 
+@pytest.mark.parametrize(
+    "game,action_probs,rational_flag,max_regret,agent_max_regret,liap_value,agent_liap_value",
+    [
+     # uniform (non-Nash):
+     (games.create_mixed_behav_game_efg(), None, True, "1/4", "1/4", "1/16", "1/16"),
+     (games.create_mixed_behav_game_efg(), None, False, 0.25, 0.25, 0.0625, 0.0625),
+     # Myerson fig 4.2
+     pytest.param(
+        games.read_from_file("myerson_fig_4_2.efg"), [0, 1, 0, 1, 1, 0], True, 1, 0, 1, 0,
+        marks=pytest.mark.xfail(reason="Needs to be fixed now")
+     ),
+     ]
+)
+def test_agent_max_regret_versus_non_agent(game: gbt.Game, action_probs: None | list,
+                                           rational_flag: bool,
+                                           max_regret: str | float,
+                                           agent_max_regret: str | float,
+                                           liap_value: str | float,
+                                           agent_liap_value: str | float):
+    """Compare max_regret/liap_value and their agent_* counterparts with reference values.
+
+    Expected values are converted with ``gbt.Rational`` when ``rational_flag`` is set.
+    """
+    def expected(value):
+        return gbt.Rational(value) if rational_flag else value
+
+    profile = game.mixed_behavior_profile(rational=rational_flag)
+    if action_probs:
+        _set_action_probs(profile, action_probs, rational_flag)
+    assert profile.max_regret() == expected(max_regret)
+    assert profile.agent_max_regret() == expected(agent_max_regret)
+    assert profile.liap_value() == expected(liap_value)
+    assert profile.agent_liap_value() == expected(agent_liap_value)
+
+
 @pytest.mark.parametrize(
     "game,tol,probs,infoset_idx,member_idx,value,rational_flag",
     [(games.create_mixed_behav_game_efg(), TOL, [0.8, 0.2, 0.4, 0.6, 0.0, 1.0], 0, 0, 1.0, False),
@@ -1157,6 +1248,39 @@ def _get_and_check_answers(game: gbt.Game, action_probs1: tuple, action_probs2:
       lambda x, y: x.agent_liap_value(), lambda x: [1]),
      (games.create_stripped_down_poker_efg(), PROBS_1A_rat, PROBS_2A_rat, True,
       lambda x, y: x.agent_liap_value(), lambda x: [1]),
+     ######################################################################################
+     # liap_value (of profile, hence [1] for objects_to_test,
+     # any singleton collection would do)
+     (games.create_mixed_behav_game_efg(), PROBS_1A_doub, PROBS_2A_doub, False,
+      lambda x, y: x.liap_value(), lambda x: [1]),
+     (games.create_mixed_behav_game_efg(), PROBS_1A_rat, PROBS_2A_rat, True,
+      lambda x, y: x.liap_value(), lambda x: [1]),
+     (games.create_stripped_down_poker_efg(), PROBS_1B_doub, PROBS_2B_doub, False,
+      lambda x, y: x.liap_value(), lambda x: [1]),
+     (games.create_stripped_down_poker_efg(), PROBS_1A_rat, PROBS_2A_rat, True,
+      lambda x, y: x.liap_value(), lambda x: [1]),
+     ######################################################################################
+     # agent_max_regret (of profile, hence [1] for objects_to_test,
+     # any singleton collection would do)
+     (games.create_mixed_behav_game_efg(), PROBS_1A_doub, PROBS_2A_doub, False,
+      lambda x, y: x.agent_max_regret(), lambda x: [1]),
+     (games.create_mixed_behav_game_efg(), PROBS_1A_rat, PROBS_2A_rat, True,
+      lambda x, y: x.agent_max_regret(), lambda x: [1]),
+     (games.create_stripped_down_poker_efg(), PROBS_1B_doub, PROBS_2B_doub, False,
+      lambda x, y: x.agent_max_regret(), lambda x: [1]),
+     (games.create_stripped_down_poker_efg(), PROBS_1A_rat, PROBS_2A_rat, True,
+      lambda x, y: x.agent_max_regret(), lambda x: [1]),
+     ######################################################################################
+     # max_regret (of profile, hence [1] for objects_to_test,
+     # any singleton collection would do)
+     (games.create_mixed_behav_game_efg(), PROBS_1A_doub, PROBS_2A_doub, False,
+      lambda x, y: x.max_regret(), lambda x: [1]),
+     (games.create_mixed_behav_game_efg(), PROBS_1A_rat, PROBS_2A_rat, True,
+      lambda x, y: x.max_regret(), lambda x: [1]),
+     (games.create_stripped_down_poker_efg(), PROBS_1B_doub, PROBS_2B_doub, False,
+      lambda x, y: x.max_regret(), lambda x: [1]),
+     (games.create_stripped_down_poker_efg(), PROBS_1A_rat, PROBS_2A_rat, True,
+      lambda x, y: x.max_regret(), lambda x: [1]),
      ]
 )
 def test_profile_order_consistency(game: gbt.Game,
diff --git a/tests/test_mixed.py b/tests/test_mixed.py
@@ -795,7 +795,7 @@ def _get_and_check_answers(game: gbt.Game, action_probs1: tuple, action_probs2:
 PROBS_2A_doub = (0.5, 0, 0.5, 0)
 PROBS_1A_rat = ("1/4", "1/4", "1/4", "1/4")
 PROBS_2A_rat = ("1/2", "0", "1/2", "0")
-# For 2x2x2 nfg and Myserson 2-card poker efg (both have 6 strategies in total):
+# For 2x2x2 nfg and stripped_down_poker efg (both have 6 strategies in total):
 PROBS_1B_doub = (0.5, 0.5, 0.5, 0.5, 0.5, 0.5)
 PROBS_2B_doub = (1.0, 0.0, 1.0, 0.0, 1.0, 0.0)
 PROBS_1B_rat = ("1/2", "1/2", "1/2", "1/2", "1/2", "1/2")
@@ -933,6 +933,29 @@ def _get_and_check_answers(game: gbt.Game, action_probs1: tuple, action_probs2:
      pytest.param(games.create_stripped_down_poker_efg(), PROBS_1B_rat, PROBS_2B_rat, True,
                   lambda profile, y: profile.liap_value(), lambda x: [1],
                   id="liap_value_poker_rat"),
+     #################################################################################
+     # max_regret (of profile, hence [1] for objects_to_test, any singleton collection would do)
+     # 4x4 coordination nfg
+     pytest.param(games.create_coord_4x4_nfg(), PROBS_1A_doub, PROBS_2A_doub, False,
+                  lambda profile, y: profile.max_regret(), lambda x: [1],
+                  id="max_regret_coord_doub"),
+     pytest.param(games.create_coord_4x4_nfg(), PROBS_1A_rat, PROBS_2A_rat, True,
+                  lambda profile, y: profile.max_regret(), lambda x: [1],
+                  id="max_regret_coord_rat"),
+     # 2x2x2 nfg
+     pytest.param(games.create_2x2x2_nfg(), PROBS_1B_doub, PROBS_2B_doub, False,
+                  lambda profile, y: profile.max_regret(), lambda x: [1],
+                  id="max_regret_2x2x2_doub"),
+     pytest.param(games.create_2x2x2_nfg(), PROBS_1B_rat, PROBS_2B_rat, True,
+                  lambda profile, y: profile.max_regret(), lambda x: [1],
+                  id="max_regret_2x2x2_rat"),
+     # stripped-down poker
+     pytest.param(games.create_stripped_down_poker_efg(), PROBS_1B_doub, PROBS_2B_doub, False,
+                  lambda profile, y: profile.max_regret(), lambda x: [1],
+                  id="max_regret_poker_doub"),
+     pytest.param(games.create_stripped_down_poker_efg(), PROBS_1B_rat, PROBS_2B_rat, True,
+                  lambda profile, y: profile.max_regret(), lambda x: [1],
+                  id="max_regret_poker_rat"),
      ]
 )
 def test_profile_order_consistency(game: gbt.Game,
diff --git a/tests/test_nash.py b/tests/test_nash.py
@@ -141,8 +141,8 @@ def test_enumpoly_ordered_behavior(
     game: gbt.Game, mixed_behav_prof_data: list, stop_after: None | int
 ):
     """Test calls of enumpoly for mixed behavior equilibria,
-    using max_regret (internal consistency); and comparison to a set of previously
-    computed equilibria using this function (regression test).
+    using max_regret and agent_max_regret (internal consistency); and
+    comparison to a set of previously computed equilibria with this function (regression test).
     This set will be the full set of all computed equilibria if stop_after is None,
     else the first stop_after-many equilibria.
 
@@ -162,6 +162,7 @@ def test_enumpoly_ordered_behavior(
         result = gbt.nash.enumpoly_solve(game, use_strategic=False)
     assert len(result.equilibria) == len(mixed_behav_prof_data)
     for eq, exp in zip(result.equilibria, mixed_behav_prof_data, strict=True):
+        assert abs(eq.max_regret()) <= TOL
         assert abs(eq.agent_max_regret()) <= TOL
         expected = game.mixed_behavior_profile(rational=True, data=exp)
         for p in game.players:
@@ -197,8 +198,8 @@ def test_enumpoly_unordered_behavior(
     game: gbt.Game, mixed_behav_prof_data: list, stop_after: None | int
 ):
     """Test calls of enumpoly for mixed behavior equilibria,
-    using max_regret (internal consistency); and comparison to a set of previously
-    computed equilibria using this function (regression test).
+    using max_regret and agent_max_regret (internal consistency); and
+    comparison to a set of previously computed equilibria using this function (regression test).
 
     This set will be the full set of all computed equilibria if stop_after is None,
     else the first stop_after-many equilibria.
@@ -229,6 +230,7 @@ def are_the_same(game, found, candidate):
         return True
 
     for eq in result.equilibria:
+        assert abs(eq.max_regret()) <= TOL
         assert abs(eq.agent_max_regret()) <= TOL
         found = False
         for exp in mixed_behav_prof_data[:]:
@@ -423,12 +425,13 @@ def test_lcp_behavior_double():
 def test_lcp_behavior_rational(game: gbt.Game, mixed_behav_prof_data: list):
     """Test calls of LCP for mixed behavior equilibria, rational precision.
 
-    using max_regret (internal consistency); and comparison to a previously
-    computed equilibrium using this function (regression test)
+    using max_regret and agent_max_regret (internal consistency); and
+    comparison to a previously computed equilibrium using this function (regression test).
     """
     result = gbt.nash.lcp_solve(game, use_strategic=False, rational=True)
     assert len(result.equilibria) == 1
     eq = result.equilibria[0]
+    assert eq.max_regret() == 0
     assert eq.agent_max_regret() == 0
     expected = game.mixed_behavior_profile(rational=True, data=mixed_behav_prof_data)
     assert eq == expected
@@ -552,12 +555,13 @@ def test_lp_behavior_double():
 )
 def test_lp_behavior_rational(game: gbt.Game, mixed_behav_prof_data: list):
     """Test calls of LP for mixed behavior equilibria, rational precision,
-    using max_regret (internal consistency); and comparison to a previously
-    computed equilibrium using this function (regression test)
+    using max_regret and agent_max_regret (internal consistency); and
+    comparison to a previously computed equilibrium using this function (regression test).
     """
     result = gbt.nash.lp_solve(game, use_strategic=False, rational=True)
     assert len(result.equilibria) == 1
     eq = result.equilibria[0]
+    assert eq.max_regret() == 0
     assert eq.agent_max_regret() == 0
     expected = game.mixed_behavior_profile(rational=True, data=mixed_behav_prof_data)
     assert eq == expected