sat: rework to use integral variable, not individual bools

2023-05-20 18:03:23 +02:00 · 2023-05-20 18:03:23 +02:00 · ac261c629e
commit ac261c629e
parent de00fdc0e1
1 changed files with 17 additions and 34 deletions
--- a/sat.py
+++ b/sat.py
@ -1,5 +1,6 @@
 import copy
-from pysmt.shortcuts import Symbol, Bool, Not, Implies, Iff, And, Or, AtMostOne, ExactlyOne, get_model, get_atoms, get_formula_size, get_unsat_core
+from pysmt.shortcuts import Symbol, Bool, Not, Implies, Iff, And, Or, AtMostOne, ExactlyOne, get_model, get_atoms, get_formula_size, get_unsat_core, Equals, GE, NotEquals, Int
 from pysmt.typing import INT
 from pysmt.rewritings import conjunctive_partition
 import json
 from typing import List, Optional, Tuple
@ -19,28 +20,15 @@ class Literals():
    # default distribution among all suits is assumed
    def __init__(self, instance: HanabiInstance):
-        # clues[m][i] == "after move m we have at least i clues"
+        # clues[m][i] == "after move m we have i clues", in clue starved, this counts half clues
        self.clues = {
-                -1: { i: Bool(i < 9) for i in range(0, 10) }  # we have 8 clues after turn -1
+                -1: Int(16 if instance.clue_starved else 8)  # we have 8 clues after turn
                , **{
-                        m: {
+                        m: Symbol('m{}clues'.format(m), INT)
                            0: Bool(True),                                                # always at least 0 clues
                            **{ i: Symbol('m{}clues{}'.format(m, i)) for i in range(1, 9) },
                            9: Bool(False)                                                # never 9 or more clues. This will implicitly forbid discarding at 8 clues later
                           }
                        for m in range(instance.max_winning_moves)
                    }
                }
        # half_clue[m] == "after move we have (an additional) half a clue [relevant for ClueStarved variants]"
        self.half_clue = {
                -1: Bool(False)
                , **{
                    m: Symbol('m{}halfclue'.format(m))
                    for m in range(instance.max_winning_moves)
                    }
                }
        # strikes[m][i] == "after move m we have at least i strikes"
        self.strikes = {
                    -1: {i: Bool(i == 0) for i in range(0, instance.num_strikes + 1)}    # no strikes when we start
@ -152,8 +140,8 @@ def solve_sat(starting_state: GameState | HanabiInstance) -> Tuple[bool, Optiona
        # have to set additional variables
        # set initial clues
-        for i in range(0,10):
+        for i in range(0, 10):
-            ls.clues[first_turn - 1][i] = Bool(i <= game_state.clues)
+            ls.clues[first_turn - 1] = Int(game_state.clues)
        # set initial strikes
        for i in range(0, instance.num_strikes + 1):
@ -202,18 +190,13 @@ def solve_sat(starting_state: GameState | HanabiInstance) -> Tuple[bool, Optiona
        Iff(ls.play5[m], And(ls.play[m], Or(ls.discard[m][i] for i in range(instance.deck_size) if instance.deck[i].rank == 5))),
        # definition of ls.incr_clues
-        Iff(ls.incr_clues[m], And(ls.discard_any[m], Not(ls.clues[m-1][8]), Implies(ls.play[m], ls.play5[m]))),
+        Iff(ls.incr_clues[m], And(ls.discard_any[m], NotEquals(ls.clues[m-1], Int(16 if instance.clue_starved else 8)), Implies(ls.play[m], ls.play5[m]))),
        # change of ls.clues
-        *[
+        Implies(And(Not(ls.discard_any[m]), Not(ls.dummyturn[m])),
-            Iff(ls.clues[m][i], Or(
+                Equals(ls.clues[m], ls.clues[m-1] - (2 if instance.clue_starved else 1))),
-                ls.clues[m-1][i+1],
+        Implies(ls.incr_clues[m], Equals(ls.clues[m], ls.clues[m-1] + 1)),
-                And(ls.clues[m-1][i], Or(ls.discard_any[m], ls.dummyturn[m])),
+        Implies(And(Or(ls.discard_any[m], ls.dummyturn[m]), Not(ls.incr_clues[m])), Equals(ls.clues[m], ls.clues[m-1])),
                And(ls.clues[m-1][i-1], ls.incr_clues[m], ls.half_clue[m-1] if instance.clue_starved else Bool(True))
                )
            )
          for i in range(1, 9)
        ],
        Iff(ls.half_clue[m], Or(And(ls.half_clue[m-1], Not(ls.incr_clues[m])), And(Not(ls.half_clue[m-1])), ls.incr_clues[m]))
        if instance.clue_starved else Bool(True),
@ -223,13 +206,13 @@ def solve_sat(starting_state: GameState | HanabiInstance) -> Tuple[bool, Optiona
        # It's easy to see that if there is any solution to the instance, then there is also one where we only strike at 8 clues
        # (or not at all) -> Just strike later if neccessary
        # So, we decrease the solution space with this formulation, but do not change whether it's empty or not
-        Iff(ls.strike[m], And(ls.discard_any[m], Not(ls.play[m]), ls.clues[m-1][8])),
+        Iff(ls.strike[m], And(ls.discard_any[m], Not(ls.play[m]), Equals(ls.clues[m-1], Int(16 if instance.clue_starved else 8)))),
        # change of strikes
        *[Iff(ls.strikes[m][i], Or(ls.strikes[m-1][i], And(ls.strikes[m-1][i-1], ls.strike[m]))) for i in range(1, instance.num_strikes + 1)],
        # less than 0 clues not allowed
-        Implies(Not(ls.discard_any[m]), Or(ls.clues[m-1][1], ls.dummyturn[m])),
+        Implies(Not(ls.discard_any[m]), Or(GE(ls.clues[m-1], Int(1)), ls.dummyturn[m])),
        # we can only draw card i if the last ls.drawn card was i-1
        *[Implies(ls.draw[m][i], Or(And(ls.draw[m0][i-1], *[Not(ls.draw_any[m1]) for m1 in range(m0+1, m)]) for m0 in range(max(first_turn - 1, m-9), m))) for i in range(game_state.progress, instance.deck_size)],
@ -325,7 +308,7 @@ def log_model(model, cur_game_state, ls: Literals):
        logger.debug('[print_model] Note: Omitting first {} turns, since they were fixed already.'.format(first_turn))
    for m in range(first_turn, cur_game_state.instance.max_winning_moves):
        logger.debug('=== move {} ==='.format(m))
-        logger.debug('clues: ' + ''.join(str(i) for i in range(1, 9) if model.get_py_value(ls.clues[m][i])))
+        logger.debug('clues: {}'.format(model.get_py_value(ls.clues[m])))
        logger.debug('strikes: ' + ''.join(str(i) for i in range(1, 3) if model.get_py_value(ls.strikes[m][i])))
        logger.debug('draw: ' + ', '.join('{}: {}'.format(i, deck[i]) for i in range(cur_game_state.progress, cur_game_state.instance.deck_size) if model.get_py_value(ls.draw[m][i])))
        logger.debug('discard: ' + ', '.join('{}: {}'.format(i, deck[i]) for i in range(cur_game_state.instance.deck_size) if model.get_py_value(ls.discard[m][i])))