// Endgame-Analyzer/game_state.h

#ifndef DYNAMIC_PROGRAM_GAME_STATE_H
#define DYNAMIC_PROGRAM_GAME_STATE_H

#include <algorithm>
#include <array>
#include <bitset>
#include <compare>
#include <cstddef>
#include <cstdint>
#include <limits>
#include <list>
#include <optional>
#include <ostream>
#include <string>
#include <tuple>
#include <vector>

#include <boost/container/static_vector.hpp>


namespace Hanabi {

// Compact integer aliases used by the game-state types declared below.
// Rank of a card and value of a play stack (see Card::rank and Stacks).
using rank_t = std::uint8_t;
// Index of a suit (see Card::suit).
using suit_t = std::uint8_t;
// Clue-token counter.
using clue_t = std::uint8_t;
// Signed on purpose: the negative values draw_pile and trash_or_play_stack are declared with this type.
using player_t = std::int8_t;
// Position of a card inside a hand.
using hand_index_t = std::uint8_t;

// NOTE(review): state_t is not referenced anywhere else in this header — confirm it is still needed.
using state_t = std::uint32_t;

/**
 * Rank convention used throughout this header.
 *
 * Stacks are played downwards, from n to 0, and playing a 0 yields a clue.
 * For default Hanabi the cards of each stack are therefore played in the
 * order 4, 3, 2, 1, 0. A stack with no cards played implicitly has value 5
 * on it. This is easier to implement, because the number of cards that still
 * have to be played on a stack is then always the current value of the stack.
 *
 * The constants are `inline` so that every translation unit including this
 * header refers to the same object instead of its own internal-linkage copy.
 */
// Value of a stack on which nothing has been played yet; also the row length used by CardArray.
inline constexpr rank_t starting_card_rank = 5;
// Largest suit index (suit_initials provides six entries, 0..5).
inline constexpr suit_t max_suit_index = 5;
// Capacity of the per-card position lists kept by HanabiState.
inline constexpr std::size_t max_card_duplicity = 3;
// Negative player_t sentinels. Presumably they mark a card location that is
// not a player's hand — TODO confirm against the implementation file.
inline constexpr player_t draw_pile = -1;
inline constexpr player_t trash_or_play_stack = -2;
// Presumably the upper bound on the number of clue tokens — TODO confirm.
inline constexpr clue_t max_num_clues = 8;

// One-letter label per suit index (0..5).
// Declared `inline const` rather than `constexpr`: a std::string object with
// static storage duration is not a valid constant expression before C++20 and
// is only accepted by some standard libraries afterwards. The element type is
// left unchanged so existing users keep working.
inline const std::array<std::string, 6> suit_initials{"r", "y", "g", "b", "p", "t"};

/**
 * A single card, identified by suit and rank plus two bookkeeping flags.
 *
 * All members carry value-initializers so that a default-initialized Card
 * (`Card c;`) holds well-defined values; the struct remains an aggregate, so
 * brace initialization such as `Card{0, 4}` keeps working.
 */
struct Card {
  // Index of the suit this card belongs to.
  suit_t suit{};
  // Rank of the card (see the rank convention documented at starting_card_rank).
  rank_t rank{};
  // Bookkeeping flag; presumably set for cards dealt into a starting hand — TODO confirm.
  bool was_in_initial_hand{};
  // Bookkeeping flag; presumably set for cards that were already trash at setup — TODO confirm.
  bool initial_trash{};

  // Pre- and post-increment; the definitions are not part of this header section.
  Card &operator++();
  // NOTE(review): returning `const Card` by value inhibits moves; changing it
  // requires touching the out-of-line definition as well.
  const Card operator++(int);

  // Memberwise comparison in declaration order. Note that both flags take
  // part: two cards with equal suit and rank but different flags are unequal.
  auto operator<=>(const Card &) const = default;
};

// Stream-insertion operator for a Card; returns the stream to allow chaining.
// Only declared here — the output format is determined by the definition elsewhere.
std::ostream &operator<<(std::ostream &os, const Card &card);

// Named shorthands for the cards of suit 0 ("r") and suit 1 ("y"), ranks 0..4.
// Only suit and rank are given; the remaining Card members are value-initialized.
// `inline` gives each constant a single identity across all translation units
// that include this header.
inline constexpr Card r0 = {0, 0};
inline constexpr Card r1 = {0, 1};
inline constexpr Card r2 = {0, 2};
inline constexpr Card r3 = {0, 3};
inline constexpr Card r4 = {0, 4};
inline constexpr Card y0 = {1, 0};
inline constexpr Card y1 = {1, 1};
inline constexpr Card y2 = {1, 2};
inline constexpr Card y3 = {1, 3};
inline constexpr Card y4 = {1, 4};

/**
 * To store:
 * - Draw pile size
 * - Distribution of cards
 *      - Which cards exist?
 * - Number of clues
 */

// Current value of every play stack: one rank_t per suit.
template <size_t num_suits>
using Stacks = std::array<rank_t, num_suits>;

// Stream-insertion operator for a set of stacks; only declared here.
// NOTE(review): Stacks is an alias of std::array<std::uint8_t, N>, so
// argument-dependent lookup does not search namespace Hanabi for this
// overload — it is presumably only found by callers inside the namespace. Confirm.
template <size_t num_suits>
std::ostream& operator<<(std::ostream &os, const Stacks<num_suits> &stacks);

/**
 * A card together with a count, as stored in HanabiState's draw pile.
 *
 * Members are value-initialized so that a default-initialized object is
 * well-defined; the struct remains an aggregate (`CardMultiplicity{card, n}`).
 */
struct CardMultiplicity {
  Card card{};
  // Presumably the number of identical copies of `card` this entry stands for — TODO confirm.
  std::uint8_t multiplicity{};

  // Memberwise comparison: first by card, then by multiplicity.
  auto operator<=>(const CardMultiplicity &) const = default;
};

// Trait that picks the container type for one row of a CardArray:
// a plain std::array for every element type ...
template<class Element>
struct InnerCardArray {
    template<std::size_t Length>
    using array_t = std::array<Element, Length>;
};

// ... except for bool, where a std::bitset of the same length is used instead.
template<>
struct InnerCardArray<bool> {
    template<std::size_t Length>
    using array_t = std::bitset<Length>;
};

/**
 * Fixed-size table holding one value of type T per card, addressed by a Card.
 *
 * Storage is one row per suit (num_suits rows), each row having
 * starting_card_rank entries; the row type is chosen by InnerCardArray<T>.
 * Member functions are only declared here; their definitions live elsewhere.
 */
template <suit_t num_suits, typename T> struct CardArray {
    using value_type = T;

    // Value-initializes all entries (see the `{}` initializer on _array).
    CardArray() = default;
    // Presumably sets every entry to default_val — TODO confirm against the definition.
    explicit CardArray(value_type default_val);

    // Presumably overwrites every entry with val — TODO confirm against the definition.
    void fill(value_type val);

    // Read-only access to the entry belonging to `card`.
    const value_type &operator[](const Card &card) const;

    // Mutable access to the entry belonging to `card`.
    // NOTE(review): for T = bool the rows are std::bitset, whose operator[]
    // does not yield a bool& / const bool& — verify that the definitions of
    // both operator[] overloads are usable for that case.
    value_type &operator[](const Card &card);

    // Memberwise comparison of the underlying storage.
    auto operator<=>(const CardArray &) const = default;

private:
    // Row type: std::array<T, starting_card_rank>, or std::bitset<starting_card_rank> for bool.
    using inner_array_t = typename InnerCardArray<T>::template array_t<starting_card_rank>;
    std::array<inner_array_t , num_suits> _array {};
};

// Kinds of actions that can occur in a game record.
// The numeric values are fixed explicitly; presumably they mirror the action
// codes of the external game format that is parsed elsewhere — TODO confirm.
enum class ActionType {
    play = 0,
    discard = 1,
    // Generic clue; shares its value with color_clue.
    clue = 2,
    color_clue = clue,
    rank_clue = 3,
    end_game = 4,
    vote_terminate = 10,
};

// Record returned by play()/discard() and consumed by revert_play()/revert_discard().
// All members are value-initialized by default.
struct BacktrackAction {
  // The card that was discarded or played
  // (the member is named `discarded` but is used for both kinds of action)
  Card discarded{};
  // Index of card in hand that was discarded or played
  hand_index_t index{};
  // Multiplicity of new draw (needed for probability calculations)
  hand_index_t multiplicity{};
};

/**
 * Abstract interface implemented by every HanabiState instantiation, so that
 * states can be handled without knowing their template arguments.
 * All operations are pure virtual; their semantics are defined by the implementation.
 */
class HanabiStateIF {
public:
    // Runs the backtracking evaluation and returns a double.
    // NOTE(review): the meaning of `depth` and of the result (presumably a
    // probability) is not visible in this header — confirm.
    virtual double backtrack(size_t depth) = 0;

    // Performs a clue action.
    virtual void clue() = 0;
    // Discards / plays the card at position `index` and returns the
    // information needed to revert the action later.
    virtual BacktrackAction discard(hand_index_t index) = 0;
    virtual BacktrackAction play(hand_index_t index) = 0;

    // Looks up `card` in a hand and returns a hand index.
    // NOTE(review): which hand is searched and what is returned when the
    // card is absent is not visible here — confirm.
    [[nodiscard]] virtual hand_index_t find_card_in_hand(const Card& card) const = 0;
    // Predicates on a card with respect to the current state.
    [[nodiscard]] virtual bool is_trash(const Card& card) const = 0;
    [[nodiscard]] virtual bool is_playable(const Card& card) const = 0;

    // Counter of enumerated states (statistics).
    [[nodiscard]] virtual std::uint64_t enumerated_states() const = 0;

    // Normalizes the draw pile and the tracked card positions.
    virtual void normalize_draw_and_positions() = 0;

    // Virtual destructor: objects may be destroyed through a base pointer.
    virtual ~HanabiStateIF() = default;

protected:
    // Writes a textual representation of the state to `os`.
    virtual void print(std::ostream& os) const = 0;

    // Granted access to the protected print(); presumably forwards to it — TODO confirm.
    friend std::ostream& operator<<(std::ostream&, HanabiStateIF const&);
};

/**
 * Concrete game state for a fixed number of suits, players and hand size.
 *
 * Implements HanabiStateIF; every override is marked `final`. The member
 * functions are only declared here — their definitions are expected in
 * "game_state.hpp", which is included at the end of this header.
 *
 * @tparam num_suits   number of suits (number of play stacks)
 * @tparam num_players number of hands
 * @tparam hand_size   number of card slots per hand
 */
template <suit_t num_suits, player_t num_players, hand_index_t hand_size>
class HanabiState : public HanabiStateIF {
public:
    // Creates a state in which every member is value-initialized.
    HanabiState() = default;
    // Builds a state from a deck of cards; the setup logic lives in the definition.
    explicit HanabiState(const std::vector<Card>& deck);

    double backtrack(size_t depth) final;

    void clue() final;
    BacktrackAction play(hand_index_t index) final;
    BacktrackAction discard(hand_index_t index) final;

    // Inverse operations of clue() / play() / discard(). The revert functions
    // for play and discard take the BacktrackAction returned by the forward call.
    void revert_clue();
    // `was_on_8_clues`: presumably tells whether the clue count was already at
    // its maximum before the play, so that a gained clue is undone correctly — TODO confirm.
    void revert_play(const BacktrackAction &action, bool was_on_8_clues);
    void revert_discard(const BacktrackAction &action);

    [[nodiscard]] hand_index_t find_card_in_hand(const Card& card) const final;
    [[nodiscard]] bool is_trash(const Card& card) const final;
    [[nodiscard]] bool is_playable(const Card& card) const final;

    [[nodiscard]] std::uint64_t enumerated_states() const final;

    void normalize_draw_and_positions() final;

    // NOTE(review): HanabiStateIF declares no comparison operators and
    // std::bitset provides no operator<=>, so this defaulted comparison (and
    // the operator== it implies) is expected to be implicitly deleted — confirm
    // before relying on comparing states.
    auto operator<=>(const HanabiState &) const = default;

protected:
    void print(std::ostream& os) const final;

private:
    // Shared implementations of play/discard; the template flag selects
    // whether the tracked card positions are updated as well.
    template<bool update_card_positions> BacktrackAction play_and_potentially_update(hand_index_t index);
    template<bool update_card_positions> BacktrackAction discard_and_potentially_update(hand_index_t index);

    // Draws a replacement card into hand slot `index`, and its inverse.
    template<bool update_card_positions> hand_index_t draw(hand_index_t index);
    void revert_draw(hand_index_t index, Card discarded_card);

    // Advance / rewind the player to move.
    void incr_turn();
    void decr_turn();

    player_t _turn{};
    clue_t _num_clues{};
    std::uint8_t _weighted_draw_pile_size{};
    Stacks<num_suits> _stacks{};
    std::array<std::array<Card, hand_size>, num_players> _hands{};
    std::list<CardMultiplicity> _draw_pile{};
    std::uint8_t _endgame_turns_left{};

    // Largest std::uint8_t value; presumably stored in _endgame_turns_left
    // while the endgame has not started — TODO confirm.
    static constexpr std::uint8_t no_endgame = std::numeric_limits<std::uint8_t>::max();

    // This will save the card positions of all cards that are in the draw pile when we start backtracking
    CardArray<num_suits, boost::container::static_vector<player_t, max_card_duplicity>> _card_positions_draw;
    // This will indicate whether cards that were in hands initially still are in hands
    std::array<std::bitset<hand_size>, num_players> _card_positions_hands;

    // A list of cards (set up once upon initialization) of all good cards that were in starting hands
    // NOTE(review): the member name says "draw_pile" while the comment says "starting hands" — confirm which is meant.
    std::array<boost::container::static_vector<Card, hand_size>, num_players> _good_cards_in_initial_draw_pile;

    // further statistics that we might want to keep track of
    std::uint8_t _pace{};
    std::uint8_t _score{};

    std::uint64_t _enumerated_states {};
};

/**
 * Tells whether two states are equal once the order of their draw piles is ignored.
 *
 * Both states are taken by value, so sorting the draw piles here does not
 * affect the caller's objects. The draw piles are sorted by
 * (suit, rank, multiplicity) and the states are then compared with ==.
 *
 * The template parameters are declared `auto` so that they always take the
 * exact types of HanabiState's own template parameters. With hard-coded
 * parameter types that differ from the class template's, template argument
 * deduction from a HanabiState argument cannot succeed.
 *
 * NOTE(review): this function reads the private member `_draw_pile` without
 * being a friend of HanabiState, and it relies on `operator==` of HanabiState
 * being usable. Both need to be addressed in the class before this template
 * can be instantiated — confirm.
 *
 * @return true if the states compare equal after sorting both draw piles
 */
template <auto num_suits, auto num_players, auto hand_size>
bool same_up_to_discard_permutation(HanabiState<num_suits, num_players, hand_size> state1, HanabiState<num_suits, num_players, hand_size> state2) {
    // Strict weak ordering: lexicographic on (suit, rank, multiplicity).
    // The bookkeeping flags of Card deliberately play no role here, as before.
    const auto by_suit_rank_multiplicity = [](const CardMultiplicity &lhs, const CardMultiplicity &rhs) -> bool {
        return std::tie(lhs.card.suit, lhs.card.rank, lhs.multiplicity)
             < std::tie(rhs.card.suit, rhs.card.rank, rhs.multiplicity);
    };
    state1._draw_pile.sort(by_suit_rank_multiplicity);
    state2._draw_pile.sort(by_suit_rank_multiplicity);
    return state1 == state2;
}


}

#include "game_state.hpp"

#endif // DYNAMIC_PROGRAM_GAME_STATE_H
initial commit of game state 2023-08-04 16:28:41 +02:00			`#ifndef DYNAMIC_PROGRAM_GAME_STATE_H`
			`#define DYNAMIC_PROGRAM_GAME_STATE_H`

			`#include <array>`
			`#include <cstdint>`
			`#include <algorithm>`
			`#include <cstddef>`
			`#include <bitset>`
			`#include <limits>`
			`#include <optional>`
			`#include <boost/container/static_vector.hpp>`
			`#include <list>`
			`#include <ostream>`


implement downloading games and parsing deck 2023-08-05 00:34:31 +02:00			`namespace Hanabi {`

initial commit of game state 2023-08-04 16:28:41 +02:00			`using rank_t = std::uint8_t;`
			`using suit_t = std::uint8_t;`
			`using clue_t = std::uint8_t;`
			`using player_t = std::int8_t;`
code cleanup (but printing currently bugged) 2023-08-06 23:12:44 +02:00			`using hand_index_t = std::uint8_t;`
initial commit of game state 2023-08-04 16:28:41 +02:00
			`using state_t = std::uint32_t;`

			`/**`
			`* We will generally assume that stacks are played from n to 0`
			`* Playing a 0 will yield a clue`
			`* Therefore, for the default hanabi, we will play 4,3,2,1,0 in that order`
			`* on each stack. A stack with no cards played implicitly has value 5 on it`
			`* This is just easier to implement, since then the remaining number of cards`
			`* to be played is always the current number of the stack`
			`*/`
			`constexpr rank_t starting_card_rank = 5;`
			`constexpr suit_t max_suit_index = 5;`
			`constexpr size_t max_card_duplicity = 3;`
			`constexpr player_t draw_pile = -1;`
			`constexpr player_t trash_or_play_stack = -2;`
			`constexpr clue_t max_num_clues = 8;`

implement reading from file. cleanup 2023-08-05 11:55:46 +02:00			`constexpr std::array<std::string, 6> suit_initials{"r", "y", "g", "b", "p", "t"};`
initial commit of game state 2023-08-04 16:28:41 +02:00
			`struct Card {`
			`suit_t suit;`
			`rank_t rank;`
set up initial card positions 2023-08-07 01:51:24 +02:00			`bool was_in_initial_hand;`
track card positions 2023-08-07 10:36:03 +02:00			`bool initial_trash;`
initial commit of game state 2023-08-04 16:28:41 +02:00
implement downloading games and parsing deck 2023-08-05 00:34:31 +02:00			`Card &operator++();`
clean up header 2023-08-04 16:55:41 +02:00			`const Card operator++(int);`
initial commit of game state 2023-08-04 16:28:41 +02:00
implement downloading games and parsing deck 2023-08-05 00:34:31 +02:00			`auto operator<=>(const Card &) const = default;`
initial commit of game state 2023-08-04 16:28:41 +02:00			`};`

code cleanup (but printing currently bugged) 2023-08-06 23:12:44 +02:00			`std::ostream &operator<<(std::ostream &os, const Card &card);`
initial commit of game state 2023-08-04 16:28:41 +02:00
more code cleanup: remove copy member from card 2023-08-06 22:20:20 +02:00			`constexpr Card r0 = {0, 0};`
			`constexpr Card r1 = {0, 1};`
			`constexpr Card r2 = {0, 2};`
			`constexpr Card r3 = {0, 3};`
			`constexpr Card r4 = {0, 4};`
			`constexpr Card y0 = {1, 0};`
			`constexpr Card y1 = {1, 1};`
			`constexpr Card y2 = {1, 2};`
			`constexpr Card y3 = {1, 3};`
			`constexpr Card y4 = {1, 4};`
initial commit of game state 2023-08-04 16:28:41 +02:00
			`/**`
			`* To store:`
			`* - Draw pile size`
			`* - Distribution of cards`
			`* - Which cards exist?`
			`* - Number of clues`
			`*/`

fix output operator for stack 2023-08-07 10:45:11 +02:00			`template <size_t num_suits>`
code cleanup (but printing currently bugged) 2023-08-06 23:12:44 +02:00			`using Stacks = std::array<rank_t, num_suits>;`
initial commit of game state 2023-08-04 16:28:41 +02:00
fix output operator for stack 2023-08-07 10:45:11 +02:00			`template <size_t num_suits>`
			`std::ostream& operator<<(std::ostream &os, const Stacks<num_suits> &stacks);`
initial commit of game state 2023-08-04 16:28:41 +02:00
			`struct CardMultiplicity {`
			`Card card;`
			`std::uint8_t multiplicity;`

implement downloading games and parsing deck 2023-08-05 00:34:31 +02:00			`auto operator<=>(const CardMultiplicity &) const = default;`
initial commit of game state 2023-08-04 16:28:41 +02:00			`};`

set up initial card positions 2023-08-07 01:51:24 +02:00			`template<typename T>`
			`struct InnerCardArray {`
			`template<size_t N>`
			`using array_t = std::array<T, N>;`
			`};`

			`template<>`
			`struct InnerCardArray<bool> {`
			`template<size_t N>`
			`using array_t = std::bitset<N>;`
			`};`

code cleanup (but printing currently bugged) 2023-08-06 23:12:44 +02:00			`template <suit_t num_suits, typename T> struct CardArray {`
remove unneeded template parameter. implement game getter and normalization 2023-08-06 10:23:29 +02:00			`using value_type = T;`
initial commit of game state 2023-08-04 16:28:41 +02:00
remove unneeded template parameter. implement game getter and normalization 2023-08-06 10:23:29 +02:00			`CardArray() = default;`
			`explicit CardArray(value_type default_val);`
initial commit of game state 2023-08-04 16:28:41 +02:00
set up initial card positions 2023-08-07 01:51:24 +02:00			`void fill(value_type val);`

remove unneeded template parameter. implement game getter and normalization 2023-08-06 10:23:29 +02:00			`const value_type &operator[](const Card &card) const;`
proper constructor for hanabi state 2023-08-05 12:19:34 +02:00
remove unneeded template parameter. implement game getter and normalization 2023-08-06 10:23:29 +02:00			`value_type &operator[](const Card &card);`

			`auto operator<=>(const CardArray &) const = default;`
initial commit of game state 2023-08-04 16:28:41 +02:00
			`private:`
set up initial card positions 2023-08-07 01:51:24 +02:00			`using inner_array_t = typename InnerCardArray<T>::template array_t<starting_card_rank>;`
			`std::array<inner_array_t , num_suits> _array {};`
initial commit of game state 2023-08-04 16:28:41 +02:00			`};`

parse actions from hanab.live 2023-08-05 13:04:51 +02:00			`enum class ActionType {`
			`play = 0,`
			`discard = 1,`
			`clue = 2,`
			`color_clue = 2,`
			`rank_clue = 3,`
			`end_game = 4,`
			`vote_terminate = 10,`
			`};`
initial commit of game state 2023-08-04 16:28:41 +02:00
parse actions from hanab.live 2023-08-05 13:04:51 +02:00			`struct BacktrackAction {`
implement backtracking approach 2023-08-06 11:54:57 +02:00			`// The card that was discarded or played`
implement downloading games and parsing deck 2023-08-05 00:34:31 +02:00			`Card discarded{};`
implement backtracking approach 2023-08-06 11:54:57 +02:00			`// Index of card in hand that was discarded or played`
code cleanup (but printing currently bugged) 2023-08-06 23:12:44 +02:00			`hand_index_t index{};`
implement backtracking approach 2023-08-06 11:54:57 +02:00			`// Multiplicity of new draw (needed for probability calculations)`
code cleanup (but printing currently bugged) 2023-08-06 23:12:44 +02:00			`hand_index_t multiplicity{};`
initial commit of game state 2023-08-04 16:28:41 +02:00			`};`

add virtual interface for all hanabi states 2023-08-06 22:06:58 +02:00			`class HanabiStateIF {`
			`public:`
			`virtual double backtrack(size_t depth) = 0;`

			`virtual void clue() = 0;`
code cleanup (but printing currently bugged) 2023-08-06 23:12:44 +02:00			`virtual BacktrackAction discard(hand_index_t index) = 0;`
			`virtual BacktrackAction play(hand_index_t index) = 0;`
add virtual interface for all hanabi states 2023-08-06 22:06:58 +02:00
code cleanup (but printing currently bugged) 2023-08-06 23:12:44 +02:00			`[[nodiscard]] virtual hand_index_t find_card_in_hand(const Card& card) const = 0;`
add virtual interface for all hanabi states 2023-08-06 22:06:58 +02:00			`[[nodiscard]] virtual bool is_trash(const Card& card) const = 0;`
			`[[nodiscard]] virtual bool is_playable(const Card& card) const = 0;`

			`[[nodiscard]] virtual std::uint64_t enumerated_states() const = 0;`

			`virtual void normalize_draw_and_positions() = 0;`

			`virtual ~HanabiStateIF() = default;`

			`protected:`
			`virtual void print(std::ostream& os) const = 0;`

			`friend std::ostream& operator<<(std::ostream&, HanabiStateIF const&);`
			`};`

code cleanup (but printing currently bugged) 2023-08-06 23:12:44 +02:00			`template <suit_t num_suits, player_t num_players, hand_index_t hand_size>`
add virtual interface for all hanabi states 2023-08-06 22:06:58 +02:00			`class HanabiState : public HanabiStateIF {`
initial commit of game state 2023-08-04 16:28:41 +02:00			`public:`
proper constructor for hanabi state 2023-08-05 12:19:34 +02:00			`HanabiState() = default;`
			`explicit HanabiState(const std::vector<Card>& deck);`

add virtual interface for all hanabi states 2023-08-06 22:06:58 +02:00			`double backtrack(size_t depth) final;`
implement backtracking approach 2023-08-06 11:54:57 +02:00
add virtual interface for all hanabi states 2023-08-06 22:06:58 +02:00			`void clue() final;`
code cleanup (but printing currently bugged) 2023-08-06 23:12:44 +02:00			`BacktrackAction play(hand_index_t index) final;`
			`BacktrackAction discard(hand_index_t index) final;`
proper constructor for hanabi state 2023-08-05 12:19:34 +02:00
track card positions 2023-08-07 10:36:03 +02:00			`void revert_clue();`
			`void revert_play(const BacktrackAction &action, bool was_on_8_clues);`
			`void revert_discard(const BacktrackAction &action);`
proper constructor for hanabi state 2023-08-05 12:19:34 +02:00
code cleanup (but printing currently bugged) 2023-08-06 23:12:44 +02:00			`[[nodiscard]] hand_index_t find_card_in_hand(const Card& card) const final;`
add virtual interface for all hanabi states 2023-08-06 22:06:58 +02:00			`[[nodiscard]] bool is_trash(const Card& card) const final;`
			`[[nodiscard]] bool is_playable(const Card& card) const final;`
proper constructor for hanabi state 2023-08-05 12:19:34 +02:00
add virtual interface for all hanabi states 2023-08-06 22:06:58 +02:00			`[[nodiscard]] std::uint64_t enumerated_states() const final;`
implement initialising + doing actions of game state 2023-08-05 13:51:55 +02:00
add virtual interface for all hanabi states 2023-08-06 22:06:58 +02:00			`void normalize_draw_and_positions() final;`
remove unneeded template parameter. implement game getter and normalization 2023-08-06 10:23:29 +02:00
add virtual interface for all hanabi states 2023-08-06 22:06:58 +02:00			`auto operator<=>(const HanabiState &) const = default;`
proper constructor for hanabi state 2023-08-05 12:19:34 +02:00
add virtual interface for all hanabi states 2023-08-06 22:06:58 +02:00			`protected:`
			`void print(std::ostream& os) const final;`
initial commit of game state 2023-08-04 16:28:41 +02:00
add virtual interface for all hanabi states 2023-08-06 22:06:58 +02:00			`private:`
track card positions 2023-08-07 10:36:03 +02:00			`template<bool update_card_positions> BacktrackAction play_and_potentially_update(hand_index_t index);`
			`template<bool update_card_positions> BacktrackAction discard_and_potentially_update(hand_index_t index);`
support striking of cards 2023-08-07 00:06:50 +02:00
track card positions 2023-08-07 10:36:03 +02:00			`template<bool update_card_positions> hand_index_t draw(hand_index_t index);`
code cleanup (but printing currently bugged) 2023-08-06 23:12:44 +02:00			`void revert_draw(hand_index_t index, Card discarded_card);`
proper constructor for hanabi state 2023-08-05 12:19:34 +02:00
			`void incr_turn();`
			`void decr_turn();`

			`player_t _turn{};`
			`clue_t _num_clues{};`
implement backtracking approach 2023-08-06 11:54:57 +02:00			`std::uint8_t _weighted_draw_pile_size{};`
proper constructor for hanabi state 2023-08-05 12:19:34 +02:00			`Stacks<num_suits> _stacks{};`
implement initialising + doing actions of game state 2023-08-05 13:51:55 +02:00			`std::array<std::array<Card, hand_size>, num_players> _hands{};`
proper constructor for hanabi state 2023-08-05 12:19:34 +02:00			`std::list<CardMultiplicity> _draw_pile{};`
add virtual interface for all hanabi states 2023-08-06 22:06:58 +02:00			`std::uint8_t _endgame_turns_left{};`
proper constructor for hanabi state 2023-08-05 12:19:34 +02:00
add virtual interface for all hanabi states 2023-08-06 22:06:58 +02:00			`static constexpr uint8_t no_endgame = std::numeric_limits<uint8_t>::max();`
more assertions 2023-08-06 13:53:18 +02:00
set up initial card positions 2023-08-07 01:51:24 +02:00			`// This will save the card positions of all cards that are in the draw pile when we start backtracking`
			`CardArray<num_suits, boost::container::static_vector<player_t, max_card_duplicity>> _card_positions_draw;`
			`// This will indicate whether cards that were in hands initially still are in hands`
track card positions 2023-08-07 10:36:03 +02:00			`std::array<std::bitset<hand_size>, num_players> _card_positions_hands;`
set up initial card positions 2023-08-07 01:51:24 +02:00
			`// A list of cards (set up once upon initialization) of all good cards that were in starting hands`
			`std::array<boost::container::static_vector<Card, hand_size>, num_players> _good_cards_in_initial_draw_pile;`

proper constructor for hanabi state 2023-08-05 12:19:34 +02:00			`// further statistics that we might want to keep track of`
			`uint8_t _pace{};`
implement backtracking approach 2023-08-06 11:54:57 +02:00			`uint8_t _score{};`
proper constructor for hanabi state 2023-08-05 12:19:34 +02:00
working version done 2023-08-06 15:02:50 +02:00			`std::uint64_t _enumerated_states {};`
proper constructor for hanabi state 2023-08-05 12:19:34 +02:00			`};`
initial commit of game state 2023-08-04 16:28:41 +02:00
comment out card positions member 2023-08-06 14:06:41 +02:00			`template <std::size_t num_suits, player_t num_players, std::size_t hand_size>`
			`bool same_up_to_discard_permutation(HanabiState<num_suits, num_players, hand_size> state1, HanabiState<num_suits, num_players, hand_size> state2) {`
			`auto comp = [](CardMultiplicity &m1, CardMultiplicity &m2) -> bool {`
			`return m1.card.suit < m2.card.suit \|\| (m1.card.suit == m2.card.suit and m1.card.rank < m2.card.rank) \|\|`
			`(m1.card.suit == m2.card.suit and m1.card.rank == m2.card.rank and m1.multiplicity < m2.multiplicity);`
			`};`
			`state1._draw_pile.sort(comp);`
			`state2._draw_pile.sort(comp);`
			`return state1 == state2;`
			`}`

initial commit of game state 2023-08-04 16:28:41 +02:00
implement downloading games and parsing deck 2023-08-05 00:34:31 +02:00			`}`

implement reading from file. cleanup 2023-08-05 11:55:46 +02:00			`#include "game_state.hpp"`

implement downloading games and parsing deck 2023-08-05 00:34:31 +02:00			`#endif // DYNAMIC_PROGRAM_GAME_STATE_H`