games/tictactoe.py

from __future__ import annotations

import pdb
import random
import typing as tp
from dataclasses import dataclass
from functools import cache

import pdbp

import util

# Disable the debugger's "sticky" display mode by default. The hasattr guard
# keeps this a no-op when ``pdb`` exposes no ``DefaultConfig``; presumably the
# ``pdbp`` import above is what provides it -- TODO confirm.
if hasattr(pdb, "DefaultConfig"):
    pdb.DefaultConfig.sticky_by_default = False  # type:ignore

# The mark of one of the two players.
Player = tp.Literal["X", "O"]
# Result of a finished game: the winning player's mark, or "draw".
Winner = Player | tp.Literal["draw"]
# Contents of a single square; " " denotes an empty square.
Square = Player | tp.Literal[" "]
# The nine squares in row-major order (0-2 top row, 3-5 middle, 6-8 bottom).
Board = tuple[Square, Square, Square, Square, Square, Square, Square, Square, Square]
# Value of a position as computed by get_score: 1 (win), 0 (draw) or -1 (loss).
Score = int

# TODO: "get best move"
# TODO: alpha-beta pruning (elegantly)
# TODO: rotational / reflectional board parity (for fewer total nodes)


class QuitException(Exception):
    """Signal that the human player asked to quit (entered "q" at the prompt)."""


@dataclass(frozen=True)
class GameState:
    """Immutable snapshot of a game: whose turn it is plus the board contents."""

    # Mark of the player who moves next.
    player: Player
    # The nine squares in row-major order.
    board: Board

    def __str__(self) -> str:
        """Render the board as a 3x3 grid drawn with box-drawing characters."""
        cells = self.board
        divider = "\n───┼───┼───\n"
        rendered_rows = [
            f" {cells[start]} │ {cells[start + 1]} │ {cells[start + 2]}"
            for start in (0, 3, 6)
        ]
        return divider.join(rendered_rows)


@dataclass(frozen=True)
class Move:
    """A mark placed on one square of the board."""

    # Zero-based board index of the targeted square.
    position: int

    def __str__(self) -> str:
        """Return the square's one-based number, as shown to the human player."""
        one_based = self.position + 1
        return f"{one_based}"


# @cache
def get_valid_moves(state: GameState) -> tp.Iterable[Move]:
    """Return a tuple with one ``Move`` per empty square, in ascending index order."""
    empty_indices = [
        index for index, occupant in enumerate(state.board) if occupant == " "
    ]
    return tuple(Move(position=index) for index in empty_indices)


# @cache
def apply_move(state: GameState, move: Move) -> GameState:
    """Return the state reached when the player to move marks ``move.position``.

    The input state is left untouched; the returned state has the turn handed
    to the other player. The target square is overwritten without checking
    that it is empty.
    """
    # Work on a mutable copy, then freeze it back into a tuple.
    squares = [*state.board]
    squares[move.position] = state.player

    if state.player == "O":
        next_player = "X"
    else:
        next_player = "O"

    return GameState(player=next_player, board=tuple(squares))


# @cache
def get_winner(state: GameState) -> Winner | None:
    """Return the outcome of ``state``, or ``None`` while the game is still open.

    The result is the mark filling a complete row, column or diagonal; failing
    that, ``"draw"`` when no empty square remains; otherwise ``None``.
    """
    # Compass-style names for the 3x3 grid. Unpacking also enforces that the
    # board holds exactly nine squares.
    nw, n, ne, w, mid, e, sw, s, se = state.board

    # Checked in this order: rows, then columns, then the two diagonals.
    lines = (
        (nw, n, ne),
        (w, mid, e),
        (sw, s, se),
        (nw, w, sw),
        (n, mid, s),
        (ne, e, se),
        (nw, mid, se),
        (ne, mid, sw),
    )
    for first, second, third in lines:
        if first != " " and first == second == third:
            return first

    # No completed line: still in progress if any square is empty, else a draw.
    if " " in state.board:
        return None
    return "draw"


# @cache
def get_next_states(state: GameState) -> tuple[tuple[Move, GameState], ...]:
    """Return ``(move, resulting_state)`` pairs for every valid move in ``state``.

    Must only be called on a position that is still in progress; this is
    checked with an assertion.
    """
    assert get_winner(state) is None, "should not be called if game ended"
    successors = [
        (candidate, apply_move(state, candidate))
        for candidate in get_valid_moves(state)
    ]
    return tuple(successors)


# @cache
@util.count_calls
def get_score(target: Player, state: GameState) -> Score:
    """Return the minimax value of ``state`` from ``target``'s point of view.

    Finished games score 1 when ``target`` won, 0 for a draw and -1 when the
    opponent won. An unfinished position takes the best successor score on
    ``target``'s turn and the worst one on the opponent's turn.
    """
    outcome = get_winner(state)
    if outcome == target:
        return 1
    if outcome == "draw":
        return 0
    if outcome is None:
        # Game still open: recurse over every successor position.
        successor_scores = (
            get_score(target, successor) for _, successor in get_next_states(state)
        )
        if state.player == target:
            return max(successor_scores)
        return min(successor_scores)
    # The only remaining outcome is a win for the opponent.
    return -1


# @cache
def get_scored_moves(
    target: Player, state: GameState
) -> tuple[tuple[Score, Move], ...]:
    """Return ``(score, move)`` pairs for every valid move in ``state``.

    Each score is ``get_score`` of the position reached by that move, taken
    from ``target``'s point of view.
    """
    scored = [
        (get_score(target, successor), candidate)
        for candidate, successor in get_next_states(state)
    ]
    return tuple(scored)


def get_human_move(state: GameState) -> Move:
    """Prompt on stdin until the human enters a valid move for ``state``.

    A key showing the square numbers (1-9) is printed once, then the prompt
    repeats until a usable answer is given:

    * a trailing ``b`` drops into the debugger via ``breakpoint()`` and is then
      stripped from the answer;
    * an empty answer re-prompts silently;
    * ``q`` raises ``QuitException``;
    * anything that is not a number, or names a square that is not a valid
      move, prints ``bad move`` and re-prompts.

    Returns:
        The chosen ``Move`` (zero-based position).

    Raises:
        QuitException: if the player enters ``q``.
    """
    print("123\n456\n789")
    while True:
        choice = input("choice: ")
        if choice.endswith("b"):
            # Debug hook: pause in the debugger, then handle the rest normally.
            breakpoint()
            choice = choice[:-1]
        if choice == "":
            continue
        if choice == "q":
            raise QuitException
        try:
            # The player types 1-9; positions are stored zero-based.
            position = int(choice) - 1
        except ValueError:
            # Non-numeric input used to escape as an uncaught ValueError.
            print("bad move")
            continue
        move = Move(position=position)
        if move not in get_valid_moves(state):
            print("bad move")
            continue
        return move


# Opening position: an empty board with "X" to move.
REAL = GameState(player="X", board=(" ",) * 9)

# if __name__ == "__main__":
#     # total_nodes=5478
#     # print(f"{get_score('X', REAL)=}, {CALL_COUNTS['get_score']=}")
#     # best_moves = get_best_moves(REAL)
#     play_human(human_player="X", state=REAL)
tic tac toe monte carlo style 2023-06-01 07:58:45 +00:00			`from __future__ import annotations`

play against a human 2023-06-07 04:35:36 +00:00			`import pdb`
			`import random`
tic tac toe monte carlo style 2023-06-01 07:58:45 +00:00			`import typing as tp`
			`from dataclasses import dataclass`
updates per discussion with chris ariza 2023-06-01 21:22:42 +00:00			`from functools import cache`
tic tac toe monte carlo style 2023-06-01 07:58:45 +00:00
play against a human 2023-06-07 04:35:36 +00:00			`import pdbp`

an attempt at protocoling the module 2023-06-08 03:22:30 +00:00			`import util`

play against a human 2023-06-07 04:35:36 +00:00			`if hasattr(pdb, "DefaultConfig"):`
			`pdb.DefaultConfig.sticky_by_default = False # type:ignore`

tic tac toe monte carlo style 2023-06-01 07:58:45 +00:00			`Player = tp.Literal["X", "O"]`
ab pruning 2023-06-02 05:58:42 +00:00			`Winner = Player \| tp.Literal["draw"]`
updates per discussion with chris ariza 2023-06-01 21:22:42 +00:00			`Square = Player \| tp.Literal[" "]`
tic tac toe monte carlo style 2023-06-01 07:58:45 +00:00			`Board = tuple[Square, Square, Square, Square, Square, Square, Square, Square, Square]`
play against a human 2023-06-07 04:35:36 +00:00			`Score = int`
ab pruning 2023-06-02 05:58:42 +00:00
			`# TODO: "get best move"`
play against a human 2023-06-07 04:35:36 +00:00			`# TODO: alpha-beta pruning (elegantly)`
ab pruning 2023-06-02 05:58:42 +00:00			`# TODO: rotational / reflectional board parity (for less total nodes)`
tic tac toe monte carlo style 2023-06-01 07:58:45 +00:00
play against a human 2023-06-07 04:35:36 +00:00
			`class QuitException(Exception):`
			`pass`

tic tac toe monte carlo style 2023-06-01 07:58:45 +00:00
			`@dataclass(frozen=True)`
			`class GameState:`
			`player: Player`
			`board: Board`

			`def __str__(self):`
			`b = self.board`
			`return (`
			`f" {b[0]} │ {b[1]} │ {b[2]}\n"`
			`"───┼───┼───\n"`
			`f" {b[3]} │ {b[4]} │ {b[5]}\n"`
			`"───┼───┼───\n"`
			`f" {b[6]} │ {b[7]} │ {b[8]}"`
			`)`


			`@dataclass(frozen=True)`
			`class Move:`
			`position: int`

play against a human 2023-06-07 04:35:36 +00:00			`def __str__(self) -> str:`
			`return str(self.position + 1)`

tic tac toe monte carlo style 2023-06-01 07:58:45 +00:00
an attempt at protocoling the module 2023-06-08 03:22:30 +00:00			`# @cache`
			`def get_valid_moves(state: GameState) -> tp.Iterable[Move]:`
tic tac toe monte carlo style 2023-06-01 07:58:45 +00:00			`return tuple(`
ab pruning 2023-06-02 05:58:42 +00:00			`Move(position=i) for i, square in enumerate(state.board) if square == " "`
tic tac toe monte carlo style 2023-06-01 07:58:45 +00:00			`)`


an attempt at protocoling the module 2023-06-08 03:22:30 +00:00			`# @cache`
tic tac toe monte carlo style 2023-06-01 07:58:45 +00:00			`def apply_move(state: GameState, move: Move) -> GameState:`
updates per discussion with chris ariza 2023-06-01 21:22:42 +00:00			`new_player = "X" if state.player == "O" else "O"`
tic tac toe monte carlo style 2023-06-01 07:58:45 +00:00
			`new_board = list(state.board)`
updates per discussion with chris ariza 2023-06-01 21:22:42 +00:00			`new_board[move.position] = state.player`
tic tac toe monte carlo style 2023-06-01 07:58:45 +00:00			`new_board = tuple(new_board)`

			`return GameState(player=new_player, board=new_board)`


an attempt at protocoling the module 2023-06-08 03:22:30 +00:00			`# @cache`
updates per discussion with chris ariza 2023-06-01 21:22:42 +00:00			`def get_winner(state: GameState) -> Winner \| None:`
tic tac toe monte carlo style 2023-06-01 07:58:45 +00:00			`# abc`
			`# def`
			`# ghi`
			`a, b, c, d, e, f, g, h, i = state.board`

			`# horizontal`
			`if a == b == c and a != " ":`
			`return a`
			`if d == e == f and d != " ":`
			`return d`
			`if g == h == i and g != " ":`
			`return g`

			`# vertical`
			`if a == d == g and a != " ":`
			`return a`
			`if b == e == h and b != " ":`
			`return b`
			`if c == f == i and c != " ":`
			`return c`

			`# diagonal`
			`if a == e == i and a != " ":`
			`return a`
			`if c == e == g and c != " ":`
			`return c`

			`# draw`
			`if not any(square == " " for square in state.board):`
ab pruning 2023-06-02 05:58:42 +00:00			`return "draw"`
tic tac toe monte carlo style 2023-06-01 07:58:45 +00:00
			`# no winner`
			`return None`


an attempt at protocoling the module 2023-06-08 03:22:30 +00:00			`# @cache`
play against a human 2023-06-07 04:35:36 +00:00			`def get_next_states(state: GameState) -> tuple[tuple[Move, GameState], ...]:`
ab pruning 2023-06-02 05:58:42 +00:00			`assert get_winner(state) is None, "should not be called if game ended"`
play against a human 2023-06-07 04:35:36 +00:00			`return tuple((move, apply_move(state, move)) for move in get_valid_moves(state))`
tic tac toe monte carlo style 2023-06-01 07:58:45 +00:00

an attempt at protocoling the module 2023-06-08 03:22:30 +00:00			`# @cache`
			`@util.count_calls`
ab pruning 2023-06-02 05:58:42 +00:00			`def get_score(target: Player, state: GameState) -> Score:`
			`winner = get_winner(state)`
			`if winner == target:`
			`return 1`
			`if winner == "draw":`
			`return 0`
			`if winner is not None:`
			`# winner must be the opponent`
			`return -1`
tic tac toe monte carlo style 2023-06-01 07:58:45 +00:00
ab pruning 2023-06-02 05:58:42 +00:00			`agg = max if state.player == target else min`
play against a human 2023-06-07 04:35:36 +00:00			`score = agg(`
			`get_score(target, next_state) for _, next_state in get_next_states(state)`
			`)`
ab pruning 2023-06-02 05:58:42 +00:00			`return score`
tic tac toe monte carlo style 2023-06-01 07:58:45 +00:00
ab pruning 2023-06-02 05:58:42 +00:00
an attempt at protocoling the module 2023-06-08 03:22:30 +00:00			`# @cache`
			`def get_scored_moves(`
			`target: Player, state: GameState`
			`) -> tuple[tuple[Score, Move], ...]:`
			`return tuple(`
			`(get_score(target, state), move) for move, state in get_next_states(state)`
play against a human 2023-06-07 04:35:36 +00:00			`)`


			`def get_human_move(state: GameState) -> Move:`
			`print("123\n456\n789")`
			`while True:`
			`choice = input("choice: ")`
			`if choice.endswith("b"):`
			`breakpoint()`
			`choice = choice[:-1]`
			`if choice == "":`
			`continue`
			`elif choice == "q":`
			`raise QuitException`
			`move = Move(position=int(choice) - 1)`
			`if move not in get_valid_moves(state):`
			`print("bad move")`
			`continue`
			`return move`


ab pruning 2023-06-02 05:58:42 +00:00			`REAL = GameState(player="X", board=(" ",) * 9)`
he doesnt know about dynamic programming :) 2023-06-01 08:05:25 +00:00
an attempt at protocoling the module 2023-06-08 03:22:30 +00:00			`# if __name__ == "__main__":`
			`# # total_nodes=5478`
			`# # print(f"{get_score('X', REAL)=}, {CALL_COUNTS['get_score']=}")`
			`# # best_moves = get_best_moves(REAL)`
			`# play_human(human_player="X", state=REAL)`