from __future__ import annotations from enum import Enum import json class Ch(Enum): Empty = 0 Cross = 1 Circle = 2 def ch_str(ch: Ch, empty = " ") -> str: match ch: case Ch.Empty: return empty case Ch.Cross: return "X" case Ch.Circle: return "O" CH_WIDTH = 2 class Board: def __init__(self, val = 0) -> None: self.val = val def possible_plays(self) -> list[int]: return [i for i in range(9) if (self.val >> i * CH_WIDTH & 0b11) == 0] def clone(self) -> Board: return Board(self.val) def play(self, ch: Ch, i: int): self.val |= ch.value << i * CH_WIDTH def with_play(self, ch: Ch, i: int) -> Board: board = self.clone() board.play(ch, i) return board def rotate(self): idcs = [6, 3, 0, 7, 4, 1, 8, 5, 2] vals = [self.val >> i * CH_WIDTH & 0b11 for i in idcs] self.val = 0 for i, v in enumerate(vals): self.val |= v << i * CH_WIDTH def flip(self): idcs = [6, 7, 8, 3, 4, 5, 0, 1, 2] vals = [self.val >> i * CH_WIDTH & 0b11 for i in idcs] self.val = 0 for i, v in enumerate(vals): self.val |= v << i * CH_WIDTH def key(self) -> int: return self.val def place(self, i: int) -> Ch: return Ch(self.val >> i * CH_WIDTH & 0b11) def player_has_won(self, ch: Ch) -> bool: combos = [ (0, 1, 2), (3, 4, 5), (6, 7, 8), (0, 3, 6), (1, 4, 7), (2, 5, 8), (0, 4, 8), (2, 4, 6), ] for combo in combos: if all(self.place(p) == ch for p in list(combo)): return True return False def is_draw(self) -> bool: return len(self.possible_plays()) == 0 def __repr__(self) -> str: # print(f"{self.val:b}".rjust(18, "0")) return "[" + "".join(ch_str(Ch(self.val >> i * CH_WIDTH & 0b11)) for i in range(9)).replace(" ", ".") + "]" def print(self) -> None: s = [ch_str(Ch(self.val >> i * CH_WIDTH & 0b11), empty=f"\x1b[0;37m{i}\x1b[0m") for i in range(9)] print("#############") print(f"# {s[0]} | {s[1]} | {s[2]} #") print("#---+---+---#") print(f"# {s[3]} | {s[4]} | {s[5]} #") print("#---+---+---#") print(f"# {s[6]} | {s[7]} | {s[8]} #") print("#############") START_WEIGHT = 20 REWARD = 1 PUNUSHMENT = 1 class AiPlayer: def __init__(self, ch: Ch) -> None: self.choices: dict[int, int] = {} self.current_choices: list[int] = [] self.ch = ch def clear_choices(self): self.current_choices = [] def reward(self): for choice in self.current_choices: self.choices[choice] += REWARD def punish(self): for choice in self.current_choices: self.choices[choice] -= PUNUSHMENT def interned_choice(self, choice: Board) -> Board: for _ in range(2): for _ in range(4): key = choice.key() if key in self.choices: return choice choice.rotate() choice.flip() key = choice.key() self.choices[key] = START_WEIGHT return choice def make_play(self, board: Board) -> None: possible_choices = [(idx, board.with_play(self.ch, idx)) for idx in board.possible_plays()] candiate_weigth = 0 candidate_idcs: list[tuple[int, int]] = [] for idx, choice in possible_choices: choice = self.interned_choice(choice) key = choice.key() if self.choices[key] > candiate_weigth: candiate_weigth = self.choices[key] candidate_idcs = [(idx, key)] elif self.choices[key] == candiate_weigth: candidate_idcs.append((idx, key)) (choice_idx, choice_key) = candidate_idcs[0] self.current_choices.append(choice_key) board.play(self.ch, choice_idx) def save_to_file(self): with open("ai.json", "w") as file: file.write(json.dumps(self.choices)) def load_from_file(self): with open("ai.json", "r") as file: vs = json.loads(file.read()) self.choices = {} for key in vs: self.choices[int(key)] = vs[key] class Game: def __init__(self) -> None: self.current_plays = [] self.weights = {} p0 = AiPlayer(Ch.Cross) games = 0 while True: print(f"\n\nGame #{games}") board = Board() p0.clear_choices() while True: print("AI's turn") p0.make_play(board) board.print() if board.player_has_won(Ch.Cross): print("AI won!") print("Rewarding AI...") p0.reward() break print("Your turn (0..8)") if board.is_draw(): print("Draw!") break possible_choices = board.possible_plays() should_restart = False while True: text = input("> ") if text == ".save": p0.save_to_file() continue elif text == ".load": p0.load_from_file() choice = 0 should_restart = True continue elif text == ".restart": choice = 0 should_restart = True break choice = int(text) if choice not in possible_choices: print("invalid choice") else: break if should_restart: break board.play(Ch.Circle, choice) board.print() if board.player_has_won(Ch.Circle): print("Player won!") print("Punishing AI...") p0.punish() break games += 1