Initial commit

cchung 2023-08-25 14:34:55 +00:00
commit da4a3bc4c0
15 changed files with 503 additions and 0 deletions

9
.commit_template Normal file

@@ -0,0 +1,9 @@
(Commit summary. Replace this with a one-line description of this commit.)
What I changed
(Replace this with a description of what you changed in this commit. This should be 1-2 sentences.)
Why I changed it
(Describe why you made these changes. Were you working toward a goal? Did you reorganize your code? This should be 1-2 sentences.)
Estimate for remaining time to finish assignment: [REPLACE WITH TIME ESTIMATE]

3
.gitignore vendored Normal file

@@ -0,0 +1,3 @@
*.swp
*.swo
**/__pycache__/*

34
nim/game_stub.py Normal file

@@ -0,0 +1,34 @@
class NimGameStub:
"""A stub is a minimal version of a class which stands in for the
real class, which hasn't yet been written. The stub has all the correct
methods, and their inputs and outputs are the right kind of thing,
but it doesn't really do anything.
"""
def get_initial_state(self):
return {
"board": [1, 3, 5, 7],
"first_player": True
}
def get_next_state(self, state, action):
next_state = {
"board": state["board"].copy(),
"first_player": not state["first_player"],
}
return next_state
def get_actions(self, state):
return [
(0, 0),
(1, 0), (1, 1),
(2, 0), (2, 1), (2, 2),
(3, 0), (3, 1), (3, 2), (3, 3),
]
def get_reward(self, state):
return 0
def is_over(self, state):
return False
def get_objective(self, state):
return max if state["first_player"] else min
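
Since the stub above is, at this point, the only description of the game interface, a small sketch of driving it by hand may help. This is not part of the commit, and the values shown are just the stub's hard-coded placeholders.

```python
# Sketch only: exercising the stub's interface.
from nim.game_stub import NimGameStub

game = NimGameStub()
state = game.get_initial_state()            # {"board": [1, 3, 5, 7], "first_player": True}
action = game.get_actions(state)[0]         # (0, 0) -- a placeholder (row, lines_to_remove) pair
state = game.get_next_state(state, action)  # board is unchanged; only "first_player" flips
print(game.get_reward(state))               # always 0 for the stub
print(game.is_over(state))                  # always False for the stub
```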

35
nim/player.py Normal file

@@ -0,0 +1,35 @@
from nim.game_stub import NimGameStub
from strategy.lookahead_strategy import LookaheadStrategy
class HumanNimPlayer:
def __init__(self, name):
self.name = name
self.game = NimGameStub()
def choose_action(self, state):
actions = self.game.get_actions(state)
for i, action in enumerate(actions):
row, lines_to_remove = action
print(f"{i}. Remove {lines_to_remove} from row {row}.")
choice = self.get_int(len(actions))
return actions[choice]
def get_int(self, maximum):
while True:
response = input("> ")
if response.isdigit():
value = int(response)
if value < maximum:
return value
print("Invalid input.")
class ComputerNimPlayer:
def __init__(self, name):
self.name = name
self.strategy = LookaheadStrategy(NimGameStub(), max_depth=3, deterministic=False)
def choose_action(self, state):
action = self.strategy.choose_action(state)
row, lines_to_remove = action
print(f"{self.name} removes {lines_to_remove} from row {row}")
return action

32
nim/view.py Normal file

@@ -0,0 +1,32 @@
from nim.game_stub import NimGameStub
class NimView:
def __init__(self, player0, player1):
self.players = [player0, player1]
self.game = NimGameStub()
def greet(self):
print(f"{self.players[0].name} and {self.players[1].name}, welcome to Nim.")
def show_board(self, state):
for lines_in_row in state["board"]:
print("| " * lines_in_row)
def get_action(self, state):
self.show_board(state)
player = self.get_current_player(state)
return player.choose_action(state)
def get_current_player(self, state):
if state["first_player"]:
return self.players[0]
else:
return self.players[1]
def conclude(self, state):
self.show_board(state)
if self.game.get_reward(state) > 0:
winner = self.players[0]
else:
winner = self.players[1]
print(f"Congratulations, {winner.name}!")

35
notes.md Normal file

@@ -0,0 +1,35 @@
# Tic Tac Toe notes
## Checkpoint 1 Notes
Which class is responsible for each of the following behaviors?
For each, explain how the behavior is accomplished.
### Checking to see whether the game is over
### Determining which actions are available at a particular state
### Showing the board
### Choosing which action to play on a turn
## Checkpoint 2 Notes
### TTT Strategy
For each of the following board states, if you are playing as X
and it's your turn, which action would you take? Why?
    | O | O | | O | X | X | O |
    ---+---+--- ---+---+--- ---+---+--- ---+---+---
    X | X | | X | X | O | O | |
    ---+---+--- ---+---+--- ---+---+--- ---+---+---
    | | | | O | | | |
### Initial game state
You can get the initial game state using `game.get_initial_state()`.
What is the current and future reward for this state? What does this mean?
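
One way to poke at this from a Python shell (a sketch based on this commit's layout; `max_depth` is only there to keep the lookahead small):

```python
from ttt.game import TTTGame
from strategy.lookahead_strategy import LookaheadStrategy

game = TTTGame()
state = game.get_initial_state()
print(game.get_reward(state))  # the current reward by itself

strategy = LookaheadStrategy(game, max_depth=3)
print(strategy.get_current_and_future_reward(state))  # current + future reward
```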

15
play_nim.py Normal file

@@ -0,0 +1,15 @@
from nim.game_stub import NimGameStub
from nim.view import NimView
from nim.player import HumanNimPlayer, ComputerNimPlayer
player0 = HumanNimPlayer(input("What's your name? "))
player1 = ComputerNimPlayer("Robot")
view = NimView(player0, player1)
game = NimGameStub()
view.greet()
state = game.get_initial_state()
while not game.is_over(state):
action = view.get_action(state)
state = game.get_next_state(state, action)
view.conclude(state)

15
play_ttt.py Normal file

@@ -0,0 +1,15 @@
from ttt.game import TTTGame
from ttt.view import TTTView
from ttt.player import TTTHumanPlayer, TTTComputerPlayer
player0 = TTTHumanPlayer("Player 1")
player1 = TTTHumanPlayer("Player 2")
game = TTTGame()
view = TTTView(player0, player1)
state = game.get_initial_state()
view.greet()
while not game.is_over(state):
action = view.get_action(state)
state = game.get_next_state(state, action)
view.conclude(state)

33
poetry.lock generated Normal file

@@ -0,0 +1,33 @@
# This file is automatically @generated by Poetry 1.4.0 and should not be changed by hand.
[[package]]
name = "click"
version = "8.1.3"
description = "Composable command line interface toolkit"
category = "main"
optional = false
python-versions = ">=3.7"
files = [
{file = "click-8.1.3-py3-none-any.whl", hash = "sha256:bb4d8133cb15a609f44e8213d9b391b0809795062913b383c62be0ee95b1db48"},
{file = "click-8.1.3.tar.gz", hash = "sha256:7682dc8afb30297001674575ea00d1814d808d6a36af415a82bd481d37ba7b8e"},
]
[package.dependencies]
colorama = {version = "*", markers = "platform_system == \"Windows\""}
[[package]]
name = "colorama"
version = "0.4.6"
description = "Cross-platform colored terminal text."
category = "main"
optional = false
python-versions = "!=3.0.*,!=3.1.*,!=3.2.*,!=3.3.*,!=3.4.*,!=3.5.*,!=3.6.*,>=2.7"
files = [
{file = "colorama-0.4.6-py2.py3-none-any.whl", hash = "sha256:4f1d9991f5acc0ca119f9d443620b77f9d6b33703e51011c16baf57afb285fc6"},
{file = "colorama-0.4.6.tar.gz", hash = "sha256:08695f5cb7ed6e0531a20572697297273c47b8cae5a63ffc6d6ed5c201be6e44"},
]
[metadata]
lock-version = "2.0"
python-versions = "^3.11"
content-hash = "101b8706a8befcaae12f34f371e35e5bc371645d8ce2747a4b32cca44ff8e832"

16
pyproject.toml Normal file

@@ -0,0 +1,16 @@
[tool.poetry]
name = "lab_tic_tac_toe"
version = "0.1.0"
description = ""
authors = ["Chris Proctor <chris@chrisproctor.net>"]
license = "MIT"
[tool.poetry.dependencies]
python = "^3.11"
click = "^8.1.3"
[tool.poetry.dev-dependencies]
[build-system]
requires = ["poetry-core>=1.0.0"]
build-backend = "poetry.core.masonry.api"

96
strategy/lookahead_strategy.py Normal file

@@ -0,0 +1,96 @@
from types import MethodType
from random import choice
class LookaheadStrategy:
"""A Strategy which considers the future consequences of an action.
To initialize a LookaheadStrategy, pass in an instance of a game containing
the following methods. These methods encode the rules of the game,
which a LookaheadStrategy needs to know in order to determine which move is best.
- get_next_state: state, action -> state
- get_actions: state -> [actions]
- get_reward: state -> int
- is_over: state -> bool
- get_objective: state -> function
Optionally, pass the following arguments to control the behavior of the LookaheadStrategy:
- max_depth: int. A game may be too complex to search the full state tree.
Setting max_depth will set a cutoff on how far ahead the LookaheadStrategy will look.
- deterministic: bool. It's possible that there are multiple equally-good actions.
When deterministic is True, LookaheadStrategy will always choose the first of the
equally-good actions, so that LookaheadStrategy will always play out the same game.
When deterministic is False, LookaheadStrategy will choose randomly from all actions
which are equally-good.
- explain: bool. When set to True, LookaheadStrategy will print out its reasoning.
"""
def __init__(self, game, max_depth=None, deterministic=True, explain=False):
self.validate_game(game)
self.game = game
self.max_depth = max_depth
self.deterministic = deterministic
self.explain = explain
def choose_action(self, state, depth=0):
"""Given a state, chooses an action.
This is the most important method of a Strategy, corresponding to the situation where
it's a player's turn to play a game and she needs to decide what to do.
A Strategy chooses an action by considering all possible actions, and finding the
total current and future reward which would come from playing each one.
Then we use the game's objective to choose the "best" reward. Usually bigger is better,
but in zero-sum games like tic tac toe, the players want opposite outcomes. One player
wants the reward to be high, while the other wants the reward to be low.
Once we know which reward is best, we choose an action which will lead to that reward.
"""
possible_actions = self.game.get_actions(state)
rewards = {}
for action in possible_actions:
future_state = self.game.get_next_state(state, action)
rewards[action] = self.get_current_and_future_reward(future_state, depth=depth)
objective = self.game.get_objective(state)
best_reward = objective(rewards.values())
best_actions = [action for action in possible_actions if rewards[action] == best_reward]
if self.deterministic:
action = best_actions[0]
else:
action = choice(best_actions)
if self.explain:
self.print_explanation(state, action, rewards[action], depth)
return action
def get_current_and_future_reward(self, state, depth=0):
"""Calculates the reward from this state, and from all future states which would be
reached, assuming all players are using this Strategy.
"""
reward = self.game.get_reward(state)
if (self.max_depth is None or depth <= self.max_depth) and not self.game.is_over(state):
action = self.choose_action(state, depth=depth+1)
future_state = self.game.get_next_state(state, action)
reward += self.get_current_and_future_reward(future_state, depth=depth+1)
return reward
def validate_game(self, game):
"Checks that the game has all the required methods."
required_methods = [
"get_next_state",
"get_actions",
"get_reward",
"is_over",
"get_objective",
]
for method in required_methods:
if not (hasattr(game, method) and isinstance(getattr(game, method), MethodType)):
message = f"Game {game} does not have method {method}."
raise ValueError(message)
def print_explanation(self, state, action, reward, depth):
"""Prints out the current state of exploration of the state tree"""
# Indent deeper lookahead levels so the explanation prints as a tree (plain spaces and a dash as placeholder markers).
indent = '  ' * max(0, depth - 1) + ('- ' if depth > 0 else '')
print(f"{indent}[{reward}] Best action: {action} {state}")

11
strategy/random_strategy.py Normal file

@@ -0,0 +1,11 @@
from random import choice
class RandomStrategy:
"""A Strategy which randomly chooses a move. Not a great choice.
"""
def __init__(self, game):
self.game = game
def choose_action(self, state):
possible_actions = self.game.get_actions(state)
return choice(possible_actions)

61
ttt/game.py Normal file

@@ -0,0 +1,61 @@
class TTTGame:
"Models a tic-tac-toe game."
def get_initial_state(self):
"Returns the game's initial state."
return {
"board": ['-', '-', '-', '-', '-', '-', '-', '-', '-'],
"player_x": True,
}
def get_next_state(self, state, action):
"""Given a state and an action, returns the resulting state.
In the resulting state, the current player's symbol has been placed
in an empty board space, and it is the opposite player's turn.
"""
new_board = state["board"].copy()
new_board[action] = 'X' if state["player_x"] else 'O'
return {
"board": new_board,
"player_x": not state["player_x"],
}
def get_actions(self, state):
"Returns a list of the indices of empty spaces"
return [index for index in range(9) if state["board"][index] == '-']
def is_over(self, state):
"Checks whether the game is over."
return self.board_is_full(state) or self.check_winner(state, 'X') or self.check_winner(state, 'O')
def get_reward(self, state):
"""Determines the reward associated with reaching this state.
For tic-tac-toe, the two opponents each want a different game outcome. So
we set the reward for X winning to 1 and the reward for O winning to -1.
All other states (unfinished games and games which ended in a draw) are worth 0.
"""
if self.check_winner(state, 'X'):
return 1
elif self.check_winner(state, 'O'):
return -1
else:
return 0
def get_objective(self, state):
"""Returns a player's objective, or a function describing what a player wants.
This function should choose the best value from a list. In tic tac toe, the players
want opposite things, so we set X's objective to the built-in function `max`
(which chooses the largest number), and we set O's objective to the built-in function `min`.
"""
return max if state["player_x"] else min
def board_is_full(self, state):
"Checks whether all the spaces in the board are occupied."
for space in state["board"]:
if space == '-':
return False
return True
def check_winner(self, state, symbol):
"Checks whether the player with `symbol` has won the game."
return False
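
The get_reward and get_objective docstrings above explain how the +1/-1 rewards and the max/min objectives encode the two players' opposing goals, but they only become meaningful once check_winner, which this commit leaves as a placeholder returning False, is filled in. A minimal sketch of one possible implementation (an assumption, not necessarily the intended solution):

```python
# Sketch only (not part of this commit): one way the stubbed check_winner
# could be implemented, assuming board indices 0-8 run left to right,
# top to bottom as printed by TTTView.
WINNING_LINES = [
    (0, 1, 2), (3, 4, 5), (6, 7, 8),   # rows
    (0, 3, 6), (1, 4, 7), (2, 5, 8),   # columns
    (0, 4, 8), (2, 4, 6),              # diagonals
]

def check_winner(state, symbol):
    "Returns True if `symbol` occupies every space in some row, column, or diagonal."
    board = state["board"]
    return any(all(board[i] == symbol for i in line) for line in WINNING_LINES)
```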

33
ttt/player.py Normal file

@@ -0,0 +1,33 @@
from click import Choice, prompt
from strategy.random_strategy import RandomStrategy
from ttt.game import TTTGame
import random
class TTTHumanPlayer:
"A human tic tac toe player."
def __init__(self, name):
"Sets up the player."
self.name = name
self.game = TTTGame()
def choose_action(self, state):
"Chooses an action by prompting the player for a choice."
actions = self.game.get_actions(state)
choices = Choice([str(action) for action in actions])
action = int(prompt("> ", type=choices, show_choices=False))
return action
class TTTComputerPlayer:
"A computer tic tac toe player"
def __init__(self, name):
"Sets up the player."
self.name = name
self.strategy = RandomStrategy(TTTGame())
def choose_action(self, state):
"Chooses a random move from the moves available."
action = self.strategy.choose_action(state)
print(f"{self.name} chooses {action}.")
return action

75
ttt/view.py Normal file

@@ -0,0 +1,75 @@
from ttt.game import TTTGame
import click
class TTTView:
"Handles user interaction with a tic-tac-toe game."
greeting = "Welcome to tic-tac-toe"
goodbye = "Well, that's a wrap."
divider = "---+---+---"
x_color = "red"
o_color = "blue"
option_color = "bright_black"
def __init__(self, playerX, playerO):
self.game = TTTGame()
self.players = {
"X": playerX,
"O": playerO,
}
def greet(self):
"Starts a new game by greeting the players."
x_name = self.players['X'].name
o_name = self.players['O'].name
print(self.greeting)
print(f"{x_name} will play as X.")
print(f"{o_name} will play as O.")
def get_action(self, state):
"Shows the board and asks the current player for their choice of action."
self.print_board(state)
current_player_symbol = 'X' if state["player_x"] else 'O'
player = self.players[current_player_symbol]
print(f"{player.name}, it's your move.")
return player.choose_action(state)
def print_board(self, state):
"Prints the current board, showing indices of available spaces"
print(self.format_row(state, [0, 1, 2]))
print(self.divider)
print(self.format_row(state, [3, 4, 5]))
print(self.divider)
print(self.format_row(state, [6, 7, 8]))
def format_row(self, state, indices):
"Returns a string for one row in the board, like ' X | O | X '"
spaces = [self.format_value(state, i) for i in indices]
return f" {spaces[0]} | {spaces[1]} | {spaces[2]} "
def format_value(self, state, index):
"""Formats the value for a single space on the board.
If the game board already has a symbol in that space, formats that value for the Terminal.
If the space is empty, instead formats the index of the space.
"""
if state["board"][index] == 'X':
return click.style('X', fg=self.x_color)
elif state["board"][index] == 'O':
return click.style('O', fg=self.o_color)
else:
return click.style(str(index), fg=self.option_color)
def conclude(self, state):
"""Says goodbye.
"""
self.print_board(state)
if self.game.check_winner(state, 'X'):
winner = self.players['X']
elif self.game.check_winner(state, 'O'):
winner = self.players['O']
else:
winner = None
print(self.goodbye)
if winner:
print(f"Congratulations to {winner.name}.")
else:
print("Nobody won this game.")