"""
An AI player for Othello.
"""
| 4 | + |
| 5 | +# gotta make moves within 10 seconds |
| 6 | + |
| 7 | +import random |
| 8 | +import sys |
| 9 | +import time |
| 10 | +import math |
| 11 | + |
| 12 | +# You can use the functions in othello_shared to write your AI |
| 13 | +from othello_shared import find_lines, get_possible_moves, get_score, play_move |
| 14 | + |
def eprint(*args, **kwargs):
    """Debug helper: print to stderr, keeping stdout clean for the game manager."""
    print(*args, file=sys.stderr, **kwargs)
| 17 | + |
# Utility of a (terminal) state: this player's disc count minus the opponent's.
def compute_utility(board, color):
    """Return `color`'s disc-count advantage on `board`.

    get_score(board) yields (dark_count, light_count); color 1 is dark,
    color 2 is light, so the difference is flipped for light.
    """
    dark, light = get_score(board)
    return dark - light if color == 1 else light - dark
| 23 | + |
# Better heuristic value of board (previously an unimplemented stub returning 0).
def compute_heuristic(board, color):
    """Heuristic evaluation of a (possibly non-terminal) board for `color`.

    Combines two signals:
      * raw disc differential (same quantity as compute_utility, counted
        inline so this function stands alone), and
      * corner occupancy: a corner disc can never be flipped, so each corner
        we own adds +10 and each opponent corner subtracts 10.

    Higher is better for `color`. Works for any square board size.
    Board format (per run_ai): rows of 0 (empty), 1 (dark), 2 (light).
    """
    opponent = 1 if color == 2 else 2

    # Disc differential.
    mine = sum(row.count(color) for row in board)
    theirs = sum(row.count(opponent) for row in board)
    score = mine - theirs

    # Corner bonus: stable discs dominate late-game outcomes.
    n = len(board) - 1
    for corner in (board[0][0], board[0][n], board[n][0], board[n][n]):
        if corner == color:
            score += 10
        elif corner == opponent:
            score -= 10
    return score
| 28 | + |
| 29 | +############ MINIMAX ############################### |
# MIN step of minimax: returns the successor that is worst for the MAX player.
def minimax_min_node(board, color, limit, caching = 0):
    """Minimize over `color`'s moves (the MIN player at this node).

    board   -- current game state (rows of 0/1/2)
    color   -- the player to move here (the MAX player's opponent)
    limit   -- remaining search depth; 0 triggers an evaluation cutoff
               (-1, per run_ai, means no depth limit and never reaches 0)
    caching -- 1 to memoize results keyed by (board, color, limit)

    Returns (move, utility) with utility ALWAYS expressed from the MAX
    player's perspective so values compare consistently up the tree.

    BUG FIXES vs the original: terminal utility used `color` (the MIN
    player), flipping the sign at every MIN leaf; `limit` and `caching`
    were accepted but ignored.
    """
    opponent = 1 if color == 2 else 2  # the MAX player at this node

    if caching:
        if not hasattr(minimax_min_node, "_cache"):
            minimax_min_node._cache = {}
        key = (str(board), color, limit)  # str() keeps the key hashable for any board type
        cached = minimax_min_node._cache.get(key)
        if cached is not None:
            return cached

    moves = get_possible_moves(board, color)

    # Terminal state (no moves) or depth cutoff: evaluate the board from
    # the MAX player's (`opponent`'s) perspective.
    if not moves or limit == 0:
        return (0, 0), compute_utility(board, opponent)

    best_move = moves[0]
    lowest_utility = math.inf
    for move in moves:
        successor = play_move(board, color, move[0], move[1])
        # Depth shrinks by one per ply; -1 (unlimited) just keeps decreasing.
        _, utility = minimax_max_node(successor, opponent, limit - 1, caching)
        if utility < lowest_utility:
            best_move = move
            lowest_utility = utility

    result = (best_move, lowest_utility)
    if caching:
        minimax_min_node._cache[key] = result
    return result
| 51 | + |
# MAX step of minimax: returns the successor that is best for `color`.
def minimax_max_node(board, color, limit, caching = 0):
    """Maximize over `color`'s moves (the MAX player at this node).

    board   -- current game state (rows of 0/1/2)
    color   -- the player to move here and to optimize for
    limit   -- remaining search depth; 0 triggers an evaluation cutoff
               (-1, per run_ai, means no depth limit and never reaches 0)
    caching -- 1 to memoize results keyed by (board, color, limit)

    Returns (move, utility); utility is from `color`'s own perspective,
    which is the MAX player's perspective throughout the tree.

    FIXES vs the original: `limit` and `caching` were accepted but ignored.
    """
    opponent = 1 if color == 2 else 2

    if caching:
        if not hasattr(minimax_max_node, "_cache"):
            minimax_max_node._cache = {}
        key = (str(board), color, limit)  # str() keeps the key hashable for any board type
        cached = minimax_max_node._cache.get(key)
        if cached is not None:
            return cached

    moves = get_possible_moves(board, color)

    # Terminal state (no moves) or depth cutoff: evaluate from `color`'s
    # own perspective (correct here, since this IS the MAX player).
    if not moves or limit == 0:
        return (0, 0), compute_utility(board, color)

    best_move = moves[0]
    highest_utility = -math.inf
    for move in moves:
        successor = play_move(board, color, move[0], move[1])
        # Depth shrinks by one per ply; -1 (unlimited) just keeps decreasing.
        _, utility = minimax_min_node(successor, opponent, limit - 1, caching)
        if utility > highest_utility:
            best_move = move
            highest_utility = utility

    result = (best_move, highest_utility)
    if caching:
        minimax_max_node._cache[key] = result
    return result
| 72 | + |
def select_move_minimax(board, color, limit, caching = 0):
    """
    Decide on a move for `color` using plain minimax.

    The return value is a tuple of integers (i, j), where i is the column
    and j is the row on the board.

    If limit is a positive integer, the search is cut off at that depth and
    non-terminal nodes at the cutoff are scored heuristically (see
    compute_utility). If caching is ON (1), state caching is used to reduce
    the number of state evaluations; if OFF (0), it is not.
    """
    chosen, _ = minimax_max_node(board, color, limit, caching)
    return chosen
| 87 | + |
| 88 | +############ ALPHA-BETA PRUNING ##################### |
def alphabeta_min_node(board, color, alpha, beta, limit, caching = 0, ordering = 0):
    """MIN step of alpha-beta search: minimize over `color`'s moves.

    alpha/beta -- the usual pruning window (alpha = best MAX can force,
                  beta = best MIN can force, seen so far on this path)
    limit      -- remaining depth; 0 triggers an evaluation cutoff
                  (-1, per run_ai, means no limit and never reaches 0)
    caching    -- 1 to memoize results
    ordering   -- 1 to expand the most promising successors first

    Returns (move, utility), utility from the MAX player's perspective.

    BUG FIXES vs the original:
      * it recursed into minimax_max_node, discarding alpha/beta entirely
        (no pruning happened);
      * the alpha-cutoff branch returned the undefined name
        `highest_utility` (NameError);
      * terminal utility was computed from the MIN player's perspective;
      * limit/caching/ordering were accepted but ignored.
    """
    opponent = 1 if color == 2 else 2  # the MAX player

    if caching:
        if not hasattr(alphabeta_min_node, "_cache"):
            alphabeta_min_node._cache = {}
        # alpha/beta are part of the key: values are only valid for the
        # window they were computed under.
        key = (str(board), color, limit, alpha, beta)
        cached = alphabeta_min_node._cache.get(key)
        if cached is not None:
            return cached

    moves = get_possible_moves(board, color)

    # Terminal state or depth cutoff: evaluate from MAX's perspective.
    if not moves or limit == 0:
        return (0, 0), compute_utility(board, opponent)

    successors = [(move, play_move(board, color, move[0], move[1])) for move in moves]
    if ordering:
        # Visit boards that look worst for MAX first: tightens beta early
        # and increases the chance of a cutoff.
        successors.sort(key=lambda pair: compute_utility(pair[1], opponent))

    best_move = successors[0][0]
    lowest_utility = math.inf
    for move, successor in successors:
        _, utility = alphabeta_max_node(successor, opponent, alpha, beta,
                                        limit - 1, caching, ordering)
        if utility < lowest_utility:
            best_move = move
            lowest_utility = utility
        beta = min(beta, lowest_utility)
        if beta <= alpha:
            break  # MAX already has a better option elsewhere: prune.

    result = (best_move, lowest_utility)
    if caching:
        alphabeta_min_node._cache[key] = result
    return result
| 115 | + |
# maximizer
def alphabeta_max_node(board, color, alpha, beta, limit, caching = 0, ordering = 0):
    """MAX step of alpha-beta search: maximize over `color`'s moves.

    alpha/beta -- the usual pruning window
    limit      -- remaining depth; 0 triggers an evaluation cutoff
                  (-1, per run_ai, means no limit and never reaches 0)
    caching    -- 1 to memoize results
    ordering   -- 1 to expand the most promising successors first

    Returns (move, utility), utility from `color`'s (MAX's) perspective.

    BUG FIXES vs the original: it recursed into minimax_min_node, so
    alpha/beta were never propagated and no pruning occurred; and
    limit/caching/ordering were accepted but ignored.
    """
    opponent = 1 if color == 2 else 2

    if caching:
        if not hasattr(alphabeta_max_node, "_cache"):
            alphabeta_max_node._cache = {}
        # alpha/beta are part of the key: values are only valid for the
        # window they were computed under.
        key = (str(board), color, limit, alpha, beta)
        cached = alphabeta_max_node._cache.get(key)
        if cached is not None:
            return cached

    moves = get_possible_moves(board, color)

    # Terminal state or depth cutoff: evaluate from MAX's own perspective.
    if not moves or limit == 0:
        return (0, 0), compute_utility(board, color)

    successors = [(move, play_move(board, color, move[0], move[1])) for move in moves]
    if ordering:
        # Visit boards that look best for MAX first: raises alpha early
        # and increases the chance of a cutoff.
        successors.sort(key=lambda pair: compute_utility(pair[1], color), reverse=True)

    best_move = successors[0][0]
    highest_utility = -math.inf
    for move, successor in successors:
        _, utility = alphabeta_min_node(successor, opponent, alpha, beta,
                                        limit - 1, caching, ordering)
        if utility > highest_utility:
            best_move = move
            highest_utility = utility
        alpha = max(alpha, highest_utility)
        if alpha >= beta:
            break  # MIN already has a better option elsewhere: prune.

    result = (best_move, highest_utility)
    if caching:
        alphabeta_max_node._cache[key] = result
    return result
| 142 | + |
def select_move_alphabeta(board, color, limit, caching = 0, ordering = 0):
    """
    Decide on a move for `color` using alpha-beta search.

    The return value is a tuple of integers (i, j), where i is the column
    and j is the row on the board.

    If limit is a positive integer, the search is cut off at that depth and
    non-terminal nodes at the cutoff are scored heuristically (see
    compute_utility). If caching is ON (1), state caching is used to reduce
    the number of state evaluations. If ordering is ON (1), node ordering
    is used to expedite pruning. Either flag at 0 disables that feature.
    """
    # Start with a fully open pruning window.
    chosen, _ = alphabeta_max_node(board, color, -math.inf, math.inf,
                                   limit, caching, ordering)
    return chosen
| 163 | + |
| 164 | +#################################################### |
def run_ai():
    """
    Establish communication with the game manager.

    Introduces this AI by name, reads its configuration line
    (color, depth limit, algorithm, caching, ordering), then repeatedly
    receives the current score and board state until the game is over,
    answering each board with a chosen move on stdout.
    """
    print("Othello AI") # First line is the name of this AI
    arguments = input().split(",")

    color = int(arguments[0]) #Player color: 1 for dark (goes first), 2 for light.
    limit = int(arguments[1]) #Depth limit (-1 per the banner below means OFF)
    minimax = int(arguments[2]) #Minimax (1) or alpha beta (otherwise)
    caching = int(arguments[3]) #Caching flag
    ordering = int(arguments[4]) #Node-ordering flag (for alpha-beta only)

    if (minimax == 1): eprint("Running MINIMAX")
    else: eprint("Running ALPHA-BETA")

    if (caching == 1): eprint("State Caching is ON")
    else: eprint("State Caching is OFF")

    if (ordering == 1): eprint("Node Ordering is ON")
    else: eprint("Node Ordering is OFF")

    if (limit == -1): eprint("Depth Limit is OFF")
    else: eprint("Depth Limit is ", limit)

    if (minimax == 1 and ordering == 1): eprint("Node Ordering should have no impact on Minimax")

    while True: # Main loop: one iteration per status report from the manager.
        # Read in the current game status, for example:
        # "SCORE 2 2" or "FINAL 33 31" if the game is over.
        # The first number is the score for player 1 (dark), the second for player 2 (light)
        next_input = input()
        status, dark_score_s, light_score_s = next_input.strip().split()
        dark_score = int(dark_score_s)
        light_score = int(light_score_s)

        if status == "FINAL": # Game is over.
            # BUG FIX: the original had a bare `print` statement here (a
            # no-op expression), so the loop spun back to input() and died
            # with EOFError when the manager closed the pipe. The game is
            # over -- stop reading.
            break
        else:
            # SECURITY NOTE: eval() on external input is dangerous in
            # general; it is tolerated here only because the board line
            # comes from the trusted game manager.
            board = eval(input()) # Read in the input and turn it into a Python
                                  # object. The format is a list of rows. The
                                  # squares in each row are represented by
                                  # 0 : empty square
                                  # 1 : dark disk (player 1)
                                  # 2 : light disk (player 2)

            # Select the move and send it to the manager
            if (minimax == 1): #run this if the minimax flag is given
                movei, movej = select_move_minimax(board, color, limit, caching)
            else: #else run alphabeta
                movei, movej = select_move_alphabeta(board, color, limit, caching, ordering)

            print("{} {}".format(movei, movej))
| 221 | + |
| 222 | +if __name__ == "__main__": |
| 223 | + run_ai() |
0 commit comments