test2.py

import os
import random
import numpy as np
import tqdm
from game import Game, MonteCarloPNSPlayer, Move, Player
from board import Board
from tree_PNS import PN_MCTS_Node


class RandomPlayer(Player):
    def __init__(self) -> None:
        super().__init__()

    def make_move(self, game: 'Game') -> tuple[tuple[int, int], Move]:
        from_pos = (random.randint(0, 4), random.randint(0, 4))
        move = random.choice([Move.TOP, Move.BOTTOM, Move.LEFT, Move.RIGHT])
        return from_pos, move

if __name__ == '__main__':
    
    losing_board = []
    winning_board = []
    results = {}
    my_player_id = 0
    players = np.empty(2, dtype=Player)
    tot = 100
    duration = 0.5
    # cross validation backbone to find best hyperparameters
        # this below is the best configuration found if we consider a performance/execution_time tradeoff
    for ns in [1]:
        for cp in [0.1]:

            #wins and matches for accuracy
            wins = 0
            matches = 0

            #play tot games
            for i in tqdm.tqdm(range(tot)):
                my_player_id = 0
                print(f"my_player_id: {my_player_id}")
                g = Game()
                #g.print()

                # player initialization -> our player is players[my_player_id]
               # player initialization -> our player is players[my_player_id]
                minmax_depth = 1
                MR_hybrid = False # if True, the player will use the Minimax hybrid algorithm for the rollout

                players[my_player_id] = MonteCarloPNSPlayer(player_id=my_player_id,duration=duration, c_param=0.5, pn_param=0.5,MR_hybrid = MR_hybrid,minimax_depth=minmax_depth)
                players[1 - my_player_id] = RandomPlayer()
                
                # play the game
                winner = g.play(players[0], players[1])
                g.print()
                print(f"Winner: Player {winner}")
                matches += 1

                #update accuracy
                if winner == my_player_id:
                    
                    wins += 1
                    winning_board.append(g.get_board())
                    #np.save("Computational-Intelligence\\quixo\\features\\won_test3.npy", winning_board)
                else:
                    #g.print()
                    losing_board.append(g.get_board())
                    #np.save("Computational-Intelligence\\quixo\\features\\lost_test3.npy", losing_board)

                #print(g.get_board())
            #print accuracy
            acc  = 100*float(wins)/float(matches)
            print("accuracy: ",acc )

            #save results
            results[str(ns) + "-"+ str(cp)] = acc

            # np.save("Computational-Intelligence\\quixo\\features\\lost_test3.npy", losing_board)
            # with open('Computational-Intelligence\\quixo\\features\\lost_test3.txt', 'a' if os.path.isfile('lost.txt') else 'w') as file:
            #             file.write("\n")
            #             file.write(str(losing_board))    
                        
            #             #print(losing_board)

            # np.save("Computational-Intelligence\\quixo\\features\\won_test3.npy", winning_board)
            # with open('Computational-Intelligence\\quixo\\features\\won_test3.txt', 'a' if os.path.isfile('won.txt') else 'w') as file:
            #             file.write("\n")
            #             file.write(str(losing_board))
            #             #print(winning_board)