From 06e633b4b750c002d2d488334aa75b292482651d Mon Sep 17 00:00:00 2001
From: sirmammingtonham <ethanj217@gmail.com>
Date: Thu, 1 Nov 2018 15:54:05 -0700
Subject: [PATCH] cleaning: merged gameUtils.py and game.py

---
 alphabot/Arena.py   |   4 +-
 alphabot/Coach.py   |   4 +-
 alphabot/Game.py    | 331 +++++++++++++++++++++++++++++-------
 alphabot/GameOld.py | 405 ++++++++++++++++++++++++++++++++++++++++++++
 alphabot/MCTS.py    |   6 +-
 alphabot/pit.py     |   2 +-
 6 files changed, 683 insertions(+), 69 deletions(-)
 create mode 100644 alphabot/GameOld.py

diff --git a/alphabot/Arena.py b/alphabot/Arena.py
index d73d241..8f691c5 100644
--- a/alphabot/Arena.py
+++ b/alphabot/Arena.py
@@ -48,7 +48,7 @@ def playGame(self, verbose=False):
                 action = players[curPlayer + 1](current_game)
                 next_state, curPlayer = self.game.getNextState(curPlayer, (action), current_game)
             else:
-                pi = players[curPlayer+1](self.game.getState(current_game))
+                pi = players[curPlayer+1](self.game.getState())
                 pi_reshape = np.reshape(pi, (21, 18))
                 action = np.where(pi_reshape==np.max(pi_reshape))
                 next_state, curPlayer = self.game.getNextState(curPlayer, (action[0][0], action[1][0]), current_game)
@@ -56,7 +56,7 @@ def playGame(self, verbose=False):
         #     assert(self.display)
         #     print("Game over: Turn ", str(it), "Result ", str(self.game.getGameEnded(board, 1)))
         #     self.display(board)
-        return self.game.getGameEnded(curPlayer, current_game)
+        return self.game.getGameEnded(current_game)
 
     def playGames(self, num, verbose=False):
         """
diff --git a/alphabot/Coach.py b/alphabot/Coach.py
index a513f38..33633eb 100644
--- a/alphabot/Coach.py
+++ b/alphabot/Coach.py
@@ -51,7 +51,7 @@ def executeEpisode(self):
             pi = self.mcts.getActionProb(state, temp=temp)
             pi_reshape = np.reshape(pi, (21, 18))
             # sym = self.game.getSymmetries(state, pi)
-            s = self.game.getState(self.curPlayer)
+            s = self.game.getState()
             trainExamples.append([s, self.curPlayer, pi, None])
             # for b,p in sym:
             #     trainExamples.append([b, self.curPlayer, p, None])
@@ -59,7 +59,7 @@ def executeEpisode(self):
             a, b = np.unravel_index(np.ravel(action, np.asarray(pi).shape), pi_reshape.shape)
             current_game, self.curPlayer = self.game.getNextState(self.curPlayer, (a[0], b[0]))
 
-            r = self.game.getGameEnded(self.curPlayer)
+            r = self.game.getGameEnded()
 
             if r!=0:
                 return [(x[0],x[2],r*((-1)**(x[1]!=self.curPlayer))) for x in trainExamples]
diff --git a/alphabot/Game.py b/alphabot/Game.py
index 7e6e0fb..cd13b30 100644
--- a/alphabot/Game.py
+++ b/alphabot/Game.py
@@ -1,23 +1,42 @@
+import random
 import numpy as np
-from utils import Board, UnhandledAction
+import pickle
+
+from fireplace import cards
+from fireplace.exceptions import GameOver, InvalidAction
+from fireplace.game import Game
+from fireplace.player import Player
+from fireplace.utils import random_draft
+from hearthstone.enums import CardClass
+from utils import UnhandledAction
 from fireplace.exceptions import GameOver
 
 class YEET:
     """
-    This class specifies the base Game class. To define your own game, subclass
-    this class and implement the functions below. This works when the game is
-    two-player, adversarial and turn-based.
-
     Use 1 for player1 and -1 for player2.
     21 possible actions per move, and 8 possible targets per action + 1 if no targets
     is_basic = True initializes game between priest and rogue only
     """
-    
+
     def __init__(self, is_basic=True):
-        self.num_actions = 21
+        self.game = None
+        self.is_basic = True
         self.players = ['player1', 'player2']
         self.is_basic = is_basic
-        self.b = Board()
+        self.isolate = False
+
+
+    def isolateSet(self, filename='notbasicset', set='CardSet.CORE'):
+        # isolates the specified card set for exclusion in drafting
+        cards.db.initialize()
+        extraset = []
+        for index, card in cards.db.items():
+            if str(card.card_set) != set:
+                    extraset.append(card.id)
+        with open(f'{filename}.data', 'wb') as filehandle:
+            # store the data as binary data stream
+            pickle.dump(extraset, filehandle)
+
 
     def getInitGame(self):
         """
@@ -25,70 +44,177 @@ def getInitGame(self):
             startBoard: a representation of the board (ideally this is the form
                         that will be the input to your neural network)
         """
-        # self.b.isolateSet()
-        self.b.initGame()
-        return self.b.game
+        if self.isolate:
+            self.isolateSet()
+
+        cards.db.initialize()
+        if self.is_basic: #create quick simple game
+            with open('notbasic.data', 'rb') as f:
+                extra_set = pickle.load(f)
+            p1 = 6 #priest
+            p2 = 7 #rogue
+            deck1 = random_draft(CardClass(p1), exclude=extra_set)
+            deck2 = random_draft(CardClass(p2), exclude=extra_set)
+        else:
+            p1 = random.randint(1, 9)
+            p2 = random.randint(1, 9)
+            deck1 = random_draft(CardClass(p1))
+            deck2 = random_draft(CardClass(p2))
+        self.players[0] = Player("Player1", deck1, CardClass(p1).default_hero)
+        self.players[1] = Player("Player2", deck2, CardClass(p2).default_hero)
+        game = Game(players=self.players)
+        game.start()
+
+        # Skip mulligan for now
+        for player in game.players:
+            cards_to_mulligan = random.sample(player.choice.cards, 0)
+            player.choice.choose(*cards_to_mulligan)
+
+        game.player_to_start = game.current_player
+        self.game = game
+        return game
+
 
-    def getNextState(self, player, action, game_instance=Board.game):
+    def getNextState(self, player, action, game_instance=self.game):
         """
         Input:
-            board: current board (gameUtils)
             player: current player (1 or -1)
             action: action taken by current player
+            game_instance: the game object (actual game or deepcopy for MCTS)
 
         Returns:
-            nextBoard: board after applying action
-            nextPlayer: player who plays in the next turn (should be -player)
-
-            all actions executed by copy_player to preserve new game
-
+            next_state: state after applying action
+            next_player: player who plays in the next turn (should be -player if the action is end turn)
         """
         if game_instance == None:
-            game_instance = Board.game
+            game_instance = self.game
 
         try:
-            self.b.performAction(action, player, game_instance)
+            self.performAction(action, game_instance)
         except GameOver:
             raise GameOver
-        next_state = self.b.getState(player, game_instance)
+
+        next_state = self.getState(game_instance)
+
         if action[0] != 19:
             return next_state, player
         else:
             return next_state, -player
 
-    def getValidMoves(self, player, game_instance=Board.game):
+
+    def getValidMoves(self, game_instance=self.game):
         """
         Input:
-            board: current board
-            player: current player
+            game_instance: the game object (actual game or deepcopy for MCTS)
 
         Returns:
-            validMoves: a binary vector of length self.getActionSize(), 1 for
-                        moves that are valid from the current board and player,
+            validMoves: a 21x18 binary matrix, 1 for
+                        moves that are valid from the current game instance and player,
                         0 for invalid moves
         """
-        # if player == 1:
-        #     current_player = self.b.players[0]
-        # elif player == -1:
-        #     current_player = self.b.players[1]
-        if game_instance == None:
-            game_instance = Board.game
-        return self.b.getValidMoves(game_instance)
+        actions = np.zeros((21,18))
+        player = game_instance.current_player
+        #If the player is being given a choice, return only valid choices
+        if player.choice:
+            for index, card in enumerate(player.choice.cards):
+                actions[20, index] = 1
 
+        else:
+            # add cards in hand
+            for index, card in enumerate(player.hand):
+                if card.is_playable():
+                    if card.requires_target():
+                        for target, card in enumerate(card.targets):
+                            actions[index, target] = 1
+                    elif card.must_choose_one:
+                        for choice, card in enumerate(card.choose_cards):
+                            actions[index, choice] = 1
+                    else:
+                        actions[index] = 1
+            # add targets available to minions that can attack
+            for position, minion in enumerate(player.field):
+                if minion.can_attack():
+                    for target, card in enumerate(minion.attack_targets):
+                        actions[position+10, target] = 1
+            # add hero power and targets if applicable
+            if player.hero.power.is_usable():
+                if player.hero.power.requires_target():
+                    for target, card in enumerate(player.hero.power.targets):
+                        actions[17, target] = 1
+                else:
+                    actions[17] = 1
+            # add hero attacking if applicable
+            if player.hero.can_attack():
+                for target, card in enumerate(player.hero.attack_targets):
+                    actions[18, target] = 1
+            # add end turn
+            actions[19,1] = 1
+        return actions
 
 
-    def getGameEnded(self, player, game_instance=Board.game):
+    def performAction(self, a, game_instance):
         """
+        utility to perform an action tuple
+
         Input:
-            board: current board
-            player: current player (1 or -1)
+            a, a tuple representing index of action
+            game_instance: the game object (actual game or deepcopy for MCTS)
+
+        """
+        player = game_instance.current_player
+        if not game_instance.ended:
+            try:
+                if 0 <= a[0] <= 9:
+                    if player.hand[a[0]].requires_target():
+                        player.hand[a[0]].play(player.hand[a[0]].targets[a[1]])
+                    elif player.hand[a[0]].must_choose_one:
+                        player.hand[a[0]].play(choose=player.hand[a[0]].choose_targets[a[1]])
+                    else:
+                        player.hand[a[0]].play()
+                elif 10 <= a[0] <= 16:
+                    player.field[a[0]-10].attack(player.field[a[0]-10].attack_targets[a[1]])
+                elif a[0] == 17:
+                    if player.hero.power.requires_target():
+                            player.hero.power.use(player.hero.power.play_targets[a[1]])
+                    else:
+                        player.hero.power.use()
+                elif a[0] == 18:
+                    player.hero.attack(player.hero.attack_targets[a[1]])
+                elif a[0] == 19:
+                    player.game.end_turn()
+                elif a[0] == 20 and not player.choice:
+                    player.game.end_turn()
+                elif player.choice:
+                    player.choice.choose(player.choice.cards[a[1]])
+                else:
+                    raise UnhandledAction
+            except UnhandledAction:
+                print("Attempted to take an inappropriate action!")
+                print(a)
+                raise
+            except InvalidAction:
+                print("Attempted to do something I can't!")
+                player.game.end_turn()
+            except IndexError:
+                try:
+                    player.game.end_turn()
+                except GameOver:
+                    pass
+            except GameOver:
+                pass
+
+
+    def getGameEnded(self, game_instance=self.game):
+        """
+        Input:
+            game_instance: the game object (actual game or deepcopy for MCTS)
 
         Returns:
-            r: 0 if game has not ended. 1 if player won, -1 if player lost,
+            r: 0 if game has not ended. 1 if starting player won, -1 if player lost,
                small non-zero value for draw.
         """
         if game_instance == None:
-            game_instance = Board.game
+            game_instance = self.game
 
         p1 = game_instance.player_to_start
 
@@ -103,58 +229,141 @@ def getGameEnded(self, player, game_instance=Board.game):
             return 0.0001
         return 0
 
-    def getState(self, player, game_instance=Board.game):
+    def getState(self, game_instance=self.game):
         """
-        Input:
-            board: current board
-            player: current player (1 or -1)
-
-        Returns:
-            state: see gameUtils.getState for info
+        Args:
+            game_instance: the game object (actual game or deepcopy for MCTS)
+        return:
+            a 263 length numpy array of features extracted from the
+            supplied game.
         """
-        # if player == 1:
-        #     current_player = self.b.players[0]
-        # elif player == -1:
-        #     current_player = self.b.players[1]
-        if game_instance == None:
-            game_instance = Board.game
+        s = np.zeros(263, dtype=np.int32)
+
+        p1 = game_instance.current_player
+        p2 = p1.opponent
+
+        #0-9 player1 class, we subtract 1 here because the classes are from 1 to 10
+        s[p1.hero.card_class-1] = 1
+        #10-19 player2 class
+        s[10 + p2.hero.card_class-1] = 1
+        i = 20
+        # 20-21: current health of current player, then opponent
+        s[i] = p1.hero.health
+        s[i + 1] = p2.hero.health
+
+        # 22: hero power usable y/n
+        s[i + 2] = p1.hero.power.is_usable()*1
+        # 23-24: # of mana crystals for you opponent
+        s[i + 3] = p1.max_mana
+        s[i + 4] = p2.max_mana
+        # 25: # of crystals still avalible
+        s[i + 5] = p1.mana
+        #26-31: weapon equipped y/n, pow., dur. for you, then opponent
+        s[i + 6] = 0 if p1.weapon is None else 1
+        s[i + 7] = 0 if p1.weapon is None else p1.weapon.damage
+        s[i + 8] = 0 if p1.weapon is None else p1.weapon.durability
+
+        s[i + 9] = 0 if p2.weapon is None else 1
+        s[i + 10] = 0 if p2.weapon is None else p2.weapon.damage
+        s[i + 11] = 0 if p2.weapon is None else p2.weapon.durability
+
+        # 32: number of cards in opponents hand
+        s[i + 12] = len(p2.hand)
+        #in play minions
+
+        i = 33
+        #33-102, your monsters on the field
+        p1_minions = len(p1.field)
+        for j in range(0, 7):
+            if j < p1_minions:
+                # filled y/n, pow, tough, current health, can attack
+                s[i] = 1
+                s[i + 1] = p1.field[j].atk
+                s[i + 2] = p1.field[j].max_health
+                s[i + 3] = p1.field[j].health
+                s[i + 4] = p1.field[j].can_attack()*1
+                # deathrattle, div shield, taunt, stealth y/n
+                s[i + 5] = p1.field[j].has_deathrattle*1
+                s[i + 6] = p1.field[j].divine_shield*1
+                s[i + 7] = p1.field[j].taunt*1
+                s[i + 8] = p1.field[j].stealthed*1
+                s[i + 9] = p1.field[j].silenced*1
+            i += 10
+
+        #103-172, enemy monsters on the field
+        p2_minions = len(p2.field)
+        for j in range(0, 7):
+            if j < p2_minions:
+                # filled y/n, pow, tough, current health, can attack
+                s[i] = 1
+                s[i + 1] = p2.field[j].atk
+                s[i + 2] = p2.field[j].max_health
+                s[i + 3] = p2.field[j].health
+                s[i + 4] = p2.field[j].can_attack()*1
+                # deathrattle, div shield, taunt, stealth y/n
+                s[i + 5] = p2.field[j].has_deathrattle*1
+                s[i + 6] = p2.field[j].divine_shield*1
+                s[i + 7] = p2.field[j].taunt*1
+                s[i + 8] = p2.field[j].stealthed*1
+                s[i + 9] = p2.field[j].silenced*1
+            i += 10
+
+        #in hand
+
+        #173-262, your cards in hand
+        p1_hand = len(p1.hand)
+        for j in range(0, 10):
+            if j < p1_hand:
+                #card y/n
+                s[i] = 1
+                # minion y/n, attk, hp, battlecry, div shield, deathrattle, taunt
+                s[i + 1] = 1 if p1.hand[j].type == 4 else 0
+                s[i + 2] = p1.hand[j].atk if s[i + 1] == 1 else 0
+                s[i + 2] = p1.hand[j].health if s[i + 1] == 1 else 0
+                s[i + 3] = p1.hand[j].divine_shield*1 if s[i + 1] == 1 else 0
+                s[i + 4] = p1.hand[j].has_deathrattle*1 if s[i + 1] == 1 else 0
+                s[i + 5] = p1.hand[j].taunt*1 if s[i + 1] == 1 else 0
+                # weapon y/n, spell y/n, cost
+                s[i + 6] = 1 if p1.hand[j].type == 7 else 0
+                s[i + 7] = 1 if p1.hand[j].type == 5 else 0
+                s[i + 8] = p1.hand[j].cost
+            i += 9
+        return s
 
-        return self.b.getState(player, game_instance)
-        # return b.game
 
     def getSymmetries(self, state, pi):
         """
         Input:
-            board: current board
+            state: current state
             pi: policy vector of size self.getActionSize()
 
         Returns:
-            symmForms: a list of [(board,pi)] where each tuple is a symmetrical
-                       form of the board and the corresponding pi vector. This
+            symmForms: a list of [(actions,pi)] where each tuple is a symmetrical
+                       form of the actions and the corresponding pi vector. This
                        is used when training the neural network from examples.
         """
-        # assert(len(pi) == len(state))
         assert(len(pi) == 168)
-        pi_board = np.reshape(pi, (21, 9))
+        pi_reshape = np.reshape(pi, (21, 9))
         l = []
 
         for i in range(1, 5):
             for j in [True, False]:
                 newS = np.rot90(state, i)
-                newPi = np.rot90(pi_board, i)
+                newPi = np.rot90(pi_reshape, i)
                 if j:
                     newS = np.fliplr(newS)
                     newPi = np.fliplr(newPi)
                 l += [(newS, list(newPi.ravel()) + [pi[-1]])]
         return l
 
+
     def stringRepresentation(self, state):
         """
         Input:
             state: np array of state
 
         Returns:
-            boardString: a quick conversion of board to a string format.
+            stateString: a quick conversion of state to a string format.
                          Required by MCTS for hashing.
         """
-        return state.tostring()
+        return state.tostring()
\ No newline at end of file
diff --git a/alphabot/GameOld.py b/alphabot/GameOld.py
new file mode 100644
index 0000000..7e63bae
--- /dev/null
+++ b/alphabot/GameOld.py
@@ -0,0 +1,405 @@
+import numpy as np
+from utils import Board, UnhandledAction
+from fireplace.exceptions import GameOver
+
+class YEET:
+    """
+    This class specifies the base Game class. To define your own game, subclass
+    this class and implement the functions below. This works when the game is
+    two-player, adversarial and turn-based.
+
+    Use 1 for player1 and -1 for player2.
+    21 possible actions per move, and 8 possible targets per action + 1 if no targets
+    is_basic = True initializes game between priest and rogue only
+    """
+    
+    def __init__(self, is_basic=True):
+        self.num_actions = 21
+        self.players = ['player1', 'player2']
+        self.is_basic = is_basic
+        self.b = Board()
+
+    def getInitGame(self):
+        """
+        Returns:
+            startBoard: a representation of the board (ideally this is the form
+                        that will be the input to your neural network)
+        """
+        # self.b.isolateSet()
+        self.b.initGame()
+        return self.b.game
+
+    def getNextState(self, player, action, game_instance=Board.game):
+        """
+        Input:
+            board: current board (gameUtils)
+            player: current player (1 or -1)
+            action: action taken by current player
+
+        Returns:
+            nextBoard: board after applying action
+            nextPlayer: player who plays in the next turn (should be -player)
+
+            all actions executed by copy_player to preserve new game
+
+        """
+        if game_instance == None:
+            game_instance = Board.game
+
+        try:
+            self.b.performAction(action, player, game_instance)
+        except GameOver:
+            raise GameOver
+        next_state = self.b.getState(player, game_instance)
+        if action[0] != 19:
+            return next_state, player
+        else:
+            return next_state, -player
+
+    def getValidMoves(self, player, game_instance=Board.game):
+        """
+        Input:
+            board: current board
+            player: current player
+
+        Returns:
+            validMoves: a binary vector of length self.getActionSize(), 1 for
+                        moves that are valid from the current board and player,
+                        0 for invalid moves
+        """
+        # if player == 1:
+        #     current_player = self.b.players[0]
+        # elif player == -1:
+        #     current_player = self.b.players[1]
+        if game_instance == None:
+            game_instance = Board.game
+        return self.b.getValidMoves(game_instance)
+
+
+    def getGameEnded(self, game_instance=Board.game):
+        """
+        Input:
+            board: current board
+            player: current player (1 or -1)
+
+        Returns:
+            r: 0 if game has not ended. 1 if player won, -1 if player lost,
+               small non-zero value for draw.
+        """
+        if game_instance == None:
+            game_instance = Board.game
+
+        p1 = game_instance.player_to_start
+
+        if p1.playstate == 4:
+            return 1
+        elif p1.playstate == 5:
+            return -1
+        elif p1.playstate == 6:
+            return 0.0001
+        elif game_instance.turn > 180:
+            game_instance.ended = True
+            return 0.0001
+        return 0
+
+    def getState(self, player, game_instance=Board.game):
+        """
+        Input:
+            board: current board
+            player: current player (1 or -1)
+
+        Returns:
+            state: see gameUtils.getState for info
+        """
+        # if player == 1:
+        #     current_player = self.b.players[0]
+        # elif player == -1:
+        #     current_player = self.b.players[1]
+        if game_instance == None:
+            game_instance = Board.game
+
+        return self.b.getState(player, game_instance)
+        # return b.game
+
+    def getSymmetries(self, state, pi):
+        """
+        Input:
+            board: current board
+            pi: policy vector of size self.getActionSize()
+
+        Returns:
+            symmForms: a list of [(board,pi)] where each tuple is a symmetrical
+                       form of the board and the corresponding pi vector. This
+                       is used when training the neural network from examples.
+        """
+        # assert(len(pi) == len(state))
+        assert(len(pi) == 168)
+        pi_board = np.reshape(pi, (21, 9))
+        l = []
+
+        for i in range(1, 5):
+            for j in [True, False]:
+                newS = np.rot90(state, i)
+                newPi = np.rot90(pi_board, i)
+                if j:
+                    newS = np.fliplr(newS)
+                    newPi = np.fliplr(newPi)
+                l += [(newS, list(newPi.ravel()) + [pi[-1]])]
+        return l
+
+    def stringRepresentation(self, state):
+        """
+        Input:
+            state: np array of state
+
+        Returns:
+            boardString: a quick conversion of board to a string format.
+                         Required by MCTS for hashing.
+        """
+        return state.tostring()
+class Board:
+    """
+    This class interacts with Game.py to initialize the game,
+    return states, and return actions
+    """
+    game = None
+    players = ['', '']
+
+    def __init__(self):
+        self.num_actions = 23
+        self.is_basic = True
+
+    def isolateSet(self, filename='notbasicset', set='CardSet.CORE'):
+        # isolates the specified card set for exclusion in drafting
+        cards.db.initialize()
+        extraset = []
+        for index, card in cards.db.items():
+            if str(card.card_set) != set:
+                    extraset.append(card.id)
+        with open(f'{filename}.data', 'wb') as filehandle:
+            # store the data as binary data stream
+            pickle.dump(extraset, filehandle)
+
+    def initGame(self):
+        cards.db.initialize()
+        if self.is_basic: #create quick simple game
+            with open('notbasic.data', 'rb') as f:
+                extra_set = pickle.load(f)
+            p1 = 6 #priest
+            p2 = 7 #rogue
+            deck1 = random_draft(CardClass(p1), exclude=extra_set)
+            deck2 = random_draft(CardClass(p2), exclude=extra_set)
+        else:
+            p1 = random.randint(1, 9)
+            p2 = random.randint(1, 9)
+            deck1 = random_draft(CardClass(p1))
+            deck2 = random_draft(CardClass(p2))
+        Board.players[0] = Player("Player1", deck1, CardClass(p1).default_hero)
+        Board.players[1] = Player("Player2", deck2, CardClass(p2).default_hero)
+        game = Game(players=self.players)
+        game.start()
+
+        # Skip mulligan for now
+        for player in game.players:
+            cards_to_mulligan = random.sample(player.choice.cards, 0)
+            player.choice.choose(*cards_to_mulligan)
+
+        # self.start_player = game.current_player
+        game.player_to_start = game.current_player
+        Board.game = game
+        return game
+
+    def getValidMoves(self, game_instance):
+        actions = np.zeros((21,18))
+        player = game_instance.current_player
+        #If the player is being given a choice, return only valid choices
+        if player.choice:
+            for index, card in enumerate(player.choice.cards):
+                actions[20, index] = 1
+                #actions.append(("choose", card, None))
+
+        else:
+            # add cards in hand
+            for index, card in enumerate(player.hand):
+                if card.is_playable():
+                    if card.requires_target():
+                        for target, card in enumerate(card.targets):
+                            actions[index, target] = 1
+                    elif card.must_choose_one:
+                        for choice, card in enumerate(card.choose_cards):
+                            actions[index, choice] = 1
+                    else:
+                        actions[index] = 1
+            # add targets available to minions that can attack
+            for position, minion in enumerate(player.field):
+                if minion.can_attack():
+                    for target, card in enumerate(minion.attack_targets):
+                        actions[position+10, target] = 1
+            # add hero power and targets if applicable
+            if player.hero.power.is_usable():
+                if player.hero.power.requires_target():
+                    for target, card in enumerate(player.hero.power.targets):
+                        actions[17, target] = 1
+                else:
+                    actions[17] = 1
+            # add hero attacking if applicable
+            if player.hero.can_attack():
+                for target, card in enumerate(player.hero.attack_targets):
+                    actions[18, target] = 1
+            # add end turn
+            actions[19,1] = 1
+        return actions
+
+    def performAction(self, a, player, game_instance):
+        """
+        utilty to convert an action tuple
+        into an action input
+        Args:
+            a, a tuple representing index of action
+            player,
+            game,
+        """
+        player = game_instance.current_player
+        if not game_instance.ended:
+            try:
+                if 0 <= a[0] <= 9:
+                    if player.hand[a[0]].requires_target():
+                        player.hand[a[0]].play(player.hand[a[0]].targets[a[1]])
+                    elif player.hand[a[0]].must_choose_one:
+                        player.hand[a[0]].play(choose=player.hand[a[0]].choose_targets[a[1]])
+                    else:
+                        player.hand[a[0]].play()
+                elif 10 <= a[0] <= 16:
+                    player.field[a[0]-10].attack(player.field[a[0]-10].attack_targets[a[1]])
+                elif a[0] == 17:
+                    if player.hero.power.requires_target():
+                            player.hero.power.use(player.hero.power.play_targets[a[1]])
+                    else:
+                        player.hero.power.use()
+                elif a[0] == 18:
+                    player.hero.attack(player.hero.attack_targets[a[1]])
+                elif a[0] == 19:
+                    player.game.end_turn()
+                elif a[0] == 20 and not player.choice:
+                    player.game.end_turn()
+                elif player.choice:
+                    player.choice.choose(player.choice.cards[a[1]])
+                else:
+                    raise UnhandledAction
+            except UnhandledAction:
+                print("Attempted to take an inappropriate action!")
+                print(a)
+                raise
+            except InvalidAction:
+                print("Attempted to do something I can't!")
+                player.game.end_turn()
+            except IndexError:
+                try:
+                    player.game.end_turn()
+                except GameOver:
+                    pass
+            except GameOver:
+                pass
+
+
+    def getState(self, player, game_instance):
+        """
+        Args:
+            game, the current game object
+            player, the player from whose perspective to analyze the state
+        return:
+            a numpy array features extracted from the
+            supplied game.
+        """
+        s = np.zeros(263, dtype=np.int32)
+
+        p1 = game_instance.current_player
+        p2 = p1.opponent
+
+        #0-9 player1 class, we subtract 1 here because the classes are from 1 to 10
+        s[p1.hero.card_class-1] = 1
+        #10-19 player2 class
+        s[10 + p2.hero.card_class-1] = 1
+        i = 20
+        # 20-21: current health of current player, then opponent
+        s[i] = p1.hero.health
+        s[i + 1] = p2.hero.health
+
+        # 22: hero power usable y/n
+        s[i + 2] = p1.hero.power.is_usable()*1
+        # 23-24: # of mana crystals for you opponent
+        s[i + 3] = p1.max_mana
+        s[i + 4] = p2.max_mana
+        # 25: # of crystals still avalible
+        s[i + 5] = p1.mana
+        #26-31: weapon equipped y/n, pow., dur. for you, then opponent
+        s[i + 6] = 0 if p1.weapon is None else 1
+        s[i + 7] = 0 if p1.weapon is None else p1.weapon.damage
+        s[i + 8] = 0 if p1.weapon is None else p1.weapon.durability
+
+        s[i + 9] = 0 if p2.weapon is None else 1
+        s[i + 10] = 0 if p2.weapon is None else p2.weapon.damage
+        s[i + 11] = 0 if p2.weapon is None else p2.weapon.durability
+
+        # 32: number of cards in opponents hand
+        s[i + 12] = len(p2.hand)
+        #in play minions
+
+        i = 33
+        #33-102, your monsters on the field
+        p1_minions = len(p1.field)
+        for j in range(0, 7):
+            if j < p1_minions:
+                # filled y/n, pow, tough, current health, can attack
+                s[i] = 1
+                s[i + 1] = p1.field[j].atk
+                s[i + 2] = p1.field[j].max_health
+                s[i + 3] = p1.field[j].health
+                s[i + 4] = p1.field[j].can_attack()*1
+                # deathrattle, div shield, taunt, stealth y/n
+                s[i + 5] = p1.field[j].has_deathrattle*1
+                s[i + 6] = p1.field[j].divine_shield*1
+                s[i + 7] = p1.field[j].taunt*1
+                s[i + 8] = p1.field[j].stealthed*1
+                s[i + 9] = p1.field[j].silenced*1
+            i += 10
+
+        #103-172, enemy monsters on the field
+        p2_minions = len(p2.field)
+        for j in range(0, 7):
+            if j < p2_minions:
+                # filled y/n, pow, tough, current health, can attack
+                s[i] = 1
+                s[i + 1] = p2.field[j].atk
+                s[i + 2] = p2.field[j].max_health
+                s[i + 3] = p2.field[j].health
+                s[i + 4] = p2.field[j].can_attack()*1
+                # deathrattle, div shield, taunt, stealth y/n
+                s[i + 5] = p2.field[j].has_deathrattle*1
+                s[i + 6] = p2.field[j].divine_shield*1
+                s[i + 7] = p2.field[j].taunt*1
+                s[i + 8] = p2.field[j].stealthed*1
+                s[i + 9] = p2.field[j].silenced*1
+            i += 10
+
+        #in hand
+
+        #173-262, your cards in hand
+        p1_hand = len(p1.hand)
+        for j in range(0, 10):
+            if j < p1_hand:
+                #card y/n
+                s[i] = 1
+                # minion y/n, attk, hp, battlecry, div shield, deathrattle, taunt
+                s[i + 1] = 1 if p1.hand[j].type == 4 else 0
+                s[i + 2] = p1.hand[j].atk if s[i + 1] == 1 else 0
+                s[i + 2] = p1.hand[j].health if s[i + 1] == 1 else 0
+                s[i + 3] = p1.hand[j].divine_shield*1 if s[i + 1] == 1 else 0
+                s[i + 4] = p1.hand[j].has_deathrattle*1 if s[i + 1] == 1 else 0
+                s[i + 5] = p1.hand[j].taunt*1 if s[i + 1] == 1 else 0
+                # weapon y/n, spell y/n, cost
+                s[i + 6] = 1 if p1.hand[j].type == 7 else 0
+                s[i + 7] = 1 if p1.hand[j].type == 5 else 0
+                s[i + 8] = p1.hand[j].cost
+            i += 9
+        return s
\ No newline at end of file
diff --git a/alphabot/MCTS.py b/alphabot/MCTS.py
index f395d68..8178af4 100644
--- a/alphabot/MCTS.py
+++ b/alphabot/MCTS.py
@@ -90,7 +90,7 @@ def search(self, state, create_copy):
         s = self.game.stringRepresentation(state)
 
         if s not in self.Es:
-            self.Es[s] = self.game.getGameEnded(1, self.game_copy)
+            self.Es[s] = self.game.getGameEnded(self.game_copy)
         if self.game_copy.ended or self.game_copy.turn > 180:
             # terminal node
             return -self.Es[s]
@@ -98,7 +98,7 @@ def search(self, state, create_copy):
         if s not in self.Ps:
             # leaf node
             self.Ps[s], v = self.nnet.predict(state)
-            valids = self.game.getValidMoves(1, self.game_copy)
+            valids = self.game.getValidMoves(self.game_copy)
             self.Ps[s] = self.Ps[s]*valids      # masking invalid moves
             sum_Ps_s = np.sum(self.Ps[s])
             if sum_Ps_s > 0:
@@ -136,7 +136,7 @@ def search(self, state, create_copy):
         a = best_act
 
         next_s, next_player = self.game.getNextState(1, a, self.game_copy)
-        next_s = self.game.getState(next_player, self.game_copy)
+        next_s = self.game.getState(self.game_copy)
         if not self.game_copy.ended:
             v = self.search(next_s, create_copy=False) #call recursively
         else:
diff --git a/alphabot/pit.py b/alphabot/pit.py
index ff7b786..ffefd08 100644
--- a/alphabot/pit.py
+++ b/alphabot/pit.py
@@ -16,7 +16,7 @@ def __init__(self, game):
 
     def play(self, game_instance):
         agent = game_instance.current_player
-        choices = np.argwhere(self.game.getValidMoves(agent, game_instance) == 1)
+        choices = np.argwhere(self.game.getValidMoves(game_instance) == 1)
         return random.choice(choices)