view.py

import os
os.environ['TF_CPP_MIN_LOG_LEVEL'] = '3'
import holdem_model.table as table,  holdem_model.utils as utils
import tensorflow as tf
import  numpy as np
from tensorflow import keras

class View:
    model = None
    playerid = 0

    def __init__(self, model, playerid):
        self.model = model
        self.playerid = playerid

    def view_player_action(self, action):
        pass

    def view_hand_results(self):
        pass

    def view_cards(self):
        pass


class AgentView(View):
    model = None
    playerid = 0
    states = []
    history = []
    card_model = None
    action_model = None
    action_count = -1
    training_actions = []

    def __init__(self, model, playerid):
        self.model = model
        self.playerid = playerid
        self.states = []
        self.history = [[0.0] * 168] * 20
        self.card_model = tf.keras.models.load_model('./agent_models/card_model.h5')
        self.action_model = tf.keras.models.load_model('./agent_models/action_model.h5')


    def predict_cards(self, state, labels=None):
        # Given a state, predict what cards the opponent is holding
        example = [[x[52:] for x in state]]
        pred = self.card_model.predict(example)
        return(pred.tolist()[0])


    def predict_action(self, state, labels=None):
        # Given a state, predict the opponent's next action
        example = [[x[:52] + x[104:-3] for x in state]]
        pred = self.action_model.predict(example)
        return(pred.tolist()[0])
        

    def view_player_action(self, action, prev_state):
        """
        History is a 168 x 20 nested array that is used to generate states.
        States is a 1d-20d array of 168 x 20 states (will be made into tensors)
            NOTE- Each state includes the history of the hand until that point.
            Actions past the 20th in a hand are ignored. 
            This is fine since 99%+ hands have fewer than 20 states.
        predict_opponent_cards
            input: 116x20 (state[52:])
            (state, not including predicted cards)
            output: 52x1 (predicted cards)
        predict_fold_chance
            input: 113x20  (state[:52] + state[104:-3]) 
            (state, not including your cards and their action)
            output: 1x1 (predicted fold chance)
        """

        self.action_count += 1

        # Dont train if player1. For agent v agent training.
        if self.playerid or self.action_count == 20:
            return

        # Predicted opponent's cards - idx 51
        fake_pred = [0.0 for _ in range(52)]

        # Own cards - idx 103
        state = utils.hand_to_vec(self.model.players[self.playerid]['hand']) 

        # Community cards - idx 155
        state += utils.hand_to_vec(self.model.community_cards)

        # Round of betting - idx 156
        if not self.model.community_cards:
            state.append(0.0)
        else:
            for i in range(3,6):
                if len(self.model.community_cards) == i:
                    state.append(float(i - 2))
                    break

        # Position index 157
        state.append(float(self.model.players[self.playerid]['position']))

        # to_call, min & max bet, pot, stacks. index 163
        if self.playerid:
            prev_state = prev_state[:-2] + [prev_state[-1], prev_state[-2]]
        state += [float(x) for x in prev_state]

        # Whether it was just the opponent's turn. index 164
        state.append(float(self.model.active_player==self.playerid))

        # Action idx 167
        action = min(action, 2)
        state += [float(x == action) for x in range(3)]
        state = fake_pred + state

        # Set history

        temp_history = self.history
        temp_history[len(self.states)] = state

        state = self.predict_cards(temp_history) + state[52:]
        self.history[len(self.states)] = state

        # If it was opponent's action, add to training examples
        if state[164]:
            self.states.append(self.history)
            self.training_actions.append(self.action_count)


    def view_hand_results(self, result=None):
        card_examples = []
        action_examples = []
        action_labels = []

        # Get training examples
        for i in range(len(self.states)):
            card_examples.append([s[52:] for s in self.states[i]])
            action_examples.append([s[:52] + s[104:-3] for s in self.states[i]])
            action_labels.append(self.states[i][self.training_actions[i]][-3:])
        
        # Get opponent's actual cards
        if result:
            opp_hand = utils.hand_to_vec(result[4 - self.playerid])
        else:
            opp_hand = utils.hand_to_vec(self.model.players[1 - self.playerid]['hand'])

        card_labels = [opp_hand for _ in range(len(card_examples))]


        for i in range(len(card_examples)):
            # Train opponent's hand predictor
            self.card_model.fit([card_examples[i]], [card_labels[i]], epochs = 1, batch_size = 1, verbose = 0)
            # Train action predictor
            self.action_model.fit([action_examples[i]], [action_labels[i]], epochs = 1, batch_size = 1, verbose = 0)

        # Remove history of hand
        self.states = []
        self.history = [[0.0] * 168] * 20
        self.action_count = -1
        self.training_actions = []


    def end_game(self, pid):
        print("saving model")
        if not self.playerid:
            self.card_model.save('./agent_models/card_model.h5')
            self.action_model.save('./agent_models/action_model.h5')


class UIView(View):
    model = None
    playerid = 0

    def view_cards(self):
        if not self.model.community_cards:
            print("\nRound: Preflop")
            if self.model.players[self.playerid]['position']:
                print("You are the big blind ({})".format(self.model.blinds[1]))
            else:
                print("You are the little blind ({})".format(self.model.blinds[0]))
        
        elif len(self.model.community_cards) == 3:
            print("\nRound: Flop")
        
        elif len(self.model.community_cards) == 4:
            print("\nRound: Turn")

        elif len(self.model.community_cards) == 5:
            print("\nRound: River")

        else:
            print("Error!")

        hand = self.model.players[self.playerid]['hand']
        print('Hand: ' + ' '.join([utils.card_to_string(card) for card in hand]))

        print('Community: ' + ' '.join([utils.card_to_string(card) for card in self.model.community_cards]))    
        best = utils.get_rank(self.playerid, hand, self.model.community_cards)   
        print("The best hand you currently have is {}".format(utils.hand_to_string(best[1])))


    def view_chips(self):
        c1 = self.model.players[self.playerid]['chips']
        c2 = self.model.players[1 - self.playerid]['chips']

        if self.model.players[self.playerid]['position']:
            blind = 'big'
            b = self.model.blinds[1]
        else:
             blind = 'little'
             b = self.model.blinds[0]

        print("Pot: {}. The current bet is {}.".format(self.model.pot, self.model.to_call))
        if c2:
            print("You have {} chips. Opponent has {}.".format(c1,c2))
        else:
            print("You have {} chips. Opponent is all-in.".format(c1))
        print("You are the {} blind ({})".format(blind, b))


    def view_hand_results(self, result=None):
        if result:
            print("\nRound: Showdown")
            print('Community cards: ' + ' '.join([utils.card_to_string(card) for card in result[4]]))
            print('Your cards: ' + ' '.join([utils.card_to_string(card) for card in result[2]]))
            print("Opponent's cards: " + ' '.join([utils.card_to_string(card) for card in result[3]]))

        if not result:
            if self.model.active_player == self.playerid:
                print("Your opponent folded. You win the pot of {}".format(self.model.pot))
            else:
                print("You folded. Your opponent wins the pot of {}".format(self.model.pot))
                
        elif len(result) == 7:
            loser = utils.hand_to_string(result[0][1])
            winner = utils.hand_to_string(result[1][1])
            if result[6] == self.playerid:
                print("You have {} and your opponent has {}. You win the pot of {}".format(winner,loser, result[5]))
            else:
                print("You have {} and your opponent has {}. Your opponent wins the pot of {}".format(loser,winner, result[5]))
        else:
            print("You and your opponent each have {} and split the pot of {}".format(utils.hand_to_string(result[0][1]),
             result[5]))


    def view_player_action(self, action, prev_state):
        actions = ['folds', 'checks', 'calls', 'raises by']
        you = ' (You)' if self.model.active_player != self.playerid else ''
        if action < 3:
            print("Player {}{} {}.".format(1 - self.model.active_player, you, actions[action]))
        else:
            print("Player {}{} {} {}.".format(1 - self.model.active_player, you, actions[action], self.model.to_call))
        

    def end_game(self, pid):
        if pid == self.playerid:
            print("You win!")
        else:
            print("You lose!")

    
    def view_history(self):
        pass