python/alphaBeta.py


1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148

# import MCTS
import math
from copy import deepcopy
from time import clock
from random import choice

from GameState import GameState

class Algo: # A class for defining algorithms used (minimax and alpha-beta pruning)
    
    def miniMax(State, Ply_num): # Function for the minimax algorithm

        for i in range(State.Current.dimY):
            for j in range(State.Current.dimX):
                if State.Current.Mat[i][j] == ' ' and (j, i) not in State.children:
                    State.Make(j, i, True)
                    if Ply_num < 2:
                        return (i, j)

        Minimum_Score = 1000
        i = 0

        
        j = 0
        for k, z in State.children.items():
            Result = Algo.Maximum(z, Ply_num - 1, Minimum_Score)
            if Minimum_Score > Result:
                Minimum_Score = Result
                i = k[0]
                j = k[1]

        return (i, j)


    def Maximum(State, Ply_num, Alpha): # Alpha-beta pruning function for taking care of Alpha values
        if Ply_num == 0:
            return State.CurrentScore

        for i in range(State.Current.dimY):
            for j in range(State.Current.dimX):
                if State.Current.Mat[i][j] == ' ' and (j, i) not in State.children:
                    State.Make(j, i, False)

        Maximum_Score = -1000
        i = 0
        j = 0
        for k, z in State.children.items():
            Result = Algo.Minimum(z, Ply_num - 1, Maximum_Score)
            if Maximum_Score < Result:
                Maximum_Score = Result
            if Result > Alpha:
                return Result

        return Maximum_Score


    def Minimum(State, Ply_num, Beta): # Alpha-beta pruning function for taking care of Beta values
        if Ply_num == 0:
            return State.CurrentScore

        for i in range(State.Current.dimY):
            for j in range(State.Current.dimX):
                if State.Current.Mat[i][j] == ' ' and (j, i) not in State.children:
                    State.Make(j, i, True)

        Minimum_Score = 1000
        i = 0
        j = 0
        for k, z in State.children.items():
            Result = Algo.Maximum(z, Ply_num - 1, Minimum_Score)
            if Minimum_Score > Result:
                Minimum_Score = Result
            if Result < Beta:
                return Result

        return Minimum_Score

# class MCTSNode(object):
#     """Monte Carlo Tree Node.
#     Each node encapsulates a particular game state, the moves that
#     are possible from that state and the strategic information accumulated
#     by the tree search as it progressively samples the game space.
#     """

#     def __init__(self, state, parent=None, move=None):
#         self.parent = parent
#         self.move = move
#         self.state = state

#         self.plays = 0
#         self.score = 0

#         self.pending_moves = state.get_moves()
#         self.children = []

#     def select_child_ucb(self):
#         # Note that each node's plays count is equal
#         # to the sum of its children's plays
#         def ucb(child):
#             win_ratio = child.score / child.plays \
#                         + math.sqrt(2 * math.log(self.plays) / child.plays)
#             return win_ratio

#         return max(self.children, key=ucb)

#     def expand_move(self, move):
#         self.pending_moves.remove(move)  # raises KeyError

#         child_state = deepcopy(self.state)
#         child_state.play_move(move)

#         child = MCTSNode(state=child_state, parent=self, move=move)
#         self.children.append(child)
#         return child

#     def get_score(self, result):
#         # return result
#         if result == 0.5:
#             return result

#         if self.state.player == 2:
#             if self.state.next_turn_player == result:
#                 return 0.0
#             else:
#                 return 1.0
#         else:
#             if self.state.next_turn_player == result:
#                 return 1.0
#             else:
#                 return 0.0

#         if self.state.next_turn_player == result:
#             return 0.0
#         else:
#             return 1.0

#     def __repr__(self):
#         s = 'ROOT\n' if self.parent is None else ''

#         children_moves = [c.move for c in self.children]

#         s += """Score ratio: {score} / {plays}
# Pending moves: {pending_moves}
# Children's moves: {children_moves}
# State:
# {state}\n""".format(children_moves=children_moves, **self.__dict__)

#         return s