이제 머신러닝으로 게임을 구현해 보자.
학습 데이터가 5만 이상 되어야 하는데 2만개 정도만 학습 시켰다.
최적화 이동 처리 함수와 믹스해서 구현해 보았다.
3x3일 경우 막지 않았다.
나중에 그 부분은 업데이트 하도록 하겠다.
#
# FIAR
# Created by netcanis on 2023/10/29.
#
# minimax
# alpha beta pruning
# 속도 개선
# 훈련데이터 생성하여 머신러닝.
import pygame
import random
import numpy as np
import sys
import os
import tensorflow as tf
from keras.models import load_model
BOARD_SIZE = 9 # (7,9,13,15,19)
CELL_SIZE = 40
MARGIN = 20
CLICK_RADIUS = CELL_SIZE // 2
BLACK = (0, 0, 0)
WHITE = (255, 255, 255)
RED = (255, 0, 0)
GRAY = (100, 100, 100)
NUM_ITEMS = (BOARD_SIZE * BOARD_SIZE)
PLAYER = 1
AI = -1
DIFFICULTY_LEVEL_AI = 4
PLAYER_MODE = "MANUAL"
AI_MODE = "ML"
H5_FILE_NAME = "fiar_model.h5"
class FIAR:
def __init__(self):
self.init_game()
def init_game(self):
self.episode = 0
pygame.init()
pygame.display.set_caption("FIAR")
w = (BOARD_SIZE-1) * CELL_SIZE + 2 * MARGIN
h = (BOARD_SIZE-1) * CELL_SIZE + 2 * MARGIN
self.screen = pygame.display.set_mode((w, h))
self.font = pygame.font.Font(None, CELL_SIZE-4)
def reset_game(self):
self.board = np.zeros((BOARD_SIZE, BOARD_SIZE), dtype=int)
self.sequences = np.zeros((BOARD_SIZE, BOARD_SIZE), dtype=int)
self.sequence = 0
self.game_over = False
self.turn_player = PLAYER#random.choice([PLAYER, AI])
self.draw_board(self.screen)
pygame.display.flip()
self.model = load_model(H5_FILE_NAME)
def find_empty_cells(self):
empty_cells = []
for row in range(BOARD_SIZE):
for col in range(BOARD_SIZE):
if self.board[row][col] == 0:
empty_cells.append((row, col))
random.shuffle(empty_cells)
return empty_cells
def find_adjacent_empty_cells(self):
empty_cells = []
empty_cells2 = []
for row, col in self.find_empty_cells():
for dr in [-1, 0, 1]:
for dc in [-1, 0, 1]:
new_row, new_col = row + dr, col + dc
if 0 <= new_row < BOARD_SIZE and 0 <= new_col < BOARD_SIZE and self.board[new_row][new_col] != 0:
# 수를 놓았을 경우 연결된 수가 3개 이상이고 5개를 놓을 수 있는 자리일 경우만 배열에 추가.
self.board[row][col] = self.turn_player
c1, c2, _ = self.evaluate_position(self.board, row, col)
self.board[row][col] = -self.turn_player
c3, c4, _ = self.evaluate_position(self.board, row, col)
self.board[row][col] = 0
if (c1 >= 3 and c2 >= 5) or (c3 >= 3 and c4 >= 5):
empty_cells2.append((row, col))
empty_cells.append((row, col))
break
if len(empty_cells2) > 0:
return empty_cells2
return empty_cells
def evaluate_position(self, board, row, col):
def check_direction(dx, dy):
count = 1
r, c = row + dx, col + dy
while 0 <= r < len(board) and 0 <= c < len(board[0]) and board[r][c] == board[row][col]:
count += 1
r += dx
c += dy
return count
def check_direction_with_blank(dx, dy):
count = 1 # 빈자리 포함 총자리 수
r, c = row + dx, col + dy
while 0 <= r < len(board) and 0 <= c < len(board[0]) and (board[r][c] == board[row][col] or board[r][c] == 0):
count += 1
r += dx
c += dy
return count
total_count1 = 0
total_count2 = 0
total_score = 0
directions = [(0, 1), (1, 0), (1, 1), (-1, 1)]
for dx, dy in directions:
count1 = check_direction( dx, dy)
count2 = check_direction(-dx, -dy)
dir_count1 = count1 + count2 - 1
count3 = check_direction_with_blank( dx, dy)
count4 = check_direction_with_blank(-dx, -dy)
dir_count2 = count3 + count4 - 1
total_count1 = max(total_count1, dir_count1)
total_count2 = max(total_count2, dir_count2)
# 각 방향별로 연결된 돌의 수가 3자리 이상이고 5개이상 놓을 수 있는 자리라면 점수를 추가한다.
# 즉, 연결되는 돌이 교차하는 위치라면 점수가 높게 나온다.
if dir_count1 == 4 and dir_count2 >= 5:
total_score += dir_count1 * 4
elif dir_count1 >= 3 and dir_count2 >= 5:
total_score += dir_count1 * 2
elif dir_count1 >= 2 and dir_count2 >= 5:
total_score += dir_count1
return total_count1, total_count2, total_score
def check_winner(self, board, row, col):
if board[row][col] == 0:
return False
def check_direction(dx, dy):
count = 1
r, c = row + dx, col + dy
while 0 <= r < len(board) and 0 <= c < len(board[0]) and board[r][c] == board[row][col]:
count += 1
r += dx
c += dy
return count
directions = [(0, 1), (1, 0), (1, 1), (-1, 1)]
for dx, dy in directions:
count1 = check_direction(dx, dy)
count2 = check_direction(-dx, -dy)
total_count = count1 + count2 - 1
if total_count == 5:
return True
return False
def is_board_full(self, board):
return all(cell != 0 for row in board for cell in row)
def random_move(self, player):
if self.game_over:
return -1, -1
best_move = None
best_score = 0
best_move = self.make_optimal_move(player)
if best_move == None:
if player == AI:
empty_cells = self.find_adjacent_empty_cells()
for row, col in empty_cells:
self.board[row][col] = player
s1 = self.evaluate_position(self.board, row, col)[2]
if s1 > best_score:
best_score = s1
best_move = (row, col)
self.board[row][col] = -player
s2 = self.evaluate_position(self.board, row, col)[2]
if s2 > best_score:
best_score = s2
best_move = (row, col)
self.board[row][col] = 0
if best_score == 0:
best_move = random.choice(self.find_empty_cells())
else:
best_move = random.choice(self.find_empty_cells())
self.make_move(best_move[0], best_move[1], player)
return best_move
def minimax_move(self, player):
if self.game_over:
return -1, -1
row, col = self.find_best_move(player)
self.make_move(row, col, player)
return row, col
def make_move(self, row, col, player):
if self.board[row][col] == 0:
self.board[row][col] = player
self.sequence += 1
self.sequences[row][col] = self.sequence
#print(f"[{self.sequence}] <{player}> {row},{col}")
if self.check_winner(self.board, row, col):
self.game_over = True
elif self.is_board_full(self.board):
self.game_over = True
self.turn_player = 0
else:
self.turn_player *= -1
def minimax(self, depth, is_maximizing, alpha, beta, row2, col2):
if self.is_board_full(self.board):
return 0
if is_maximizing:
if self.check_winner(self.board, row2, col2):
return -(NUM_ITEMS - depth + 1)
else:
if self.check_winner(self.board, row2, col2):
return (NUM_ITEMS - depth + 1)
if depth >= DIFFICULTY_LEVEL_AI:
return 0
if is_maximizing:# AI
best_score = -float('inf')
for row, col in self.find_adjacent_empty_cells():
self.board[row][col] = AI
score = self.minimax(depth + 1, False, alpha, beta, row, col)
self.board[row][col] = 0
best_score = max(best_score, score)
alpha = max(alpha, best_score)
if beta <= alpha:
break
return best_score
else:
best_score = float('inf')
for row, col in self.find_adjacent_empty_cells():
self.board[row][col] = PLAYER
score = self.minimax(depth + 1, True, alpha, beta, row, col)
self.board[row][col] = 0
best_score = min(best_score, score)
beta = min(beta, best_score)
if beta <= alpha:
break
return best_score
def make_optimal_move(self, player):
# 0. The first one is random.
if self.sequence == 0:
row = BOARD_SIZE // 2 + random.randint(-2, 2)
col = BOARD_SIZE // 2 + random.randint(-2, 2)
return (row, col)
empty_cells = self.find_adjacent_empty_cells()
# 1. ai turn: 5
for row, col in empty_cells:
self.board[row][col] = player
if self.check_winner(self.board, row, col):
self.board[row][col] = 0
return (row, col)
self.board[row][col] = 0
# 2. player turn: 5
for row, col in empty_cells:
self.board[row][col] = -player
if self.check_winner(self.board, row, col):
self.board[row][col] = 0
return (row, col)
self.board[row][col] = 0
# 3. The position that becomes 4 when placed
for row, col in empty_cells:
self.board[row][col] = player
c1, c2, _ = self.evaluate_position(self.board, row, col)
self.board[row][col] = -player
c3, c4, _ = self.evaluate_position(self.board, row, col)
self.board[row][col] = 0
if (c1 == 4 and c2 >= 5) or (c3 == 4 and c4 >= 5):
return (row, col)
# 4. The position that becomes 3 when placed
for row, col in empty_cells:
self.board[row][col] = player
c1, c2, _ = self.evaluate_position(self.board, row, col)
self.board[row][col] = -player
c3, c4, _ = self.evaluate_position(self.board, row, col)
self.board[row][col] = 0
if (c1 == 3 and c2 >= 5) or (c3 == 3 and c4 >= 5):
return (row, col)
return None
def find_best_move(self, player):
if AI_MODE == "ML":
optimal_move = self.make_optimal_move(player)
if optimal_move != None:
print(f"optimal move! ({optimal_move[0]}, {optimal_move[1]})")
return optimal_move
move_index = self.predicts(self.board)
row = move_index // BOARD_SIZE
col = move_index % BOARD_SIZE
best_move = (row, col)
print(f"ML move! ({row}, {col})")
elif AI_MODE == "RANDOM":
best_move = self.random_move(player)
else: # MINIMAX
print(f"[{self.sequence+1}] <{player}> ...")
optimal_move = self.make_optimal_move(player)
if optimal_move != None:
return optimal_move
alpha = -float('inf')
beta = float('inf')
best_move = None
best_score = -float('inf') if player == AI else float('inf')
empty_cells = self.find_adjacent_empty_cells()
for index, (row, col) in enumerate(empty_cells):
self.board[row][col] = player
is_maximizing = False if player == AI else True
score = self.minimax(0, is_maximizing, alpha, beta, row, col)
self.board[row][col] = 0
if (player == AI and score > best_score) or (player == PLAYER and score < best_score):
best_score = score
best_move = (row, col)
percentage = (index / len(empty_cells)) * 100
print(f" [{percentage:.1f}%] <{player}> {row},{col} -> {score}")
print(f" {best_move[0]},{best_move[1]} ({best_score})")
return best_move
def show_message(self, message, is_exit=False):
popup = True
while popup:
for event in pygame.event.get():
if event.type == pygame.QUIT:
pygame.quit()
sys.exit()
if event.type == pygame.KEYDOWN:
if is_exit:
if event.key == pygame.K_y:
self.reset_game()
popup = False
return
elif event.key == pygame.K_n:
pygame.quit()
sys.exit()
else:
popup = False
message = ""
self.draw_board(self.screen)
break
text_lines = message.split('\n')
for i, line in enumerate(text_lines):
text = self.font.render(line, True, (128, 0, 128))
text_rect = text.get_rect(topleft=(20, 20 + i * 20))
self.screen.blit(text, text_rect)
pygame.display.flip()
def draw_board(self, screen):
screen.fill(GRAY)
for row in range(BOARD_SIZE):# draw horizontal lines
pygame.draw.line(screen, BLACK,
(0 * CELL_SIZE + MARGIN, row * CELL_SIZE + MARGIN),
((BOARD_SIZE-1) * CELL_SIZE + MARGIN, row * CELL_SIZE + MARGIN),
1)
for col in range(BOARD_SIZE):# draw vertical lines
if row == 0:
pygame.draw.line(screen, BLACK,
(col * CELL_SIZE + MARGIN, 0 * CELL_SIZE + MARGIN),
(col * CELL_SIZE + MARGIN, (BOARD_SIZE-1) * CELL_SIZE + MARGIN),
1)
x = col * CELL_SIZE + MARGIN
y = row * CELL_SIZE + MARGIN
if self.board[row][col] == PLAYER:
pygame.draw.circle(screen, BLACK, (x, y), CLICK_RADIUS)
elif self.board[row][col] == AI:
pygame.draw.circle(screen, WHITE, (x, y), CLICK_RADIUS)
seq_no = self.sequences[row][col]
if seq_no != 0:
if seq_no == self.sequence:
pygame.draw.circle(screen, RED, (x, y), CLICK_RADIUS+1, 1)
color = WHITE if self.board[row][col] == PLAYER else BLACK
text = self.font.render(f"{seq_no}", True, color)
text_rect = text.get_rect(center=(x, y))
screen.blit(text, text_rect)
def handle_events(self):
for event in pygame.event.get():
if event.type == pygame.QUIT:
self.game_over = True
elif event.type == pygame.MOUSEBUTTONDOWN and not self.game_over and self.turn_player == PLAYER:
x, y = pygame.mouse.get_pos()
row = int(round((y - MARGIN) / CELL_SIZE))
col = int(round((x - MARGIN) / CELL_SIZE))
if 0 <= row < BOARD_SIZE and 0 <= col < BOARD_SIZE and self.board[row][col] == 0:
self.make_move(row, col, self.turn_player)
self.draw_board(self.screen)
pygame.display.flip()
if self.turn_player == AI:
best_move = self.find_best_move(self.turn_player)
if best_move is not None:
row, col = best_move
self.make_move(row, col, self.turn_player)
self.draw_board(self.screen)
pygame.display.flip()
if self.game_over == True:
if self.turn_player == 0:
self.show_message("Game draw!")
else:
self.show_message(f"Game Over!\n{'Player' if self.turn_player == PLAYER else 'AI'} wins!")
def init_ML(self):
hidden_layer_count = 3 * NUM_ITEMS
self.model = tf.keras.Sequential([
tf.keras.layers.Dense(hidden_layer_count, activation='relu', input_shape=(NUM_ITEMS,)),
tf.keras.layers.Dense(NUM_ITEMS, activation='softmax')
])
self.model.compile(loss='categorical_crossentropy', optimizer='adam', metrics=['accuracy'])
def predicts(self, input_data):
if isinstance(input_data, list):
input_data = np.array(input_data)
prediction = self.model.predict(input_data.reshape(1, -1))
sorted_indices = np.argsort(prediction, axis=-1)[:, ::-1]
index = 0
for i in sorted_indices[0]:
if input_data.shape == (NUM_ITEMS,):
if input_data[i] == 0:
index = i
break
elif input_data.shape == (BOARD_SIZE, BOARD_SIZE):
row = i // BOARD_SIZE
col = i % BOARD_SIZE
if input_data[row][col] == 0:
index = i
break
return index
if __name__ == "__main__":
game = FIAR()
game.init_ML()
game.reset_game()
while True:
while not game.game_over:
game.handle_events()
game.show_message("Play Again? (y/n)", is_exit=True)
2023.10.27 - [AI,ML, Algorithm] - Gomoku(Five in a Row, Omok) (2/5) - 속도 최적화 1차 (minimax 속도 개선)
2023.10.28 - [AI,ML, Algorithm] - Gomoku(Five in a Row, Omok) (3/5) - 속도 최적화 2차 (RANDOM모드 추가)
2023.10.29 - [AI,ML, Algorithm] - Gomoku(Five in a Row, Omok) (4/5) - 훈련 데이터 생성 및 학습
2023.10.29 - [AI,ML, Algorithm] - Gomoku(Five in a Row, Omok) (5/5) - 머신러닝으로 게임 구현
2023.11.03 - [AI,ML, Algorithm] - Gomoku(Five in a Row, Omok) (5/5) - 3x3 체크 추가
'개발 > AI,ML,ALGORITHM' 카테고리의 다른 글
A star (0) | 2023.12.27 |
---|---|
Gomoku(Five in a Row, Omok) (5/5) - 3x3 체크 추가 (0) | 2023.11.03 |
Gomoku(Five in a Row, Omok) (4/5) - 훈련 데이터 생성 및 학습 (1) | 2023.10.29 |
Gomoku(Five in a Row, Omok) (3/5) - 속도 최적화 2차 (RANDOM모드 추가) (1) | 2023.10.28 |
Gomoku(Five in a Row, Omok) (2/5) - 속도 최적화 1차 (minimax 속도 개선) (0) | 2023.10.27 |