27_game_theory.py

  1"""
  2게임 이론 (Game Theory)
  3Game Theory Algorithms
  4
  5조합 게임 이론과 최적 전략을 다루는 알고리즘입니다.
  6"""
  7
  8from typing import List, Dict, Tuple, Set, Optional
  9from functools import lru_cache
 10
 11
 12# =============================================================================
 13# 1. 님 게임 (Nim Game)
 14# =============================================================================
 15
 16def nim_xor(piles: List[int]) -> int:
 17    """
 18    님 게임의 XOR 값 (Nim-sum)
 19    XOR != 0이면 선공 승리, XOR == 0이면 후공 승리
 20    """
 21    result = 0
 22    for pile in piles:
 23        result ^= pile
 24    return result
 25
 26
 27def nim_winning_move(piles: List[int]) -> Optional[Tuple[int, int]]:
 28    """
 29    님 게임에서 승리하는 수 찾기
 30    반환: (더미 인덱스, 남길 개수) 또는 None
 31    """
 32    xor = nim_xor(piles)
 33
 34    if xor == 0:
 35        return None  # 패배 상태, 승리 수 없음
 36
 37    for i, pile in enumerate(piles):
 38        target = pile ^ xor
 39        if target < pile:
 40            return (i, target)  # pile에서 target개만 남기기
 41
 42    return None
 43
 44
 45def nim_game_simulation(piles: List[int], verbose: bool = False) -> int:
 46    """
 47    님 게임 시뮬레이션
 48    반환: 승자 (0: 선공, 1: 후공)
 49    """
 50    current = 0  # 현재 플레이어
 51
 52    while max(piles) > 0:
 53        move = nim_winning_move(piles)
 54
 55        if move is None:
 56            # 패배 상태: 아무 수나
 57            for i, pile in enumerate(piles):
 58                if pile > 0:
 59                    move = (i, pile - 1)
 60                    break
 61
 62        pile_idx, new_count = move
 63        if verbose:
 64            print(f"    Player {current}: 더미 {pile_idx}에서 {piles[pile_idx]}→{new_count}")
 65
 66        piles[pile_idx] = new_count
 67        current = 1 - current
 68
 69    return 1 - current  # 마지막에 가져간 사람이 승리
 70
 71
 72# =============================================================================
 73# 2. 스프라그-그런디 정리 (Sprague-Grundy Theorem)
 74# =============================================================================
 75
 76def mex(s: Set[int]) -> int:
 77    """
 78    Minimum Excludant
 79    집합에 없는 가장 작은 음이 아닌 정수
 80    """
 81    i = 0
 82    while i in s:
 83        i += 1
 84    return i
 85
 86
 87def calculate_grundy(position: int, moves: List[int], memo: Dict[int, int] = None) -> int:
 88    """
 89    스프라그-그런디 수 계산
 90    position: 현재 상태 (예: 돌의 개수)
 91    moves: 가능한 이동량 리스트
 92    """
 93    if memo is None:
 94        memo = {}
 95
 96    if position in memo:
 97        return memo[position]
 98
 99    if position == 0:
100        memo[position] = 0
101        return 0
102
103    reachable = set()
104    for move in moves:
105        if position >= move:
106            reachable.add(calculate_grundy(position - move, moves, memo))
107
108    result = mex(reachable)
109    memo[position] = result
110    return result
111
112
def multi_pile_grundy(piles: List[int], moves: List[int]) -> int:
    """
    Grundy number of a game made of several independent piles.

    The result is the XOR of each pile's Grundy number under the same move
    set; one memo dict is shared across all piles.
    """
    shared_memo = {}
    combined = 0

    for stones in piles:
        combined ^= calculate_grundy(stones, moves, shared_memo)

    return combined
126
127
128# =============================================================================
129# 3. 변형 님 게임
130# =============================================================================
131
def staircase_nim(stairs: List[int]) -> int:
    """
    Staircase Nim: XOR of the stone counts on the odd-numbered stairs.

    ``stairs[0]`` is treated as stair 1, so the odd-numbered stairs are the
    even 0-based indices.
    """
    nim_sum = 0
    for stones in stairs[::2]:  # stairs 1, 3, 5, ...
        nim_sum ^= stones
    return nim_sum
141
142
def misere_nim(piles: List[int]) -> bool:
    """
    Misere Nim (the player who takes the last stone loses).

    Returns:
        True if the first player wins.
    """
    nim_sum = nim_xor(piles)

    if any(stones > 1 for stones in piles):
        # At least one pile larger than 1: same rule as normal Nim.
        return nim_sum != 0

    # Only piles of size 0 or 1 remain: an odd number of single-stone piles
    # means the second player wins.
    single_stone_piles = sum(1 for stones in piles if stones == 1)
    return single_stone_piles % 2 == 0
157
158
def poker_nim(piles: List[int], k: int) -> bool:
    """
    Poker Nim: a player may also add stones to a pile (at most ``k``).

    The outcome is decided exactly as in ordinary Nim, so ``k`` is not used.

    Returns:
        True if the first player wins, i.e. the Nim-sum is non-zero.
    """
    nim_sum = nim_xor(piles)
    return nim_sum != 0
166
167
168# =============================================================================
169# 4. 미니맥스 알고리즘 (Minimax)
170# =============================================================================
171
def minimax(position, depth: int, is_maximizing: bool,
            evaluate, get_moves, is_terminal, apply_move_fn=None) -> int:
    """
    Generic depth-limited minimax search.

    Args:
        position: Current game state.
        depth: Remaining search depth; at 0 the position is scored as is.
        is_maximizing: True when it is the maximizing player's turn.
        evaluate: ``evaluate(position)`` -> score of a state.
        get_moves: ``get_moves(position)`` -> iterable of legal moves.
        is_terminal: ``is_terminal(position)`` -> True when the game is over.
        apply_move_fn: ``apply_move_fn(position, move)`` -> resulting state.
            Defaults to the module-level ``apply_move``, which is only a
            placeholder, so real games should pass their own function.

    Returns:
        The minimax value of ``position``. If a non-terminal position has
        no moves, the result is ``float('-inf')`` for the maximizer and
        ``float('inf')`` for the minimizer.
    """
    if depth == 0 or is_terminal(position):
        return evaluate(position)

    if apply_move_fn is None:
        apply_move_fn = apply_move  # backward-compatible default

    moves = get_moves(position)

    if is_maximizing:
        max_eval = float('-inf')
        for move in moves:
            new_position = apply_move_fn(position, move)
            eval_score = minimax(new_position, depth - 1, False,
                                 evaluate, get_moves, is_terminal,
                                 apply_move_fn)
            max_eval = max(max_eval, eval_score)
        return max_eval

    min_eval = float('inf')
    for move in moves:
        new_position = apply_move_fn(position, move)
        eval_score = minimax(new_position, depth - 1, True,
                             evaluate, get_moves, is_terminal,
                             apply_move_fn)
        min_eval = min(min_eval, eval_score)
    return min_eval
204
205
def apply_move(position, move):
    """Return the state after applying ``move`` (abstract placeholder; returns None)."""
    # The real implementation depends on the concrete game.
    return None
210
211
212# =============================================================================
213# 5. 알파-베타 가지치기 (Alpha-Beta Pruning)
214# =============================================================================
215
def alpha_beta(position, depth: int, alpha: float, beta: float,
               is_maximizing: bool, evaluate, get_moves, is_terminal,
               apply_move_fn=None) -> int:
    """
    Minimax search with alpha-beta pruning.

    Args:
        position: Current game state.
        depth: Remaining search depth; at 0 the position is scored as is.
        alpha: Best value the maximizing player can already guarantee.
        beta: Best value the minimizing player can already guarantee.
        is_maximizing: True when it is the maximizing player's turn.
        evaluate: ``evaluate(position)`` -> score of a state.
        get_moves: ``get_moves(position)`` -> iterable of legal moves.
        is_terminal: ``is_terminal(position)`` -> True when the game is over.
        apply_move_fn: ``apply_move_fn(position, move)`` -> resulting state.
            Defaults to the module-level ``apply_move``, which is only a
            placeholder, so real games should pass their own function.

    Returns:
        The value of ``position`` found within the ``(alpha, beta)`` window.
    """
    if depth == 0 or is_terminal(position):
        return evaluate(position)

    if apply_move_fn is None:
        apply_move_fn = apply_move  # backward-compatible default

    moves = get_moves(position)

    if is_maximizing:
        max_eval = float('-inf')
        for move in moves:
            new_position = apply_move_fn(position, move)
            eval_score = alpha_beta(new_position, depth - 1, alpha, beta,
                                    False, evaluate, get_moves, is_terminal,
                                    apply_move_fn)
            max_eval = max(max_eval, eval_score)
            alpha = max(alpha, eval_score)
            if beta <= alpha:
                break  # prune: the minimizer already has a better option
        return max_eval

    min_eval = float('inf')
    for move in moves:
        new_position = apply_move_fn(position, move)
        eval_score = alpha_beta(new_position, depth - 1, alpha, beta,
                                True, evaluate, get_moves, is_terminal,
                                apply_move_fn)
        min_eval = min(min_eval, eval_score)
        beta = min(beta, eval_score)
        if beta <= alpha:
            break  # prune: the maximizer already has a better option
    return min_eval
250
251
252# =============================================================================
253# 6. 틱택토 (Tic-Tac-Toe) 구현
254# =============================================================================
255
class TicTacToe:
    """Tic-tac-toe position with an exhaustive minimax solver.

    ``board`` is a 3x3 grid holding 'X', 'O' or ' ' (empty);
    ``current_player`` is the mark that moves next.
    """

    def __init__(self):
        self.board = [[' ' for _ in range(3)] for _ in range(3)]
        self.current_player = 'X'

    def _swap_player(self):
        """Hand the turn to the other mark."""
        self.current_player = 'O' if self.current_player == 'X' else 'X'

    def _lines(self):
        """Yield every line as a triple of cells: rows, columns, then diagonals."""
        grid = self.board
        for cells in grid:
            yield cells[0], cells[1], cells[2]
        for c in range(3):
            yield grid[0][c], grid[1][c], grid[2][c]
        yield grid[0][0], grid[1][1], grid[2][2]
        yield grid[0][2], grid[1][1], grid[2][0]

    def get_moves(self) -> List[Tuple[int, int]]:
        """Return the empty cells as (row, col) pairs in row-major order."""
        return [
            (r, c)
            for r in range(3)
            for c in range(3)
            if self.board[r][c] == ' '
        ]

    def make_move(self, row: int, col: int) -> bool:
        """Place the current player's mark; return False if the cell is taken."""
        if self.board[row][col] == ' ':
            self.board[row][col] = self.current_player
            self._swap_player()
            return True
        return False

    def undo_move(self, row: int, col: int):
        """Clear the cell and give the turn back to the previous player."""
        self.board[row][col] = ' '
        self._swap_player()

    def check_winner(self) -> Optional[str]:
        """Return the mark that owns a complete line, or None."""
        for first, second, third in self._lines():
            if first == second == third != ' ':
                return first
        return None

    def is_terminal(self) -> bool:
        """Return True when someone has won or the board is full."""
        if self.check_winner() is not None:
            return True
        return not self.get_moves()

    def evaluate(self) -> int:
        """Score the position from X's point of view: 10, -10, or 0."""
        return {'X': 10, 'O': -10}.get(self.check_winner(), 0)

    def minimax(self, is_maximizing: bool) -> int:
        """Exhaustively search the game tree and return its minimax value."""
        if self.is_terminal():
            return self.evaluate()

        # X maximizes, O minimizes; only the fold and its seed differ.
        pick = max if is_maximizing else min
        best = float('-inf') if is_maximizing else float('inf')
        for row, col in self.get_moves():
            self.make_move(row, col)
            outcome = self.minimax(not is_maximizing)
            self.undo_move(row, col)
            best = pick(best, outcome)
        return best

    def best_move(self) -> Tuple[int, int]:
        """Return the best move for the current player (None if no cell is empty)."""
        chosen = None
        best_score = float('inf')
        if self.current_player == 'X':
            best_score = float('-inf')

        for row, col in self.get_moves():
            self.make_move(row, col)
            # make_move already switched sides, so this is the opponent's role.
            score = self.minimax(self.current_player == 'X')
            self.undo_move(row, col)

            if self.current_player == 'X':
                improves = score > best_score
            else:
                improves = score < best_score
            if improves:
                best_score, chosen = score, (row, col)

        return chosen

    def display(self):
        """Print the board."""
        separator = "    " + "-" * 9
        for idx, cells in enumerate(self.board):
            print("    " + " | ".join(cells))
            if idx < 2:
                print(separator)
364
365
366# =============================================================================
367# 7. 돌 게임 (Stone Game)
368# =============================================================================
369
@lru_cache(maxsize=None)
def stone_game_dp(piles: Tuple[int, ...], left: int, right: int) -> int:
    """
    Stone game where a player may only take a pile from either end.

    Args:
        piles: Pile values; must be hashable (a tuple) because results are
            cached per ``(piles, left, right)`` call.
        left: Index of the first pile still in play.
        right: Index of the last pile still in play.

    Returns:
        The best score difference (player to move minus opponent) over
        ``piles[left..right]``; 0 when ``left > right``.

    The interval DP runs bottom-up in a single list, so long rows of piles
    do not hit the recursion limit and each call adds only one cache entry.
    """
    if left > right:
        return 0

    values = [piles[i] for i in range(left, right + 1)]
    size = len(values)

    # best[i] is the optimal difference for the window starting at i with
    # the current length; length-1 windows are just the pile itself.
    best = list(values)
    for length in range(2, size + 1):
        for start in range(size - length + 1):
            # best[start + 1] and best[start] still hold the results for
            # the two windows that are one pile shorter.
            pick_left = values[start] - best[start + 1]
            pick_right = values[start + length - 1] - best[start]
            best[start] = max(pick_left, pick_right)

    return best[0]
385
386
def stone_game(piles: List[int]) -> bool:
    """
    Stone game: return True if the first player ends with a strictly higher score.
    """
    last = len(piles) - 1
    margin = stone_game_dp(tuple(piles), 0, last)
    return margin > 0
394
395
396# =============================================================================
397# 8. 바시 게임 (Bash Game)
398# =============================================================================
399
def bash_game(n: int, k: int) -> bool:
    """
    Bash game: ``n`` stones, each turn removes at most ``k`` of them.

    The player who takes the last stone wins.

    Returns:
        True if the first player wins, i.e. ``n`` is not a multiple of ``k + 1``.
    """
    leftover = n % (k + 1)
    return leftover != 0
407
408
def bash_game_optimal_move(n: int, k: int) -> int:
    """
    Return how many stones to take in the Bash game.

    Args:
        n: Stones remaining.
        k: Maximum number of stones that may be taken per turn.

    Returns:
        ``n % (k + 1)`` in a winning position, which leaves the opponent a
        multiple of ``k + 1``. In a losing position every move loses, so 1
        is returned. When no stones remain (``n <= 0``) there is no legal
        move and 0 is returned.
    """
    if n <= 0:
        return 0  # nothing left to take

    remainder = n % (k + 1)
    if remainder == 0:
        return 1  # losing position: any move will do
    return remainder
414
415
416# =============================================================================
417# 9. 위더프 게임 (Wythoff's Game)
418# =============================================================================
419
def wythoff_game(a: int, b: int) -> bool:
    """
    Wythoff's game: take any number from one pile, or the same number from both.

    The player who takes the last stone wins.

    Args:
        a: Size of the first pile (non-negative integer).
        b: Size of the second pile (non-negative integer).

    Returns:
        True if the first player wins.

    The losing positions are ``(floor(k * phi), floor(k * phi) + k)`` with
    ``phi`` the golden ratio. ``floor(k * phi)`` is computed exactly as
    ``(k + isqrt(5 * k * k)) // 2`` because a floating-point ``phi`` gives
    wrong answers for large piles.
    """
    from math import isqrt  # local import: the module does not import math

    if a > b:
        a, b = b, a

    k = b - a
    # floor(k * (1 + sqrt(5)) / 2) in exact integer arithmetic.
    losing_small_pile = (k + isqrt(5 * k * k)) // 2

    return a != losing_small_pile
435
436
437# =============================================================================
438# 10. 유클리드 게임 (Euclid's Game)
439# =============================================================================
440
def euclid_game(a: int, b: int) -> bool:
    """
    Euclid's game: subtract a multiple of the smaller number from the larger.

    The player who produces 0 wins.

    Returns:
        True if the first player wins; False when one number is already 0.
    """
    big, small = (b, a) if a < b else (a, b)

    if small == 0:
        return False  # the game is already over

    first_to_move = True  # True while it is the first player's turn
    while small > 0:
        # With a free choice of multiple (big >= 2 * small) or an immediate
        # finish (big == small), the player to move wins.
        if big == small or big >= 2 * small:
            return first_to_move
        # Otherwise the only legal move is to subtract `small` once.
        big, small = small, big - small
        first_to_move = not first_to_move

    return not first_to_move
462
463
464# =============================================================================
465# 테스트
466# =============================================================================
467
def main():
    """Run a printed demo of each game-theory routine in this module."""
    print("=" * 60)
    print("게임 이론 (Game Theory) 예제")
    print("=" * 60)

    # 1. Nim game
    print("\n[1] 님 게임 (Nim Game)")
    piles = [3, 4, 5]
    xor = nim_xor(piles)
    move = nim_winning_move(piles)
    print(f"    더미: {piles}")
    print(f"    XOR: {xor} ({'선공 승리' if xor != 0 else '후공 승리'})")
    if move:
        print(f"    승리 수: 더미 {move[0]}에서 {move[1]}개로")

    # Simulation (run on a separate list with the same starting piles)
    print("\n    게임 시뮬레이션:")
    piles_copy = [3, 4, 5]
    winner = nim_game_simulation(piles_copy, verbose=True)
    print(f"    승자: Player {winner}")

    # 2. Sprague-Grundy
    print("\n[2] 스프라그-그런디 정리")
    moves = [1, 3, 4]  # 1, 3 or 4 stones may be taken per turn
    memo = {}
    for n in range(10):
        g = calculate_grundy(n, moves, memo)
        print(f"    G({n}) = {g}", end="  ")
    print()

    # Several piles
    piles = [7, 5]
    total_g = multi_pile_grundy(piles, moves)
    print(f"    더미 {piles}, 이동 {moves}")
    print(f"    전체 그런디: {total_g} ({'선공 승리' if total_g != 0 else '후공 승리'})")

    # 3. Nim variants
    print("\n[3] 변형 님 게임")
    # Misere Nim
    piles_misere = [1, 2, 3]
    print(f"    미제르 님 {piles_misere}: 선공 {'승리' if misere_nim(piles_misere) else '패배'}")

    # Staircase Nim
    stairs = [3, 1, 2, 4]  # stairs 1, 2, 3, 4
    print(f"    계단 님 {stairs}: 그런디 = {staircase_nim(stairs)}")

    # 4. Tic-tac-toe
    print("\n[4] 틱택토 미니맥스")
    game = TicTacToe()
    game.board = [['X', 'O', 'X'],
                  [' ', 'O', ' '],
                  [' ', ' ', ' ']]
    game.current_player = 'X'
    print("    현재 상태:")
    game.display()
    best = game.best_move()
    print(f"    X의 최선의 수: {best}")

    # 5. Stone game
    print("\n[5] 돌 게임")
    piles = [5, 3, 4, 5]
    print(f"    더미: {piles}")
    result = stone_game(piles)
    diff = stone_game_dp(tuple(piles), 0, len(piles) - 1)
    print(f"    선공 {'승리' if result else '패배'} (점수 차이: {diff})")

    # 6. Bash game
    print("\n[6] 바시 게임")
    n, k = 10, 3
    print(f"    n={n}, k={k}")
    print(f"    선공 {'승리' if bash_game(n, k) else '패배'}")
    if bash_game(n, k):
        print(f"    최적의 수: {bash_game_optimal_move(n, k)}개 가져가기")

    # 7. Wythoff's game
    print("\n[7] 위더프 게임")
    test_cases = [(1, 2), (3, 5), (4, 7), (5, 8)]
    for a, b in test_cases:
        result = wythoff_game(a, b)
        print(f"    ({a}, {b}): 선공 {'승리' if result else '패배'}")

    # 8. Euclid's game
    print("\n[8] 유클리드 게임")
    test_cases = [(25, 7), (24, 10), (100, 45)]
    for a, b in test_cases:
        result = euclid_game(a, b)
        print(f"    ({a}, {b}): 선공 {'승리' if result else '패배'}")

    # 9. Algorithm summary table
    print("\n[9] 게임 이론 알고리즘 요약")
    print("    | 게임           | 승리 조건                    |")
    print("    |----------------|------------------------------|")
    print("    | 님 게임        | XOR != 0                     |")
    print("    | 미제르 님      | 복잡한 조건                  |")
    print("    | 바시 게임      | n % (k+1) != 0               |")
    print("    | 위더프 게임    | 황금비 기반 패배 위치        |")
    print("    | 일반 게임      | 스프라그-그런디 정리         |")

    print("\n" + "=" * 60)
567
568
# Run the demo only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()