# Python imports
from functools import lru_cache
from itertools import combinations, permutations
from pathlib import Path
from typing import Callable, Dict, Generator, Iterable, List, Optional, Set, Tuple

import numpy as np

# Paths to data
testpath = Path("day21_test.txt")
datapath = Path("day21_data.txt")


def load_input(fpath: Path) -> Tuple[int, int]:
    """Return the two players' starting positions read from a data file.

    The first two lines of the file are read; on each, only the last
    whitespace-separated token is parsed, as an integer (for example a
    line such as ``Player 1 starting position: 4`` yields ``4``).

    :param fpath:  Path to data file
    :returns:  ``(p1_start, p2_start)`` as integers
    :raises IndexError:  if one of the first two lines is missing or blank
    :raises ValueError:  if the last token on a line is not an integer
    """
    with fpath.open("r") as ifh:
        # str.split() with no arguments already discards surrounding
        # whitespace (including the newline), so no strip() is required.
        p1_start = int(ifh.readline().split()[-1])
        p2_start = int(ifh.readline().split()[-1])

    return p1_start, p2_start


def play(
    p1_start: int,
    p2_start: int,
    die_size: int = 100,
    board_size: int = 10,
    end_score: int = 1000,
) -> Tuple[int, int]:
    """Play the game with a deterministic die until one player wins.

    Players alternate turns, player 1 first. On a turn the player rolls the
    die three times, moves forward by the sum of the rolls around a circular
    board whose spaces are numbered ``1..board_size``, and adds the number of
    the space landed on to their score. The die yields ``1, 2, ..., die_size``
    and then starts again at 1. The game stops as soon as a player's score
    reaches ``end_score``.

    :param p1_start:  Starting space of player 1
    :param p2_start:  Starting space of player 2
    :param die_size:  Number of faces on the deterministic die
    :param board_size:  Number of spaces on the circular board
    :param end_score:  Score at which a player wins
    :returns:  ``(total number of die rolls, losing player's score)``
    """
    # Keep positions 1-based so that the space number is also the score
    # gained; (x - 1) % board_size + 1 maps any integer onto 1..board_size.
    positions = [
        (p1_start - 1) % board_size + 1,
        (p2_start - 1) % board_size + 1,
    ]
    scores = [0, 0]
    die_roll_count = 0
    player = 0  # index of the player whose turn it is

    while True:
        # Roll the die three times. The k-th roll overall (counting from 0)
        # shows k % die_size + 1, so the die shows die_size (never 0) just
        # before wrapping back to 1.
        move = 0
        for _ in range(3):
            move += die_roll_count % die_size + 1
            die_roll_count += 1

        # Move around the board and score the space landed on
        positions[player] = (positions[player] + move - 1) % board_size + 1
        scores[player] += positions[player]
        if scores[player] >= end_score:
            break

        # Hand the die to the other player
        player = 1 - player

    return die_roll_count, min(scores)


# Puzzle 1, test input: play() returns (die roll count, lower final score);
# np.prod multiplies the two together to give the answer.
p1_start, p2_start = load_input(testpath)
print(f"{np.prod(play(p1_start, p2_start))=}")

np.prod(play(p1_start, p2_start))=739785


# Puzzle 1, data file input: product of the die roll count and the lower
# final score returned by play().
p1_start, p2_start = load_input(datapath)
print(f"{np.prod(play(p1_start, p2_start))=}")

np.prod(play(p1_start, p2_start))=720750


# Roll-sum frequencies for one turn: a turn is three rolls of a die with
# faces 1, 2 and 3, giving 3**3 = 27 outcomes. They collapse onto seven
# distinct totals; this maps each total to the number of outcomes (universes)
# that produce it.
freqdict = {3: 1, 4: 3, 5: 6, 6: 7, 7: 6, 8: 3, 9: 1}


@lru_cache(maxsize=None)
def play_dirac(
    cur_player_pos,
    other_player_pos,
    cur_player_score,
    other_player_score,
    *,
    win_score=21,
    board_size=10,
):
    """Count the universes each player wins from the given game state.

    The state is described from the point of view of the player about to
    roll (the "current" player). Results are memoised with ``lru_cache``, so
    each distinct state is evaluated only once.

    :param cur_player_pos:  Board space of the player about to roll
    :param other_player_pos:  Board space of the player who just moved
    :param cur_player_score:  Score of the player about to roll
    :param other_player_score:  Score of the player who just moved
    :param win_score:  Score at which a player wins (keyword-only)
    :param board_size:  Number of spaces on the circular board (keyword-only)
    :returns:  ``(wins for current player, wins for other player)``
    """
    # Only the player who has just moved can have reached the winning score;
    # if they did, they win before the current player gets to roll.
    if other_player_score >= win_score:
        return 0, 1

    # No winner yet: accumulate the wins found downstream of every possible
    # roll total, starting from zero for both players.
    cur_player_tot_wins = 0
    other_player_tot_wins = 0

    # The 27 universes created by this turn only differ by their roll total,
    # so evaluate each total once and weight the result by its frequency.
    for roll, count in freqdict.items():
        # 1-based wrap-around: the space number is also the score gained
        new_cur_player_pos = (cur_player_pos + roll - 1) % board_size + 1
        new_cur_player_score = cur_player_score + new_cur_player_pos

        # Next turn the roles swap, so the result comes back in swapped order
        other_player_win, cur_player_win = play_dirac(
            other_player_pos,
            new_cur_player_pos,
            other_player_score,
            new_cur_player_score,
            win_score=win_score,
            board_size=board_size,
        )

        cur_player_tot_wins += cur_player_win * count
        other_player_tot_wins += other_player_win * count

    return cur_player_tot_wins, other_player_tot_wins


# Puzzle 2, test input: play_dirac() returns the win counts of both players;
# report the larger of the two.
p1_start, p2_start = load_input(testpath)
print(f"Most wins: {max(play_dirac(p1_start, p2_start, 0, 0))=}")

Most wins: max(play_dirac(p1_start, p2_start, 0, 0))=444356092776315


# Puzzle 2, data file input: larger of the two win counts returned by
# play_dirac() when both players start with a score of 0.
p1_start, p2_start = load_input(datapath)
print(f"Most wins: {max(play_dirac(p1_start, p2_start, 0, 0))=}")

Most wins: max(play_dirac(p1_start, p2_start, 0, 0))=275067741811212

Day 21: Dirac Dice

Puzzle 2: