Created
August 28, 2022 00:52
-
-
Save Gabriella439/6d59a810998245904a0d4eda42d0f1c7 to your computer and use it in GitHub Desktop.
MaxiMin algorithm for one player versus uncertainty
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
{-# LANGUAGE BlockArguments #-} | |
{-# LANGUAGE DeriveFunctor #-} | |
{-# LANGUAGE NamedFieldPuns #-} | |
{-# OPTIONS_GHC -Wall #-} | |
module MaxiMin where | |
import Data.List.NonEmpty (NonEmpty(..)) | |
import Data.MemoTrie (HasTrie(..)) | |
import qualified Control.Monad as Monad | |
import qualified Data.MemoTrie as MemoTrie | |
import qualified Data.List as List | |
import qualified Data.Ord as Ord | |
{-| A single possibility, consisting of an outcome paired with the associated | |
weight of that outcome | |
-} | |
data Possibility a | |
= Possibility { outcome :: !a, weight :: !Int } | |
deriving (Functor, Show) | |
-- | A probability distribution, which is a non-empty list of weighted outcomes | |
newtype Distribution a | |
= Distribution { possibilities :: NonEmpty (Possibility a) } | |
deriving (Functor, Show) | |
instance Applicative Distribution where | |
pure x = Distribution (pure (Possibility x 1)) | |
(<*>) = Monad.ap | |
instance Monad Distribution where | |
m >>= f = Distribution do | |
Possibility x weight0 <- possibilities m | |
Possibility y weight1 <- possibilities (f x) | |
return $! Possibility y (weight0 * weight1) | |
-- | Compute the expected value for a probability distribution | |
expectedValue :: Fractional n => Distribution n -> n | |
expectedValue Distribution{ possibilities } = | |
totalTally / fromIntegral totalWeight | |
where | |
totalTally = sum (fmap tally possibilities) | |
totalWeight = sum (fmap weight possibilities) | |
tally Possibility{ outcome, weight } = fromIntegral weight * outcome | |
{-| Play the game optimally to its conclusion, always selecting the move that | |
leads to the highest expected value for the given objective function | |
-} | |
play | |
:: (Fractional n, Ord n, HasTrie state) | |
=> (state -> n) | |
-- ^ Objective function, which returns the value we are trying to maximize | |
-> (state -> Bool) | |
-- ^ Termination function, which returns True if the game is over | |
-> (state -> NonEmpty (Distribution state)) | |
-- ^ A function which generates the available moves from the current state | |
-> state | |
-- ^ The starting state | |
-> Distribution state | |
-- ^ The final probability distribution at the end of the game after optimal | |
-- play | |
play objective done choices = MemoTrie.memoFix memoized | |
where | |
memoized loop status | |
| done status = do | |
pure status | |
| otherwise = do | |
next <- List.maximumBy (Ord.comparing predict) (choices status) | |
loop next | |
where | |
predict choice = expectedValue do | |
nextStatus <- choice | |
finalStatus <- loop nextStatus | |
return (objective finalStatus) |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment