larskuhtz · December 4, 2018 23:05 · larskuhtz · Nov 27, 2018
diff --git a/README.md b/README.md
diff --git a/VarList.hs b/VarList.hs
 {-# LANGUAGE AllowAmbiguousTypes #-}
 {-# LANGUAGE BangPatterns #-}
 {-# LANGUAGE DeriveGeneric #-}
 {-# LANGUAGE FlexibleInstances #-}
 {-# LANGUAGE LambdaCase #-}
 {-# LANGUAGE MultiParamTypeClasses #-}
 {-# LANGUAGE OverloadedStrings #-}
 {-# LANGUAGE RankNTypes #-}
 {-# LANGUAGE ScopedTypeVariables #-}
 {-# LANGUAGE TypeApplications #-}
 {-# LANGUAGE TypeSynonymInstances #-}

 -- |
 -- Module: VarList
 -- Copyright: Copyright © 2018 Lars Kuhtz <[email protected]>
 -- License: MIT
 -- Maintainer: Lars Kuhtz <[email protected]>
 -- Stability: experimental
 --
 module VarList
 (
 -- * Mutable Variables

  Var(..)
 , MaybeIORef
 , MaybeTVar

 -- * Cell
 , Cell(..)
 , foldCell
 , cellToStream
 , cellFromStream

 -- * Test and Benchmark Data
 , testCell

 -- * Main functions
 , main
 , main1
 , main2
 , main3
 ) where

 import Control.Concurrent
 import Control.Concurrent.Async
 import Control.Concurrent.STM
 import Control.DeepSeq
 import Control.Monad
 import Control.Monad.Morph
 import Control.StopWatch

 import Criterion
 import Criterion.Main

 import Data.Foldable
 import Data.Functor.Compose
 import Data.Functor.Of
 import Data.IORef
 import qualified Data.List.NonEmpty as L
 import qualified Data.Sequence as Seq

 import qualified Streaming.Prelude as S

 import System.Clock
 import System.Environment
 import System.IO
 import System.Mem

 -- -------------------------------------------------------------------------- --
 -- Variables
 --
 -- Note that 'Compose' is used here for type constructors that aren't functors.

 -- | Interface for mutable variables @v@ that live in the monad @m@ and hold
 -- either no value or exactly one value.
 --
 class Monad m => Var m v where
    -- | Returns the current content, or 'Nothing' when the variable is empty.
    readVar :: v x -> m (Maybe x)
    -- | Creates a variable that holds no value.
    newEmptyVar :: m (v x)
    -- | Creates a variable that already holds the given value.
    newVar :: x -> m (v x)

    -- | Waits until the variable holds a value and returns that value.
    -- Depending on the type of the variable this function may block or spin.
    awaitVar :: v x -> m x

 -- | An 'IORef' that stores a 'Maybe'; 'Nothing' represents the empty variable.
 type MaybeIORef = Compose IORef Maybe
 -- | A 'TVar' that stores a 'Maybe'; 'Nothing' represents the empty variable.
 type MaybeTVar = Compose TVar Maybe

 -- | 'TMVar' used directly inside 'STM' transactions.
 --
 instance Var STM TMVar where
    readVar = tryReadTMVar
    newEmptyVar = newEmptyTMVar
    newVar = newTMVar

    -- Retries the transaction until the variable is filled. 'readTMVar' (not
    -- 'takeTMVar') is used so that awaiting leaves the value in place, which
    -- matches 'readVar' and the 'TVar' and 'IORef' based instances.
    awaitVar = readTMVar
    {-# INLINE readVar #-}
    {-# INLINE newEmptyVar #-}
    {-# INLINE newVar #-}
    {-# INLINE awaitVar #-}

 -- | 'TMVar' used from plain 'IO'; reads are run as individual transactions.
 --
 instance Var IO TMVar where
    readVar v = atomically (tryReadTMVar v)
    newEmptyVar = newEmptyTMVarIO
    newVar x = newTMVarIO x
    -- Reuses 'awaitVar' of the 'STM' instance and runs it as one transaction.
    awaitVar v = atomically (awaitVar v)
    {-# INLINE readVar #-}
    {-# INLINE newEmptyVar #-}
    {-# INLINE newVar #-}
    {-# INLINE awaitVar #-}

 -- | 'MVar' used from 'IO'.
 --
 instance Var IO MVar where
    readVar = tryReadMVar
    newEmptyVar = newEmptyMVar
    newVar = newMVar

    -- Blocks until the variable is filled. 'readMVar' (not 'takeMVar') is used
    -- so that awaiting leaves the value in place, which matches 'readVar' and
    -- the 'TVar' and 'IORef' based instances.
    awaitVar = readMVar
    {-# INLINE readVar #-}
    {-# INLINE newEmptyVar #-}
    {-# INLINE newVar #-}
    {-# INLINE awaitVar #-}

 -- | 'TVar' holding a 'Maybe', used directly inside 'STM' transactions.
 --
 instance Var STM (Compose TVar Maybe) where
    readVar (Compose ref) = readTVar ref
    newEmptyVar = fmap Compose (newTVar Nothing)
    newVar x = Compose <$> newTVar (Just x)
    -- Retries the transaction for as long as the variable holds 'Nothing'.
    awaitVar v = readVar v >>= maybe retry return
    {-# INLINE readVar #-}
    {-# INLINE newEmptyVar #-}
    {-# INLINE newVar #-}
    {-# INLINE awaitVar #-}

 -- | 'TVar' holding a 'Maybe', used from plain 'IO'.
 --
 instance Var IO (Compose TVar Maybe) where
    readVar (Compose ref) = readTVarIO ref
    newEmptyVar = fmap Compose (newTVarIO Nothing)
    newVar x = Compose <$> newTVarIO (Just x)
    -- Reuses 'awaitVar' of the 'STM' instance and runs it as one transaction.
    awaitVar v = atomically (awaitVar v)
    {-# INLINE readVar #-}
    {-# INLINE newEmptyVar #-}
    {-# INLINE newVar #-}
    {-# INLINE awaitVar #-}

 -- | 'IORef' holding a 'Maybe', used from 'IO'.
 --
 instance Var IO (Compose IORef Maybe) where
    readVar (Compose ref) = readIORef ref
    newEmptyVar = fmap Compose (newIORef Nothing)
    newVar x = Compose <$> newIORef (Just x)

    -- This spins: the reference is polled and the thread yields between polls
    -- until a value shows up.
    awaitVar v = poll
      where
        poll = readVar v >>= \case
            Nothing -> yield >> poll
            Just x -> return x
    {-# INLINE readVar #-}
    {-# INLINE newEmptyVar #-}
    {-# INLINE newVar #-}
    {-# INLINE awaitVar #-}

 -- -------------------------------------------------------------------------- --
 -- Cell

 -- | A node of a singly linked list: a value plus a variable of type @v@ that
 -- holds the next node. The value field is lazy, the variable field is strict.
 data Cell v a = Cell a !(v (Cell v a))

 -- | Forces only the value stored in the given cell; the variable that points
 -- to the rest of the list is not followed.
 instance NFData a => NFData (Cell v a) where
    rnf (Cell x _) = x `deepseq` ()

 -- | Strict left fold over the values of a cell list, starting at the given
 -- cell and following the tail variables until an empty one is found.
 --
 -- The value of every visited cell is folded in, including the value of the
 -- last cell (the one whose tail variable is empty), so the fold sees exactly
 -- the values that 'cellToStream' yields.
 --
 foldCell
    :: Monad m
    => Var m v
    => (b -> a -> b)
    -> b
    -> Cell v a
    -> m b
 foldCell f = go
  where
    go !acc (Cell !h !t) = do
        -- Fold in the value of this cell before looking at the tail, so that
        -- the final cell is not dropped.
        let !acc' = f acc h
        readVar t >>= \case
            Nothing -> return acc'
            Just c -> go acc' c

 -- | Streams the values of a cell list, starting at the given cell. After a
 -- value is yielded the tail variable is read; the stream ends at the first
 -- empty tail variable.
 --
 cellToStream :: Var m v => Cell v a -> S.Stream (Of a) m ()
 cellToStream = emit
  where
    emit (Cell x next) =
        S.yield x >> (lift (readVar next) >>= maybe (return ()) emit)

 -- | Transforms a stream into a cell list and returns the variable that holds
 -- the first cell. For an empty stream the returned variable is empty.
 --
 -- This could be made lazy using 'unsafeInterleaveIO', which would be fine,
 -- since the 'Var's won't change once they are evaluated. However, for
 -- benchmarking we want it strict.
 --
 cellFromStream :: Var m v => S.Stream (Of a) m () -> m (v (Cell v a))
 cellFromStream s = S.foldrM link (s >> lift newEmptyVar)
  where
    -- Builds the rest of the list first, then wraps it in a new cell.
    link !a !rest = do
        tl <- rest
        newVar (Cell a tl)

 -- | Builds a cell list from a non-empty list. The first element becomes the
 -- value of the returned cell; the variable behind the last element is empty.
 --
 cellFromList :: forall v a m . Var m v => L.NonEmpty a -> m (Cell v a)
 cellFromList (a L.:| l) = Cell a <$> foldr link newEmptyVar l
  where
    -- Forces the element, builds the remaining list, then stores the new cell.
    link !h rest = rest >>= newVar . Cell h

 -- | Builds a 'MaybeIORef' cell list from a non-empty list front to back: each
 -- element is written into the currently last (empty) variable together with
 -- a fresh empty variable that becomes the new end of the list.
 --
 maybeIORefCellFromList :: forall a . L.NonEmpty a -> IO (Cell MaybeIORef a)
 maybeIORefCellFromList (a L.:| l) = do
    firstTail <- newEmptyVar
    foldM_ append firstTail l
    return (Cell a firstTail)
  where
    -- Fills the given end variable and returns the new end variable.
    append :: MaybeIORef (Cell MaybeIORef a) -> a -> IO (MaybeIORef (Cell MaybeIORef a))
    append !(Compose ref) !x = do
        !next <- newEmptyVar
        writeIORef ref (Just (Cell x next))
        return next

 -- -------------------------------------------------------------------------- --
 -- Main

 -- | Creates a cell list with the values @1..i@ and returns its first cell.
 --
 -- For @i < 1@ the stream is empty, so 'awaitVar' is called on an empty
 -- variable and does not find a value.
 --
 testCell :: forall v m . Var m v => Int -> m (Cell v Int)
 testCell n = cellFromStream (S.each [1..n]) >>= awaitVar

 -- | Program entry point; currently runs the criterion comparison in 'main3'.
 main :: IO ()
 main = main3

 -- -------------------------------------------------------------------------- --
 -- Test

 -- | Times the concurrent traversal of a 'MaybeTVar' cell list for a grid of
 -- thread counts and list lengths and prints one CSV row per combination
 -- (@threadCount, listLength, time@ with the time in nanoseconds).
 --
 -- Expects exactly six integer command line arguments, in this order:
 -- @minThreadCount maxThreadCount threadCountStep minListLength maxListLength
 -- listLengthStep@. Anything else raises a user error with a usage message.
 --
 main1 :: IO ()
 main1 = do
    -- All six arguments are needed; they are parsed with a total parser so
    -- that bad input yields a usage error instead of a pattern match failure.
    args <- getArgs
    (minThreadCount, maxThreadCount, threadCountStep, minListLength, maxListLength, listLengthStep)
        <- case traverse parseInt args of
            Just [a, b, c, d, e, f] -> return (a, b, c, d, e, f)
            _ -> ioError $ userError usage

    -- A step of 0 would make the enumerations below infinite.
    when (threadCountStep == 0 || listLengthStep == 0)
        $ ioError $ userError "main1: step arguments must not be 0"

    hSetBuffering stdout LineBuffering
    putStrLn $ "threadCount, listLength, time"

    forM_ [minThreadCount, (minThreadCount + threadCountStep) .. maxThreadCount] $ \threadCount -> do
        forM_ [minListLength, (minListLength + listLengthStep) .. maxListLength] $ \listLength -> do
            -- Compute test cell
            cell <- testCell @MaybeTVar listLength

            -- prime test cell evaluation
            void $ atomically $ S.sum $ cellToStream $ cell

            -- measure concurrent test cell evaluation
            performMajorGC
            (_, t) <- stopWatch $ replicateConcurrently_ threadCount
                $ atomically $ S.sum_ $ cellToStream $ cell

            -- print result
            putStrLn
                $ show threadCount
                <> ", " <> show listLength
                <> ", " <> show (toNanoSecs t)
  where
    usage :: String
    usage = "usage: <minThreadCount> <maxThreadCount> <threadCountStep> <minListLength> <maxListLength> <listLengthStep>"

    -- Total replacement for 'read': accepts exactly one integer, optionally
    -- surrounded by white space.
    parseInt :: String -> Maybe Int
    parseInt s = case [x | (x, rest) <- reads s, ("", "") <- lex rest] of
        [x] -> Just x
        _ -> Nothing

 -- -------------------------------------------------------------------------- --
 -- Comparison with Pure Sequence

 -- | Criterion benchmarks that compare a pure 'Seq.Seq' with 'MaybeIORef' cell
 -- lists: streaming over the structure, folding it, and creating it.
 --
 -- NOTE(review): the argument of @bs@ is only used for the group label; the
 -- benchmarks inside the group do not start any threads. Confirm whether the
 -- "1 threads" / "100 threads" groups are meant to differ.
 --
 main3 :: IO ()
 main3 = defaultMain [bs 1, bs 100, create]
  where
    -- Environment with a sequence of the values 0..1000000.
    withSeq :: (Seq.Seq Int -> Benchmark) -> Benchmark
    withSeq = env (return $ Seq.fromList [0..1000000])

    -- Environment with a cell list as produced by 'testCell'.
    withCell :: (Cell MaybeIORef Int -> Benchmark) -> Benchmark
    withCell = env (testCell @MaybeIORef 1000000)

    bs i = bgroup (show i <> " threads")
        [ bgroup "stream"
            [ withSeq $ \e -> bench "seq" (nfAppIO (S.sum_ . S.each) e)
            , withCell $ \e -> bench "cell" (nfAppIO (S.sum_ . cellToStream) e)
            ]
        , bgroup "fold"
            [ withSeq $ \e -> bench "seq" (nf (foldl' (+) 0) e)
            , withCell $ \e -> bench "cell" (nfAppIO (foldCell (+) 0) e)
            ]
        ]

    create = bgroup "create"
        [ bench "seq" (nf (\s -> Seq.fromList [0..s]) (1000000 :: Int))
        , bench "cell" (nfAppIO (testCell @MaybeIORef) 1000000)
        , bench "cell from list"
            (nfAppIO (\s -> cellFromList @MaybeIORef @Int (0 L.:| [1..s])) 1000000)
        , bench "cell from list 2"
            (nfAppIO (\s -> maybeIORefCellFromList @Int (0 L.:| [1..s])) 1000000)
        ]

 -- -------------------------------------------------------------------------- --
 -- Criterion Benchmarks

 -- | Runs the 'benchmarks' group for 1, 10 and 1000 concurrent threads.
 main2 :: IO ()
 main2 = defaultMain $ map benchmarks [1, 10, 1000]

 -- | Criterion group in which @i@ concurrent threads each sum a 10000 element
 -- cell list, once per variable type and access style.
 --
 -- The variants that run the whole traversal inside one 'STM' transaction are
 -- only included when @i <= 1@.
 --
 benchmarks :: Int -> Benchmark
 benchmarks i = bgroup (show i <> " threads")
    [ env (testCell @MVar 10000)
        (\cell -> bench "MVar"
            (nfAppIO (inParallel (S.sum_ . cellToStream)) cell))
    , env (testCell @MaybeIORef 10000)
        (\cell -> bench "MaybeIORef"
            (nfAppIO (inParallel (S.sum_ . cellToStream)) cell))

    , bgroup "TMVar"
        ( [ env (testCell @TMVar 10000)
              (\cell -> bench "TMVar hoisted"
                  (nfAppIO (inParallel (S.sum_ . hoist atomically . cellToStream)) cell))
          , env (testCell @TMVar 10000)
              (\cell -> bench "TMVar in IO"
                  (nfAppIO (inParallel (S.sum_ . cellToStream)) cell))
          ]
          -- A "foldCell Cell TMVar" variant used to live here as disabled code.
          <> [ env (testCell @TMVar 10000)
                 (\cell -> bench "TMVar in STM"
                     (nfAppIO (inParallel (atomically . S.sum_ . cellToStream)) cell))
             | i <= 1
             ]
        )

    , bgroup "MaybeTVar"
        ( [ env (testCell @MaybeTVar 10000)
              (\cell -> bench "MaybeTVar hoisted"
                  (nfAppIO (inParallel (S.sum_ . hoist atomically . cellToStream)) cell))
          , env (testCell @MaybeTVar 10000)
              (\cell -> bench "MaybeTVar in IO"
                  (nfAppIO (inParallel (S.sum_ . cellToStream)) cell))
          ]
          <> [ env (testCell @MaybeTVar 10000)
                 (\cell -> bench "MaybeTVar in STM"
                     (nfAppIO (inParallel (atomically . S.sum_ . cellToStream)) cell))
             | i <= 1
             ]
        )
    ]
  where
    -- Runs the action on the input in @i@ concurrent threads.
    inParallel action input = replicateConcurrently_ i (action input)

diff --git a/results.ipynb b/results.ipynb
	{-# LANGUAGE AllowAmbiguousTypes #-}
	{-# LANGUAGE BangPatterns #-}
	{-# LANGUAGE DeriveGeneric #-}
	{-# LANGUAGE FlexibleInstances #-}
	{-# LANGUAGE LambdaCase #-}
	{-# LANGUAGE MultiParamTypeClasses #-}
	{-# LANGUAGE OverloadedStrings #-}
	{-# LANGUAGE RankNTypes #-}
	{-# LANGUAGE ScopedTypeVariables #-}
	{-# LANGUAGE TypeApplications #-}
	{-# LANGUAGE TypeSynonymInstances #-}

	-- |
	-- Module: VarList
	-- Copyright: Copyright © 2018 Lars Kuhtz <[email protected]>
	-- License: MIT
	-- Maintainer: Lars Kuhtz <[email protected]>
	-- Stability: experimental
	--
	module VarList
	(
	-- * Mutable Variables

	Var(..)
	, MaybeIORef
	, MaybeTVar

	-- * Cell
	, Cell(..)
	, foldCell
	, cellToStream
	, cellFromStream

	-- * Test and Benchmark Data
	, testCell

	-- * Main functions
	, main
	, main1
	, main2
	, main3
	) where

	import Control.Concurrent
	import Control.Concurrent.Async
	import Control.Concurrent.STM
	import Control.DeepSeq
	import Control.Monad
	import Control.Monad.Morph
	import Control.StopWatch

	import Criterion
	import Criterion.Main

	import Data.Foldable
	import Data.Functor.Compose
	import Data.Functor.Of
	import Data.IORef
	import qualified Data.List.NonEmpty as L
	import qualified Data.Sequence as Seq

	import qualified Streaming.Prelude as S

	import System.Clock
	import System.Environment
	import System.IO
	import System.Mem

	-- -------------------------------------------------------------------------- --
	-- Variables
	--
	-- Note that 'Compose' is used here for type constructors that aren't functors.

	-- | Interface for mutable variables @v@ that live in the monad @m@ and hold
	-- either no value or exactly one value.
	--
	class Monad m => Var m v where
	    -- | Returns the current content, or 'Nothing' when the variable is empty.
	    readVar :: v x -> m (Maybe x)
	    -- | Creates a variable that holds no value.
	    newEmptyVar :: m (v x)
	    -- | Creates a variable that already holds the given value.
	    newVar :: x -> m (v x)

	    -- | Waits until the variable holds a value and returns that value.
	    -- Depending on the type of the variable this function may block or spin.
	    awaitVar :: v x -> m x

	-- | An 'IORef' that stores a 'Maybe'; 'Nothing' represents the empty variable.
	type MaybeIORef = Compose IORef Maybe
	-- | A 'TVar' that stores a 'Maybe'; 'Nothing' represents the empty variable.
	type MaybeTVar = Compose TVar Maybe

	-- | 'TMVar' used directly inside 'STM' transactions.
	--
	instance Var STM TMVar where
	    readVar = tryReadTMVar
	    newEmptyVar = newEmptyTMVar
	    newVar = newTMVar

	    -- Retries the transaction until the variable is filled. 'readTMVar' (not
	    -- 'takeTMVar') is used so that awaiting leaves the value in place, which
	    -- matches 'readVar' and the 'TVar' and 'IORef' based instances.
	    awaitVar = readTMVar
	    {-# INLINE readVar #-}
	    {-# INLINE newEmptyVar #-}
	    {-# INLINE newVar #-}
	    {-# INLINE awaitVar #-}

	-- | 'TMVar' used from plain 'IO'; reads are run as individual transactions.
	--
	instance Var IO TMVar where
	    readVar = atomically . tryReadTMVar
	    newEmptyVar = newEmptyTMVarIO
	    newVar = newTMVarIO
	    -- Reuses 'awaitVar' of the 'STM' instance and runs it as one transaction.
	    awaitVar = atomically . awaitVar
	    {-# INLINE readVar #-}
	    {-# INLINE newEmptyVar #-}
	    {-# INLINE newVar #-}
	    {-# INLINE awaitVar #-}

	-- | 'MVar' used from 'IO'.
	--
	instance Var IO MVar where
	    readVar = tryReadMVar
	    newEmptyVar = newEmptyMVar
	    newVar = newMVar

	    -- Blocks until the variable is filled. 'readMVar' (not 'takeMVar') is used
	    -- so that awaiting leaves the value in place, which matches 'readVar' and
	    -- the 'TVar' and 'IORef' based instances.
	    awaitVar = readMVar
	    {-# INLINE readVar #-}
	    {-# INLINE newEmptyVar #-}
	    {-# INLINE newVar #-}
	    {-# INLINE awaitVar #-}

	-- | 'TVar' holding a 'Maybe', used directly inside 'STM' transactions.
	--
	instance Var STM (Compose TVar Maybe) where
	    readVar = readTVar . getCompose
	    newEmptyVar = Compose <$> newTVar Nothing
	    newVar = fmap Compose . newTVar . Just
	    -- Retries the transaction for as long as the variable holds 'Nothing'.
	    awaitVar = readVar >=> maybe retry return
	    {-# INLINE readVar #-}
	    {-# INLINE newEmptyVar #-}
	    {-# INLINE newVar #-}
	    {-# INLINE awaitVar #-}

	-- | 'TVar' holding a 'Maybe', used from plain 'IO'.
	--
	instance Var IO (Compose TVar Maybe) where
	    readVar = readTVarIO . getCompose
	    newEmptyVar = Compose <$> newTVarIO Nothing
	    newVar = fmap Compose . newTVarIO . Just
	    -- Reuses 'awaitVar' of the 'STM' instance and runs it as one transaction.
	    awaitVar = atomically . awaitVar
	    {-# INLINE readVar #-}
	    {-# INLINE newEmptyVar #-}
	    {-# INLINE newVar #-}
	    {-# INLINE awaitVar #-}

	-- | 'IORef' holding a 'Maybe', used from 'IO'.
	--
	instance Var IO (Compose IORef Maybe) where
	    readVar = readIORef . getCompose
	    newEmptyVar = Compose <$> newIORef Nothing
	    newVar = fmap Compose . newIORef . Just

	    -- This spins: the reference is polled and the thread yields between polls
	    -- until a value shows up.
	    awaitVar v = let go = readVar v >>= maybe (yield >> go) return in go
	    {-# INLINE readVar #-}
	    {-# INLINE newEmptyVar #-}
	    {-# INLINE newVar #-}
	    {-# INLINE awaitVar #-}

	-- -------------------------------------------------------------------------- --
	-- Cell

	-- | A node of a singly linked list: a value plus a variable of type @v@ that
	-- holds the next node. The value field is lazy, the variable field is strict.
	data Cell v a = Cell a !(v (Cell v a))

	-- | Forces only the value stored in the given cell; the variable that points
	-- to the rest of the list is not followed.
	instance NFData a => NFData (Cell v a) where
	    rnf (Cell a _) = rnf a

	-- | Strict left fold over the values of a cell list, starting at the given
	-- cell and following the tail variables until an empty one is found.
	--
	-- The value of every visited cell is folded in, including the value of the
	-- last cell (the one whose tail variable is empty), so the fold sees exactly
	-- the values that 'cellToStream' yields.
	--
	foldCell
	    :: Monad m
	    => Var m v
	    => (b -> a -> b)
	    -> b
	    -> Cell v a
	    -> m b
	foldCell f = go
	  where
	    go !acc (Cell !h !t) = do
	        -- Fold in the value of this cell before looking at the tail, so that
	        -- the final cell is not dropped.
	        let !acc' = f acc h
	        readVar t >>= \case
	            Nothing -> return acc'
	            Just c -> go acc' c

	-- | Streams the values of a cell list, starting at the given cell. After a
	-- value is yielded the tail variable is read; the stream ends at the first
	-- empty tail variable.
	--
	cellToStream :: Var m v => Cell v a -> S.Stream (Of a) m ()
	cellToStream = go
	  where
	    go (Cell h t) = do
	        S.yield h
	        lift (readVar t) >>= \case
	            Nothing -> return ()
	            Just c -> go c

	-- | Transforms a stream into a cell list and returns the variable that holds
	-- the first cell. For an empty stream the returned variable is empty.
	--
	-- This could be made lazy using 'unsafeInterleaveIO', which would be fine,
	-- since the 'Var's won't change once they are evaluated. However, for
	-- benchmarking we want it strict.
	--
	cellFromStream :: Var m v => S.Stream (Of a) m () -> m (v (Cell v a))
	cellFromStream s = S.foldrM f (s >> lift newEmptyVar)
	  where
	    -- Builds the rest of the list first, then wraps it in a new cell.
	    f !a !x = newVar =<< (Cell a <$> x)

	-- | Builds a cell list from a non-empty list. The first element becomes the
	-- value of the returned cell; the variable behind the last element is empty.
	--
	cellFromList :: forall v a m . Var m v => L.NonEmpty a -> m (Cell v a)
	cellFromList (a L.:| l) = Cell a <$> go l
	  where
	    go [] = newEmptyVar
	    go (!h:t) = newVar =<< (Cell h <$> go t)

	-- | Builds a 'MaybeIORef' cell list from a non-empty list front to back: each
	-- element is written into the currently last (empty) variable together with
	-- a fresh empty variable that becomes the new end of the list.
	--
	maybeIORefCellFromList :: forall a . L.NonEmpty a -> IO (Cell MaybeIORef a)
	maybeIORefCellFromList (a L.:| l) = do
	    v <- newEmptyVar
	    go v l
	    return $ Cell a v
	  where
	    -- Fills the given end variable with the next element and continues with
	    -- the fresh end variable.
	    go :: MaybeIORef (Cell MaybeIORef a) -> [a] -> IO ()
	    go _ [] = return ()
	    go !v (!h:t) = do
	        !v' <- newEmptyVar
	        writeIORef (getCompose v) (Just (Cell h v'))
	        go v' t

	-- -------------------------------------------------------------------------- --
	-- Main

	-- | Creates a cell list with the values @1..i@ and returns its first cell.
	--
	-- For @i < 1@ the stream is empty, so 'awaitVar' is called on an empty
	-- variable and does not find a value.
	--
	testCell :: forall v m . Var m v => Int -> m (Cell v Int)
	testCell n = cellFromStream (S.each [1..n]) >>= awaitVar

	-- | Program entry point; currently runs the criterion comparison in 'main3'.
	main :: IO ()
	main = main3

	-- -------------------------------------------------------------------------- --
	-- Test

	-- | Times the concurrent traversal of a 'MaybeTVar' cell list for a grid of
	-- thread counts and list lengths and prints one CSV row per combination
	-- (@threadCount, listLength, time@ with the time in nanoseconds).
	--
	-- Expects exactly six integer command line arguments, in this order:
	-- @minThreadCount maxThreadCount threadCountStep minListLength maxListLength
	-- listLengthStep@. Anything else raises a user error with a usage message.
	--
	main1 :: IO ()
	main1 = do
	    -- All six arguments are needed; they are parsed with a total parser so
	    -- that bad input yields a usage error instead of a pattern match failure.
	    args <- getArgs
	    (minThreadCount, maxThreadCount, threadCountStep, minListLength, maxListLength, listLengthStep)
	        <- case traverse parseInt args of
	            Just [a, b, c, d, e, f] -> return (a, b, c, d, e, f)
	            _ -> ioError $ userError usage

	    -- A step of 0 would make the enumerations below infinite.
	    when (threadCountStep == 0 || listLengthStep == 0)
	        $ ioError $ userError "main1: step arguments must not be 0"

	    hSetBuffering stdout LineBuffering
	    putStrLn $ "threadCount, listLength, time"

	    forM_ [minThreadCount, (minThreadCount + threadCountStep) .. maxThreadCount] $ \threadCount -> do
	        forM_ [minListLength, (minListLength + listLengthStep) .. maxListLength] $ \listLength -> do
	            -- Compute test cell
	            cell <- testCell @MaybeTVar listLength

	            -- prime test cell evaluation
	            void $ atomically $ S.sum $ cellToStream $ cell

	            -- measure concurrent test cell evaluation
	            performMajorGC
	            (_, t) <- stopWatch $ replicateConcurrently_ threadCount
	                $ atomically $ S.sum_ $ cellToStream $ cell

	            -- print result
	            putStrLn
	                $ show threadCount
	                <> ", " <> show listLength
	                <> ", " <> show (toNanoSecs t)
	  where
	    usage :: String
	    usage = "usage: <minThreadCount> <maxThreadCount> <threadCountStep> <minListLength> <maxListLength> <listLengthStep>"

	    -- Total replacement for 'read': accepts exactly one integer, optionally
	    -- surrounded by white space.
	    parseInt :: String -> Maybe Int
	    parseInt s = case [x | (x, rest) <- reads s, ("", "") <- lex rest] of
	        [x] -> Just x
	        _ -> Nothing

	-- -------------------------------------------------------------------------- --
	-- Comparison with Pure Sequence

	-- | Criterion benchmarks that compare a pure 'Seq.Seq' with 'MaybeIORef' cell
	-- lists: streaming over the structure, folding it, and creating it.
	--
	-- NOTE(review): the argument of @bs@ is only used for the group label; the
	-- benchmarks inside the group do not start any threads. Confirm whether the
	-- "1 threads" / "100 threads" groups are meant to differ.
	--
	main3 :: IO ()
	main3 = defaultMain
	    [ bs 1
	    , bs 100
	    , create
	    ]
	  where
	    create = bgroup "create" $
	        [ bench "seq"
	            $ nf (\s -> Seq.fromList [0..s]) (1000000 :: Int)
	        , bench "cell"
	            $ nfAppIO (testCell @MaybeIORef) 1000000
	        , bench "cell from list"
	            $ nfAppIO (\s -> cellFromList @MaybeIORef @Int (0 L.:| [1..s])) 1000000
	        , bench "cell from list 2"
	            $ nfAppIO (\s -> maybeIORefCellFromList @Int (0 L.:| [1..s])) 1000000
	        ]

	    bs i = bgroup (show i <> " threads")
	        [ bgroup "stream" $
	            [ env (return $ Seq.fromList [0..1000000]) $ \(e :: Seq.Seq Int) -> bench "seq"
	                $ nfAppIO (S.sum_ . S.each) e
	            , env (testCell @MaybeIORef 1000000) $ \e -> bench "cell"
	                $ nfAppIO (S.sum_ . cellToStream) e
	            ]
	        , bgroup "fold" $
	            [ env (return $ Seq.fromList [0..1000000]) $ \(e :: Seq.Seq Int) -> bench "seq"
	                $ nf (foldl' (+) 0) e
	            , env (testCell @MaybeIORef 1000000) $ \e -> bench "cell"
	                $ nfAppIO (foldCell (+) 0) e
	            ]
	        ]

	-- -------------------------------------------------------------------------- --
	-- Criterion Benchmarks

	-- | Runs the 'benchmarks' group for 1, 10 and 1000 concurrent threads.
	main2 :: IO ()
	main2 = defaultMain
	    [ benchmarks 1
	    , benchmarks 10
	    , benchmarks 1000
	    ]

	-- | Criterion group in which @i@ concurrent threads each sum a 10000 element
	-- cell list, once per variable type and access style.
	--
	-- The variants that run the whole traversal inside one 'STM' transaction are
	-- only included when @i <= 1@.
	--
	benchmarks :: Int -> Benchmark
	benchmarks i = bgroup (show i <> " threads")
	    [ env (testCell @MVar 10000) $ \e -> bench "MVar"
	        $ nfAppIO (threaded $ S.sum_ . cellToStream) e
	    , env (testCell @MaybeIORef 10000) $ \e -> bench "MaybeIORef"
	        $ nfAppIO (threaded $ S.sum_ . cellToStream) e

	    , bgroup "TMVar" $
	        [ env (testCell @TMVar 10000) $ \e -> bench "TMVar hoisted"
	            $ nfAppIO (threaded $ S.sum_ . hoist atomically . cellToStream) e
	        , env (testCell @TMVar 10000) $ \e -> bench "TMVar in IO"
	            $ nfAppIO (threaded $ S.sum_ . cellToStream) e
	        ]
	        <> if i > 1 then [] else
	            [ env (testCell @TMVar 10000) $ \e -> bench "TMVar in STM"
	                $ nfAppIO (threaded $ atomically . S.sum_ . cellToStream) e
	            -- , env (testCell @TMVar 10000) $ \e -> bench "foldCell Cell TMVar"
	            --     $ nfAppIO (threaded $ atomically . foldCell ((+) @Int) 0) e
	            ]

	    , bgroup "MaybeTVar" $
	        [ env (testCell @MaybeTVar 10000) $ \e -> bench "MaybeTVar hoisted"
	            $ nfAppIO (threaded $ S.sum_ . hoist atomically . cellToStream) e
	        , env (testCell @MaybeTVar 10000) $ \e -> bench "MaybeTVar in IO"
	            $ nfAppIO (threaded $ S.sum_ . cellToStream) e
	        ]
	        <> if i > 1 then [] else
	            [ env (testCell @MaybeTVar 10000) $ \e -> bench "MaybeTVar in STM"
	                $ nfAppIO (threaded $ atomically . S.sum_ . cellToStream) e
	            ]
	    ]
	  where
	    -- Runs the action on the input in @i@ concurrent threads.
	    threaded f a = replicateConcurrently_ i (f a)