{-# LANGUAGE CPP, NamedFieldPuns, RecordWildCards, ScopedTypeVariables, RankNTypes, DeriveDataTypeable #-} #if !MIN_VERSION_base(4,3,0) {-# LANGUAGE RankNTypes #-} #endif -- | -- Module: Data.Pool -- Copyright: (c) 2011 MailRank, Inc. -- License: BSD3 -- Maintainer: Bryan O'Sullivan , -- Bas van Dijk -- Stability: experimental -- Portability: portable -- -- A high-performance striped pooling abstraction for managing -- flexibly-sized collections of resources such as database -- connections. -- -- \"Striped\" means that a single 'Pool' consists of several -- sub-pools, each managed independently. A single stripe is fine for -- many applications, and probably what you should choose by default. -- More stripes will lead to reduced contention in high-performance -- multicore applications, at a trade-off of causing the maximum -- number of simultaneous resources in use to grow. module Data.Pool ( Pool(idleTime, maxResources, numStripes) , LocalPool , Stats(..) , PoolStats(..) , createPool , withResource , takeResource , tryWithResource , tryTakeResource , destroyResource , putResource , destroyAllResources , stats ) where import Control.Concurrent (ThreadId, forkIOWithUnmask, killThread, myThreadId, threadDelay) import Control.Concurrent.STM import Control.Exception (SomeException, onException, mask_) import Control.Monad (forM_, forever, join, liftM5, unless, when) import Data.Hashable (hash) import Data.IORef (IORef, newIORef, mkWeakIORef) import Data.List (partition) import Data.Pool.WaiterQueue (WaiterQueue, newQueueIO, push, pop) import Data.Time.Clock (NominalDiffTime, UTCTime, diffUTCTime, getCurrentTime) import Data.Typeable (Typeable) import GHC.Conc.Sync (labelThread) import qualified Control.Exception as E import qualified Data.Vector as V import UnliftIO (MonadUnliftIO, mask, withRunInIO) -- | A single resource pool entry. data Entry a = Entry { entry :: a , lastUse :: UTCTime -- ^ Time of last return. } -- | Stats for a single 'LocalPool'. data PoolStats = PoolStats { highwaterUsage :: Int -- ^ Highest usage since last reset. , currentUsage :: Int -- ^ Current number of items. , takes :: Int -- ^ Number of takes since last reset. , creates :: Int -- ^ Number of creates since last reset. , createFailures :: Int -- ^ Number of creation failures since last reset. } deriving (Show) -- | Pool-wide stats. data Stats = Stats { perStripe :: V.Vector PoolStats -- ^ Stats per 'LocalPool' (stripe). , poolStats :: PoolStats -- ^ Aggregate stats across pool. } deriving (Show) -- | A single striped pool. data LocalPool a = LocalPool { inUse :: TVar Int -- ^ Count of open entries (both idle and in use). , entries :: TVar [Entry a] -- ^ Idle entries. , highwaterVar :: TVar Int -- ^ Highest value of 'inUse' since last reset. , takeVar :: TVar Int -- ^ Number of takes since last reset. , createVar :: TVar Int -- ^ Number of creates since last reset. , createFailureVar :: TVar Int -- ^ Number of create failures since last reset. , waiters :: WaiterQueue (TMVar (Maybe (Entry a))) -- ^ threads waiting for a resource , lfin :: IORef () -- ^ empty value used to attach a finalizer to (internal) } deriving (Typeable) data Pool a = Pool { create :: IO a -- ^ Action for creating a new entry to add to the pool. , destroy :: a -> IO () -- ^ Action for destroying an entry that is now done with. , numStripes :: Int -- ^ The number of stripes (distinct sub-pools) to maintain. -- The smallest acceptable value is 1. , idleTime :: NominalDiffTime -- ^ Amount of time for which an unused resource is kept alive. -- The smallest acceptable value is 0.5 seconds. -- -- The elapsed time before closing may be a little longer than -- requested, as the reaper thread wakes at 1-second intervals. , maxResources :: Int -- ^ Maximum number of resources to maintain per stripe. The -- smallest acceptable value is 1. -- -- Requests for resources will block if this limit is reached on a -- single stripe, even if other stripes have idle resources -- available. , localPools :: V.Vector (LocalPool a) -- ^ Per-capability resource pools. , fin :: IORef () -- ^ empty value used to attach a finalizer to (internal) } deriving (Typeable) instance Show (Pool a) where show Pool{..} = "Pool {numStripes = " ++ show numStripes ++ ", " ++ "idleTime = " ++ show idleTime ++ ", " ++ "maxResources = " ++ show maxResources ++ "}" -- | Create a striped resource pool. -- -- Although the garbage collector will destroy all idle resources when -- the pool is garbage collected it's recommended to manually -- 'destroyAllResources' when you're done with the pool so that the -- resources are freed up as soon as possible. createPool :: IO a -- ^ Action that creates a new resource. -> (a -> IO ()) -- ^ Action that destroys an existing resource. -> Int -- ^ The number of stripes (distinct sub-pools) to maintain. -- The smallest acceptable value is 1. -> NominalDiffTime -- ^ Amount of time for which an unused resource is kept open. -- The smallest acceptable value is 0.5 seconds. -- -- The elapsed time before destroying a resource may be a little -- longer than requested, as the reaper thread wakes at 1-second -- intervals. -> Int -- ^ Maximum number of resources to keep open per stripe. The -- smallest acceptable value is 1. -- -- Requests for resources will block if this limit is reached on a -- single stripe, even if other stripes have idle resources -- available. -> IO (Pool a) createPool create destroy numStripes idleTime maxResources = do when (numStripes < 1) $ modError "pool " $ "invalid stripe count " ++ show numStripes when (idleTime < 0.5) $ modError "pool " $ "invalid idle time " ++ show idleTime when (maxResources < 1) $ modError "pool " $ "invalid maximum resource count " ++ show maxResources localPools <- V.replicateM numStripes $ LocalPool <$> newTVarIO 0 <*> newTVarIO [] <*> newTVarIO 0 <*> newTVarIO 0 <*> newTVarIO 0 <*> newTVarIO 0 <*> newQueueIO <*> newIORef () reaperId <- forkIOLabeledWithUnmask "resource-pool: reaper" $ \unmask -> unmask $ reaper destroy idleTime localPools fin <- newIORef () let p = Pool { create , destroy , numStripes , idleTime , maxResources , localPools , fin } mkWeakIORef fin (killThread reaperId) >> V.mapM_ (\lp -> mkWeakIORef (lfin lp) (purgeLocalPool destroy lp)) localPools return p -- TODO: Propose 'forkIOLabeledWithUnmask' for the base library. -- | Sparks off a new thread using 'forkIOWithUnmask' to run the given -- IO computation, but first labels the thread with the given label -- (using 'labelThread'). -- -- The implementation makes sure that asynchronous exceptions are -- masked until the given computation is executed. This ensures the -- thread will always be labeled which guarantees you can always -- easily find it in the GHC event log. -- -- Like 'forkIOWithUnmask', the given computation is given a function -- to unmask asynchronous exceptions. See the documentation of that -- function for the motivation of this. -- -- Returns the 'ThreadId' of the newly created thread. forkIOLabeledWithUnmask :: String -> ((forall a. IO a -> IO a) -> IO ()) -> IO ThreadId forkIOLabeledWithUnmask label m = mask_ $ forkIOWithUnmask $ \unmask -> do tid <- myThreadId labelThread tid label m unmask -- | Periodically go through all pools, closing any resources that -- have been left idle for too long. reaper :: (a -> IO ()) -> NominalDiffTime -> V.Vector (LocalPool a) -> IO () reaper destroy idleTime pools = forever $ do threadDelay (1 * 1000000) now <- getCurrentTime let isStale Entry{..} = now `diffUTCTime` lastUse > idleTime V.forM_ pools $ \LocalPool{..} -> do resources <- atomically $ do (stale,fresh) <- partition isStale <$> readTVar entries unless (null stale) $ do writeTVar entries fresh modifyTVar_ inUse (subtract (length stale)) return (map entry stale) forM_ resources $ \resource -> do destroy resource `E.catch` \(_::SomeException) -> return () -- | Destroy all idle resources of the given 'LocalPool' and remove them from -- the pool. purgeLocalPool :: (a -> IO ()) -> LocalPool a -> IO () purgeLocalPool destroy LocalPool{..} = do resources <- atomically $ do idle <- swapTVar entries [] modifyTVar_ inUse (subtract (length idle)) return (map entry idle) forM_ resources $ \resource -> destroy resource `E.catch` \(_::SomeException) -> return () -- | Temporarily take a resource from a 'Pool', perform an action with -- it, and return it to the pool afterwards. -- -- * If the pool has an idle resource available, it is used -- immediately. -- -- * Otherwise, if the maximum number of resources has not yet been -- reached, a new resource is created and used. -- -- * If the maximum number of resources has been reached, this -- function blocks until a resource becomes available. -- -- If the action throws an exception of any type, the resource is -- destroyed, and not returned to the pool. -- -- It probably goes without saying that you should never manually -- destroy a pooled resource, as doing so will almost certainly cause -- a subsequent user (who expects the resource to be valid) to throw -- an exception. withResource :: MonadUnliftIO m => Pool a -> (a -> m b) -> m b {-# SPECIALIZE withResource :: Pool a -> (a -> IO b) -> IO b #-} withResource pool act = withRunInIO $ \runInIO -> mask $ \restore -> do (resource, local) <- takeResource pool ret <- restore (runInIO (act resource)) `onException` destroyResource pool local resource putResource local resource return ret #if __GLASGOW_HASKELL__ >= 700 {-# INLINABLE withResource #-} #endif -- | Take a resource from the pool, following the same results as -- 'withResource'. Note that this function should be used with caution, as -- improper exception handling can lead to leaked resources. -- -- This function returns both a resource and the @LocalPool@ it came from so -- that it may either be destroyed (via 'destroyResource') or returned to the -- pool (via 'putResource'). takeResource :: Pool a -> IO (a, LocalPool a) takeResource pool@Pool{..} = do local@LocalPool{..} <- getLocalPool pool resource <- join . atomically $ do modifyTVar_ takeVar (+ 1) ents <- readTVar entries case ents of (Entry{..}:es) -> writeTVar entries es >> return (return entry) [] -> do used <- readTVar inUse case used == maxResources of False -> do writeTVar inUse $! used + 1 modifyTVar_ highwaterVar (`max` (used + 1)) modifyTVar_ createVar (+ 1) return $ create `onException` atomically (modifyTVar_ createFailureVar (+ 1) >> destroyResourceSTM local) True -> do var <- newEmptyTMVar removeSelf <- push waiters var let getResource x = case x of Just y -> pure (entry y) Nothing -> create `onException` atomically (destroyResourceSTM local) let dequeue = do maybeEntry <- atomically $ do removeSelf tryTakeTMVar var atomically $ case maybeEntry of Nothing -> pure () Just Nothing -> destroyResourceSTM local Just (Just v) -> putResourceSTM local v return (getResource =<< atomically (takeTMVar var) `onException` dequeue) return (resource, local) #if __GLASGOW_HASKELL__ >= 700 {-# INLINABLE takeResource #-} #endif -- | Similar to 'withResource', but only performs the action if a resource could -- be taken from the pool /without blocking/. Otherwise, 'tryWithResource' -- returns immediately with 'Nothing' (ie. the action function is /not/ called). -- Conversely, if a resource can be borrowed from the pool without blocking, the -- action is performed and it's result is returned, wrapped in a 'Just'. tryWithResource :: forall m a b. MonadUnliftIO m => Pool a -> (a -> m b) -> m (Maybe b) tryWithResource pool act = withRunInIO $ \runInIO -> mask $ \restore -> do res <- tryTakeResource pool case res of Just (resource, local) -> do ret <- restore (runInIO (Just <$> act resource)) `onException` destroyResource pool local resource putResource local resource return ret Nothing -> restore . runInIO $ return (Nothing :: Maybe b) #if __GLASGOW_HASKELL__ >= 700 {-# INLINABLE tryWithResource #-} #endif -- | A non-blocking version of 'takeResource'. The 'tryTakeResource' function -- returns immediately, with 'Nothing' if the pool is exhausted, or @'Just' (a, -- 'LocalPool' a)@ if a resource could be borrowed from the pool successfully. tryTakeResource :: Pool a -> IO (Maybe (a, LocalPool a)) tryTakeResource pool@Pool{..} = do local@LocalPool{..} <- getLocalPool pool resource <- join . atomically $ do ents <- readTVar entries case ents of (Entry{..}:es) -> writeTVar entries es >> return (return . Just $ entry) [] -> do used <- readTVar inUse if used == maxResources then return (return Nothing) else do writeTVar inUse $! used + 1 return $ Just <$> create `onException` atomically (destroyResourceSTM local) return $ (flip (,) local) <$> resource #if __GLASGOW_HASKELL__ >= 700 {-# INLINABLE tryTakeResource #-} #endif -- | Get a (Thread-)'LocalPool' -- -- Internal, just to not repeat code for 'takeResource' and 'tryTakeResource' getLocalPool :: Pool a -> IO (LocalPool a) getLocalPool Pool{..} = do i <- ((`mod` numStripes) . hash) <$> myThreadId return $ localPools V.! i #if __GLASGOW_HASKELL__ >= 700 {-# INLINABLE getLocalPool #-} #endif -- | Destroy a resource. Note that this will ignore any exceptions in the -- destroy function. destroyResource :: Pool a -> LocalPool a -> a -> IO () destroyResource Pool{..} local resource = do destroy resource `E.catch` \(_::SomeException) -> return () atomically (destroyResourceSTM local) #if __GLASGOW_HASKELL__ >= 700 {-# INLINABLE destroyResource #-} #endif -- | Return a resource to the given 'LocalPool'. putResource :: LocalPool a -> a -> IO () putResource lp resource = do now <- getCurrentTime atomically $ putResourceSTM lp (Entry resource now) #if __GLASGOW_HASKELL__ >= 700 {-# INLINABLE putResource #-} #endif putResourceSTM :: LocalPool a -> Entry a -> STM () putResourceSTM LocalPool{..} resourceEntry = do mWaiters <- pop waiters case mWaiters of Nothing -> modifyTVar_ entries (resourceEntry:) Just w -> putTMVar w (Just resourceEntry) {-# INLINE putResourceSTM #-} destroyResourceSTM :: LocalPool a -> STM () destroyResourceSTM LocalPool{..} = do mwaiter <- pop waiters case mwaiter of Nothing -> modifyTVar_ inUse (subtract 1) Just w -> putTMVar w Nothing {-# INLINE destroyResourceSTM #-} -- | Destroy all resources in all stripes in the pool. Note that this -- will ignore any exceptions in the destroy function. -- -- This function is useful when you detect that all resources in the -- pool are broken. For example after a database has been restarted -- all connections opened before the restart will be broken. In that -- case it's better to close those connections so that 'takeResource' -- won't take a broken connection from the pool but will open a new -- connection instead. -- -- Another use-case for this function is that when you know you are -- done with the pool you can destroy all idle resources immediately -- instead of waiting on the garbage collector to destroy them, thus -- freeing up those resources sooner. destroyAllResources :: Pool a -> IO () destroyAllResources Pool{..} = V.forM_ localPools $ purgeLocalPool destroy -- | @stats pool reset@ returns statistics on each 'LocalPool' as well as a summary across the entire Pool. -- When @reset@ is true, the stats are reset. stats :: Pool a -> Bool -> IO Stats stats Pool{..} reset = do let stripeStats LocalPool{..} = atomically $ do s <- liftM5 PoolStats (readTVar highwaterVar) (readTVar inUse) (readTVar takeVar) (readTVar createVar) (readTVar createFailureVar) when reset $ do mapM_ (\v -> writeTVar v 0) [takeVar, createVar, createFailureVar] writeTVar highwaterVar $! currentUsage s return s per <- V.mapM stripeStats localPools let poolWide = V.foldr merge (PoolStats 0 0 0 0 0) per merge (PoolStats hw1 cu1 t1 c1 f1) (PoolStats hw2 cu2 t2 c2 f2) = PoolStats (hw1 + hw2) (cu1 + cu2) (t1 + t2) (c1 + c2) (f1 + f2) return $ Stats per poolWide modifyTVar_ :: TVar a -> (a -> a) -> STM () modifyTVar_ v f = readTVar v >>= \a -> writeTVar v $! f a modError :: String -> String -> a modError func msg = error $ "Data.Pool." ++ func ++ ": " ++ msg