|
|
|
@ -12,25 +12,31 @@ import Control.Concurrent
|
|
|
|
|
import Control.Concurrent.Async
|
|
|
|
|
import Control.Concurrent.STM
|
|
|
|
|
import Control.Exception (Exception (..), try)
|
|
|
|
|
import Control.Monad (foldM, forM_, forever, void, when)
|
|
|
|
|
import Control.Monad (foldM, forM, forM_, forever, unless,
|
|
|
|
|
void, when)
|
|
|
|
|
import Control.Monad.IO.Class (liftIO)
|
|
|
|
|
import Data.Bifunctor
|
|
|
|
|
import qualified Data.ByteString.Lazy.UTF8 as BSUL
|
|
|
|
|
import qualified Data.ByteString.UTF8 as BSU
|
|
|
|
|
import qualified Data.DList as D
|
|
|
|
|
import Data.Either (lefts, rights)
|
|
|
|
|
import qualified Data.HashMap.Strict as HMap
|
|
|
|
|
import qualified Data.HashSet as HSet
|
|
|
|
|
import Data.Maybe (isJust)
|
|
|
|
|
import Data.Maybe (fromJust, isJust)
|
|
|
|
|
import Data.String (fromString)
|
|
|
|
|
import Data.Text.Lazy (Text)
|
|
|
|
|
import qualified Data.Text.Lazy as Txt
|
|
|
|
|
import qualified Data.Text.Lazy.IO as TxtI
|
|
|
|
|
import Data.Text.Normalize (NormalizationMode (NFC), normalize)
|
|
|
|
|
import Data.Time.Clock.POSIX
|
|
|
|
|
import Data.Typeable (Typeable)
|
|
|
|
|
import qualified Network.HTTP.Client as HTTP
|
|
|
|
|
import qualified Network.HTTP.Types as HTTPT
|
|
|
|
|
import System.IO
|
|
|
|
|
import System.Random
|
|
|
|
|
import Text.Read (readEither)
|
|
|
|
|
|
|
|
|
|
import Formatting (fixed, format, int, (%))
|
|
|
|
|
import qualified Network.Wai.Handler.Warp as Warp
|
|
|
|
|
import Servant
|
|
|
|
|
import Servant.Client
|
|
|
|
@ -38,7 +44,9 @@ import Servant.Client
|
|
|
|
|
import Hash2Pub.FediChordTypes
|
|
|
|
|
import Hash2Pub.PostService.API
|
|
|
|
|
import Hash2Pub.RingMap
|
|
|
|
|
import Hash2Pub.Utils
|
|
|
|
|
|
|
|
|
|
import Debug.Trace
|
|
|
|
|
|
|
|
|
|
data PostService d = PostService
|
|
|
|
|
{ serviceConf :: ServiceConf
|
|
|
|
@ -49,13 +57,16 @@ data PostService d = PostService
|
|
|
|
|
-- ^ for each tag store the subscribers + their queue
|
|
|
|
|
, ownSubscriptions :: TVar (HMap.HashMap NodeID POSIXTime)
|
|
|
|
|
-- ^ tags subscribed by the own node have an assigned lease time
|
|
|
|
|
, ownPosts :: TVar (HSet.HashSet Text)
|
|
|
|
|
-- ^ just store the existence of posts for saving memory,
|
|
|
|
|
, relayInQueue :: TQueue (Hashtag, PostID, PostContent)
|
|
|
|
|
-- ^ Queue for processing incoming posts of own instance asynchronously
|
|
|
|
|
, postFetchQueue :: TQueue PostID
|
|
|
|
|
-- ^ queue of posts to be fetched
|
|
|
|
|
, migrationsInProgress :: TVar (HMap.HashMap NodeID (MVar ()))
|
|
|
|
|
, httpMan :: HTTP.Manager
|
|
|
|
|
, statsQueue :: TQueue StatsEvent
|
|
|
|
|
, loadStats :: TVar RelayStats
|
|
|
|
|
-- ^ current load stats, replaced periodically
|
|
|
|
|
, logFileHandle :: Handle
|
|
|
|
|
}
|
|
|
|
|
deriving (Typeable)
|
|
|
|
|
|
|
|
|
@ -79,26 +90,38 @@ instance DHT d => Service PostService d where
|
|
|
|
|
threadVar <- newTVarIO =<< myThreadId -- own thread ID as placeholder
|
|
|
|
|
subscriberVar <- newTVarIO emptyRMap
|
|
|
|
|
ownSubsVar <- newTVarIO HMap.empty
|
|
|
|
|
ownPostVar <- newTVarIO HSet.empty
|
|
|
|
|
--ownPostVar <- newTVarIO HSet.empty
|
|
|
|
|
relayInQueue' <- newTQueueIO
|
|
|
|
|
postFetchQueue' <- newTQueueIO
|
|
|
|
|
migrationsInProgress' <- newTVarIO HMap.empty
|
|
|
|
|
httpMan' <- HTTP.newManager HTTP.defaultManagerSettings
|
|
|
|
|
statsQueue' <- newTQueueIO
|
|
|
|
|
loadStats' <- newTVarIO emptyStats
|
|
|
|
|
loggingFile <- openFile (confLogfilePath conf) WriteMode
|
|
|
|
|
hSetBuffering loggingFile LineBuffering
|
|
|
|
|
let
|
|
|
|
|
thisService = PostService {
|
|
|
|
|
serviceConf = conf
|
|
|
|
|
thisService = PostService
|
|
|
|
|
{ serviceConf = conf
|
|
|
|
|
, baseDHT = dht
|
|
|
|
|
, serviceThread = threadVar
|
|
|
|
|
, subscribers = subscriberVar
|
|
|
|
|
, ownSubscriptions = ownSubsVar
|
|
|
|
|
, ownPosts = ownPostVar
|
|
|
|
|
--, ownPosts = ownPostVar
|
|
|
|
|
, relayInQueue = relayInQueue'
|
|
|
|
|
, postFetchQueue = postFetchQueue'
|
|
|
|
|
, migrationsInProgress = migrationsInProgress'
|
|
|
|
|
, httpMan = httpMan'
|
|
|
|
|
}
|
|
|
|
|
, statsQueue = statsQueue'
|
|
|
|
|
, loadStats = loadStats'
|
|
|
|
|
, logFileHandle = loggingFile
|
|
|
|
|
}
|
|
|
|
|
port' = fromIntegral (confServicePort conf)
|
|
|
|
|
warpSettings = Warp.setPort port' . Warp.setHost (fromString . confServiceHost $ conf) $ Warp.defaultSettings
|
|
|
|
|
-- log a start message, this also truncates existing files
|
|
|
|
|
TxtI.hPutStrLn loggingFile $ Txt.unlines
|
|
|
|
|
[ "# Starting mock relay implementation"
|
|
|
|
|
, "#time stamp ; relay receive rate ;relay delivery rate ;instance publish rate ;instance fetch rate ;total subscriptions"
|
|
|
|
|
]
|
|
|
|
|
-- Run 'concurrently_' from another thread to be able to return the
|
|
|
|
|
-- 'PostService'.
|
|
|
|
|
-- Terminating that parent thread will make all child threads terminate as well.
|
|
|
|
@ -106,7 +129,11 @@ instance DHT d => Service PostService d where
|
|
|
|
|
concurrently_
|
|
|
|
|
-- web server
|
|
|
|
|
(Warp.runSettings warpSettings $ postServiceApplication thisService)
|
|
|
|
|
(processIncomingPosts thisService)
|
|
|
|
|
$ concurrently
|
|
|
|
|
-- background processing workers
|
|
|
|
|
(launchWorkerThreads thisService)
|
|
|
|
|
-- statistics/ measurements
|
|
|
|
|
(launchStatsThreads thisService)
|
|
|
|
|
-- update thread ID after fork
|
|
|
|
|
atomically $ writeTVar threadVar servThreadID
|
|
|
|
|
pure thisService
|
|
|
|
@ -150,6 +177,7 @@ postServer service = relayInbox service
|
|
|
|
|
:<|> tagUnsubscribe service
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-- | delivery endpoint: receive posts of a handled tag and enqueue them for relaying
|
|
|
|
|
relayInbox :: DHT d => PostService d -> Hashtag -> Text -> Handler NoContent
|
|
|
|
|
relayInbox serv tag posts = do
|
|
|
|
|
let
|
|
|
|
@ -166,8 +194,10 @@ relayInbox serv tag posts = do
|
|
|
|
|
-- if noone subscribed to the tag, nothing needs to be done
|
|
|
|
|
(pure ())
|
|
|
|
|
-- otherwise enqueue posts into broadcast queue of the tag
|
|
|
|
|
(\queue ->
|
|
|
|
|
(\queue -> do
|
|
|
|
|
liftIO $ forM_ postIDs (atomically . writeTChan queue)
|
|
|
|
|
-- report the received post for statistic purposes
|
|
|
|
|
liftIO . atomically . writeTQueue (statsQueue serv) $ StatsEvent RelayReceiveEvent (length postIDs) (hashtagToId tag)
|
|
|
|
|
)
|
|
|
|
|
broadcastChan
|
|
|
|
|
pure NoContent
|
|
|
|
@ -178,6 +208,7 @@ newtype UnhandledTagException = UnhandledTagException String
|
|
|
|
|
|
|
|
|
|
instance Exception UnhandledTagException
|
|
|
|
|
|
|
|
|
|
-- | delivery endpoint: receives a list of subscribers of tags and their outstanding queues for migration
|
|
|
|
|
subscriptionDelivery :: DHT d => PostService d -> Integer -> Text -> Handler Text
|
|
|
|
|
subscriptionDelivery serv senderID subList = do
|
|
|
|
|
let
|
|
|
|
@ -223,27 +254,30 @@ subscriptionDelivery serv senderID subList = do
|
|
|
|
|
enqueueSubscription subscriberSTM (normaliseTag tag) sub postList leaseTime
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-- | endpoint for fetching a post by its ID
|
|
|
|
|
postFetch :: PostService d -> Text -> Handler Text
|
|
|
|
|
postFetch serv postID = do
|
|
|
|
|
postSet <- liftIO . readTVarIO . ownPosts $ serv
|
|
|
|
|
if HSet.member postID postSet
|
|
|
|
|
-- decision: always return the same placeholder post
|
|
|
|
|
then pure placeholderPost
|
|
|
|
|
else throwError $ err404 { errBody = "No post found with this ID" }
|
|
|
|
|
postFetch serv _ = do
|
|
|
|
|
-- decision: for saving memory do not store published posts, just
|
|
|
|
|
-- pretend there is a post for each requested ID
|
|
|
|
|
liftIO . atomically . writeTQueue (statsQueue serv) $ StatsEvent IncomingPostFetchEvent 1 0 -- tag fetched for is irrelevant
|
|
|
|
|
pure placeholderPost
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-- | endpoint for fetching multiple posts of this instance by their IDs
|
|
|
|
|
postMultiFetch :: PostService d -> Text -> Handler Text
|
|
|
|
|
postMultiFetch serv postIDs = do
|
|
|
|
|
let idList = Txt.lines postIDs
|
|
|
|
|
postSet <- liftIO . readTVarIO . ownPosts $ serv
|
|
|
|
|
-- look up existence of all given post IDs, fail if even one is missing
|
|
|
|
|
foldM (\response postID ->
|
|
|
|
|
if HSet.member postID postSet
|
|
|
|
|
then pure $ placeholderPost <> "\n" <> response
|
|
|
|
|
else throwError $ err404 { errBody = "No post found with this ID" }
|
|
|
|
|
let
|
|
|
|
|
idList = Txt.lines postIDs
|
|
|
|
|
-- decision: for saving memory do not store published posts, just
|
|
|
|
|
-- pretend there is a post for each requested ID
|
|
|
|
|
response = foldl (\response' _ ->
|
|
|
|
|
placeholderPost <> "\n" <> response'
|
|
|
|
|
) "" idList
|
|
|
|
|
liftIO . atomically . writeTQueue (statsQueue serv) $ StatsEvent IncomingPostFetchEvent (length idList) 0 -- tag fetched for is irrelevant
|
|
|
|
|
pure response
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-- | delivery endpoint: inbox for initially publishing a post at an instance
|
|
|
|
|
postInbox :: PostService d -> Text -> Handler NoContent
|
|
|
|
|
postInbox serv post = do
|
|
|
|
|
-- extract contained hashtags
|
|
|
|
@ -251,8 +285,7 @@ postInbox serv post = do
|
|
|
|
|
containedTags = fmap (normaliseTag . Txt.tail) . filter ((==) '#' . Txt.head) . Txt.words $ post
|
|
|
|
|
-- generate post ID
|
|
|
|
|
postId <- liftIO $ Txt.pack . show <$> (randomRIO (0, 2^(128::Integer)-1) :: IO Integer)
|
|
|
|
|
-- add ID to own posts
|
|
|
|
|
liftIO . atomically $ modifyTVar' (ownPosts serv) (HSet.insert postId)
|
|
|
|
|
-- decision: for saving memory do not store published post IDs, just deliver a post for any requested ID
|
|
|
|
|
-- enqueue a relay job for each tag
|
|
|
|
|
liftIO $ forM_ (containedTags :: [Text]) (\tag ->
|
|
|
|
|
atomically $ writeTQueue (relayInQueue serv) (tag, postId, post)
|
|
|
|
@ -260,6 +293,7 @@ postInbox serv post = do
|
|
|
|
|
pure NoContent
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-- | delivery endpoint: receive postIDs of a certain subscribed hashtag
|
|
|
|
|
tagDelivery :: PostService d -> Text -> Text -> Handler Text
|
|
|
|
|
tagDelivery serv hashtag posts = do
|
|
|
|
|
let postIDs = Txt.lines posts
|
|
|
|
@ -271,6 +305,8 @@ tagDelivery serv hashtag posts = do
|
|
|
|
|
pure ()
|
|
|
|
|
pure $ "Received a postID for tag " <> hashtag
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-- | receive subscription requests to a handled hashtag
|
|
|
|
|
tagSubscribe :: DHT d => PostService d -> Text -> Maybe Text -> Handler Integer
|
|
|
|
|
tagSubscribe serv hashtag origin = do
|
|
|
|
|
responsible <- liftIO $ isResponsibleFor (baseDHT serv) (hashtagToId hashtag)
|
|
|
|
@ -287,9 +323,11 @@ tagSubscribe serv hashtag origin = do
|
|
|
|
|
let leaseTime = now + confSubscriptionExpiryTime (serviceConf serv)
|
|
|
|
|
-- setup subscription entry
|
|
|
|
|
_ <- liftIO . atomically $ setupSubscriberChannel (subscribers serv) hashtag (BSU.toString $ HTTP.host req, HTTP.port req) leaseTime
|
|
|
|
|
--liftIO . putStrLn $ "just got a subscription to " <> Txt.unpack hashtag
|
|
|
|
|
pure $ round leaseTime
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-- | receive and handle unsubscription requests regarding a handled tag
|
|
|
|
|
tagUnsubscribe :: DHT d => PostService d -> Text -> Maybe Text -> Handler Text
|
|
|
|
|
tagUnsubscribe serv hashtag origin = do
|
|
|
|
|
responsible <- liftIO $ isResponsibleFor (baseDHT serv) (hashtagToId hashtag)
|
|
|
|
@ -310,15 +348,15 @@ tagUnsubscribe serv hashtag origin = do
|
|
|
|
|
clientAPI :: Proxy PostServiceAPI
|
|
|
|
|
clientAPI = Proxy
|
|
|
|
|
|
|
|
|
|
relayInboxClient :: Text -> Text -> ClientM NoContent
|
|
|
|
|
relayInboxClient :<|> subscriptionDeliveryClient
|
|
|
|
|
:<|> postFetchClient
|
|
|
|
|
:<|> postMultiFetchClient
|
|
|
|
|
:<|> postInboxClient
|
|
|
|
|
:<|> tagDeliveryClient
|
|
|
|
|
:<|> tagSubscribeClient
|
|
|
|
|
:<|> tagUnsubscribeClient
|
|
|
|
|
= client clientAPI
|
|
|
|
|
relayInboxClient
|
|
|
|
|
:<|> subscriptionDeliveryClient
|
|
|
|
|
:<|> postFetchClient
|
|
|
|
|
:<|> postMultiFetchClient
|
|
|
|
|
:<|> postInboxClient
|
|
|
|
|
:<|> tagDeliveryClient
|
|
|
|
|
:<|> tagSubscribeClient
|
|
|
|
|
:<|> tagUnsubscribeClient
|
|
|
|
|
= client clientAPI
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-- | Deliver the subscriber list of all hashtags in the interval [fromTag, toTag]
|
|
|
|
@ -388,10 +426,12 @@ clientSubscribeTo serv tag = do
|
|
|
|
|
Left (FailureResponse _ fresp)
|
|
|
|
|
|(HTTPT.statusCode . responseStatusCode $ fresp) == 410 && allowRetry -> do -- responsibility gone, force new lookup
|
|
|
|
|
newRes <- forceLookupKey (baseDHT serv) (Txt.unpack tag)
|
|
|
|
|
--putStrLn $ "failed subscribing to " <> Txt.unpack tag <> " on " <> foundHost
|
|
|
|
|
doSubscribe newRes False
|
|
|
|
|
Left err -> pure . Left . show $ err
|
|
|
|
|
Right lease -> do
|
|
|
|
|
atomically . modifyTVar' (ownSubscriptions serv) $ HMap.insert (hashtagToId tag) (fromInteger lease)
|
|
|
|
|
--putStrLn $ "just subscribed to " <> Txt.unpack tag <> " on " <> foundHost
|
|
|
|
|
pure . Right $ lease
|
|
|
|
|
)
|
|
|
|
|
lookupResponse
|
|
|
|
@ -525,15 +565,37 @@ lookupTagSubscriptions :: Hashtag -> RingMap NodeID a -> Maybe a
|
|
|
|
|
lookupTagSubscriptions tag = rMapLookup (hashtagToId tag)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-- normalise the unicode representation of a string to NFC
|
|
|
|
|
-- normalise the unicode representation of a string to NFC and convert to lower case
|
|
|
|
|
normaliseTag :: Text -> Text
|
|
|
|
|
normaliseTag = Txt.fromStrict . normalize NFC . Txt.toStrict
|
|
|
|
|
normaliseTag = Txt.toLower . Txt.fromStrict . normalize NFC . Txt.toStrict
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-- | convert a hashtag to its representation on the DHT
|
|
|
|
|
hashtagToId :: Hashtag -> NodeID
|
|
|
|
|
hashtagToId = genKeyID . Txt.unpack
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
readUpToTChan :: Int -> TChan a -> STM [a]
|
|
|
|
|
readUpToTChan 0 _ = pure []
|
|
|
|
|
readUpToTChan n chan = do
|
|
|
|
|
readFromChan <- tryReadTChan chan
|
|
|
|
|
case readFromChan of
|
|
|
|
|
Nothing -> pure []
|
|
|
|
|
Just val -> do
|
|
|
|
|
moreReads <- readUpToTChan (pred n) chan
|
|
|
|
|
pure (val:moreReads)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
readUpToTQueue :: Int -> TQueue a -> STM [a]
|
|
|
|
|
readUpToTQueue 0 _ = pure []
|
|
|
|
|
readUpToTQueue n q = do
|
|
|
|
|
readFromQueue <- tryReadTQueue q
|
|
|
|
|
case readFromQueue of
|
|
|
|
|
Nothing -> pure []
|
|
|
|
|
Just val -> do
|
|
|
|
|
moreReads <- readUpToTQueue (pred n) q
|
|
|
|
|
pure (val:moreReads)
|
|
|
|
|
|
|
|
|
|
-- | define how to convert all showable types to PlainText
|
|
|
|
|
-- No idea what I'm doing with these overlappable instances though ¯\_(ツ)_/¯
|
|
|
|
|
-- TODO: figure out how this overlapping stuff actually works https://downloads.haskell.org/~ghc/latest/docs/html/users_guide/glasgow_exts.html#instance-overlap
|
|
|
|
@ -545,36 +607,78 @@ instance {-# OVERLAPPABLE #-} Read a => MimeUnrender PlainText a where
|
|
|
|
|
|
|
|
|
|
-- ====== worker threads ======
|
|
|
|
|
|
|
|
|
|
-- TODO: make configurable
|
|
|
|
|
numParallelDeliveries = 10
|
|
|
|
|
|
|
|
|
|
launchWorkerThreads :: DHT d => PostService d -> IO ()
|
|
|
|
|
launchWorkerThreads serv = concurrently_
|
|
|
|
|
(processIncomingPosts serv)
|
|
|
|
|
$ concurrently_
|
|
|
|
|
(purgeSubscriptionsThread serv)
|
|
|
|
|
$ concurrently_
|
|
|
|
|
(fetchTagPosts serv)
|
|
|
|
|
(relayWorker serv)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-- | periodically remove expired subscription entries from relay subscribers
|
|
|
|
|
purgeSubscriptionsThread :: PostService d -> IO ()
|
|
|
|
|
purgeSubscriptionsThread serv = forever $ do
|
|
|
|
|
-- read config
|
|
|
|
|
now <- getPOSIXTime
|
|
|
|
|
let
|
|
|
|
|
purgeInterval = confSubscriptionExpiryTime (serviceConf serv) / 10
|
|
|
|
|
-- no need to atomically lock this, as newly incoming subscriptions do not
|
|
|
|
|
-- need to be purged
|
|
|
|
|
tagMap <- readTVarIO $ subscribers serv
|
|
|
|
|
forM_ tagMap $ \(subscriberMapSTM, _, _) ->
|
|
|
|
|
-- but each subscriberMap needs to be modified atomically
|
|
|
|
|
atomically . modifyTVar' subscriberMapSTM $ HMap.filter (\(_, ts) -> ts > now)
|
|
|
|
|
threadDelay $ fromEnum purgeInterval `div` 10^6
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-- | process the pending relay inbox of incoming posts from the internal queue:
|
|
|
|
|
-- Look up responsible relay node for given hashtag and forward post to it
|
|
|
|
|
processIncomingPosts :: DHT d => PostService d -> IO ()
|
|
|
|
|
processIncomingPosts serv = forever $ do
|
|
|
|
|
-- blocks until available
|
|
|
|
|
-- TODO: process multiple in parallel
|
|
|
|
|
(tag, pID, pContent) <- atomically . readTQueue $ relayInQueue serv
|
|
|
|
|
let pIdUri = "http://" <> (Txt.pack . confServiceHost . serviceConf $ serv) <> ":" <> (fromString . show . confServicePort . serviceConf $ serv) <> "/post/" <> pID
|
|
|
|
|
lookupRes <- lookupKey (baseDHT serv) (Txt.unpack tag)
|
|
|
|
|
case lookupRes of
|
|
|
|
|
-- no vserver active => wait and retry
|
|
|
|
|
Nothing -> threadDelay $ 10 * 10^6
|
|
|
|
|
Just (responsibleHost, responsiblePort) -> do
|
|
|
|
|
resp <- runClientM (relayInboxClient tag $ pIdUri <> "," <> pContent) (mkClientEnv (httpMan serv) (BaseUrl Http responsibleHost (fromIntegral responsiblePort) ""))
|
|
|
|
|
case resp of
|
|
|
|
|
Left err -> do
|
|
|
|
|
putStrLn $ "Error: " <> show err
|
|
|
|
|
-- 410 error indicates outdated responsibility mapping
|
|
|
|
|
-- Simplification: just invalidate the mapping entry on all errors, force a re-lookup and re-queue the post
|
|
|
|
|
-- TODO: keep track of maximum retries
|
|
|
|
|
_ <- forceLookupKey (baseDHT serv) (Txt.unpack tag)
|
|
|
|
|
atomically . writeTQueue (relayInQueue serv) $ (tag, pID, pContent)
|
|
|
|
|
Right _ -> do
|
|
|
|
|
-- TODO: stats
|
|
|
|
|
-- idea for the experiment: each post publication makes the initial posting instance subscribe to all contained tags
|
|
|
|
|
now <- getPOSIXTime
|
|
|
|
|
subscriptionStatus <- HMap.lookup (hashtagToId tag) <$> readTVarIO (ownSubscriptions serv)
|
|
|
|
|
-- if not yet subscribed or subscription expires within 2 minutes, (re)subscribe to tag
|
|
|
|
|
when (maybe False (\subLease -> now - subLease < 120) subscriptionStatus) $
|
|
|
|
|
void $ clientSubscribeTo serv tag
|
|
|
|
|
deliveriesToProcess <- atomically $ do
|
|
|
|
|
readResult <- readUpToTQueue numParallelDeliveries $ relayInQueue serv
|
|
|
|
|
if null readResult
|
|
|
|
|
then retry
|
|
|
|
|
else pure readResult
|
|
|
|
|
runningJobs <- forM deliveriesToProcess $ \(tag, pID, pContent) -> async $ do
|
|
|
|
|
let pIdUri = "http://" <> (Txt.pack . confServiceHost . serviceConf $ serv) <> ":" <> (fromString . show . confServicePort . serviceConf $ serv) <> "/post/" <> pID
|
|
|
|
|
lookupRes <- lookupKey (baseDHT serv) (Txt.unpack tag)
|
|
|
|
|
case lookupRes of
|
|
|
|
|
-- no vserver active => wait and retry
|
|
|
|
|
Nothing -> threadDelay (10 * 10^6) >> pure (Left "no vserver active")
|
|
|
|
|
Just (responsibleHost, responsiblePort) -> do
|
|
|
|
|
resp <- runClientM (relayInboxClient tag $ pIdUri <> "," <> pContent) (mkClientEnv (httpMan serv) (BaseUrl Http responsibleHost (fromIntegral responsiblePort) ""))
|
|
|
|
|
case resp of
|
|
|
|
|
Left err -> do
|
|
|
|
|
-- 410 error indicates outdated responsibility mapping
|
|
|
|
|
-- Simplification: just invalidate the mapping entry on all errors, force a re-lookup and re-queue the post
|
|
|
|
|
-- TODO: keep track of maximum retries
|
|
|
|
|
_ <- forceLookupKey (baseDHT serv) (Txt.unpack tag)
|
|
|
|
|
atomically . writeTQueue (relayInQueue serv) $ (tag, pID, pContent)
|
|
|
|
|
pure . Left $ "Error: " <> show err
|
|
|
|
|
Right _ -> do
|
|
|
|
|
-- idea for the experiment: each post publication makes the initial posting instance subscribe to all contained tags
|
|
|
|
|
now <- getPOSIXTime
|
|
|
|
|
subscriptionStatus <- HMap.lookup (hashtagToId tag) <$> readTVarIO (ownSubscriptions serv)
|
|
|
|
|
-- if not yet subscribed or subscription expires within 5 minutes, (re)subscribe to tag
|
|
|
|
|
when (maybe True (\subLease -> now - subLease < 300) subscriptionStatus) $
|
|
|
|
|
void $ clientSubscribeTo serv tag
|
|
|
|
|
|
|
|
|
|
-- for evaluation, return the tag of the successfully forwarded post
|
|
|
|
|
pure $ Right tag
|
|
|
|
|
|
|
|
|
|
-- collect async results
|
|
|
|
|
results <- mapM waitCatch runningJobs
|
|
|
|
|
-- report the count of published posts for statistics
|
|
|
|
|
atomically . writeTQueue (statsQueue serv) $ StatsEvent PostPublishEvent (length . rights $ results) 0 -- hashtag published to doesn't matter
|
|
|
|
|
pure ()
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-- | process the pending fetch jobs of delivered post IDs: Delivered posts are tried to be fetched from their URI-ID
|
|
|
|
@ -588,14 +692,193 @@ fetchTagPosts serv = forever $ do
|
|
|
|
|
resp <- try $ HTTP.httpLbs fetchReq (httpMan serv) :: IO (Either HTTP.HttpException (HTTP.Response BSUL.ByteString))
|
|
|
|
|
case resp of
|
|
|
|
|
Right response ->
|
|
|
|
|
if HTTPT.statusCode (HTTP.responseStatus response) == 200
|
|
|
|
|
then
|
|
|
|
|
-- success, TODO: statistics
|
|
|
|
|
putStrLn "post fetch success"
|
|
|
|
|
else
|
|
|
|
|
-- TODO error handling, retry
|
|
|
|
|
pure ()
|
|
|
|
|
-- TODO error handling, retry
|
|
|
|
|
--if HTTPT.statusCode (HTTP.responseStatus response) == 200
|
|
|
|
|
-- then
|
|
|
|
|
-- -- success, TODO: statistics
|
|
|
|
|
-- else
|
|
|
|
|
pure ()
|
|
|
|
|
Left _ ->
|
|
|
|
|
-- TODO error handling, retry
|
|
|
|
|
pure ()
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
relayWorker :: PostService d -> IO ()
|
|
|
|
|
relayWorker serv = forever $ do
|
|
|
|
|
-- atomically (to be able to retry) fold a list of due delivery actions
|
|
|
|
|
jobsToProcess <- atomically $ do
|
|
|
|
|
subscriptionMap <- readTVar $ subscribers serv
|
|
|
|
|
jobList <- D.toList <$> foldM (\jobAcc (subscriberMapSTM, _, tag) -> do
|
|
|
|
|
subscriberMap <- readTVar subscriberMapSTM
|
|
|
|
|
foldM (\jobAcc' ((subHost, subPort), (postChan, _)) -> do
|
|
|
|
|
postsToDeliver <- readUpToTChan 500 postChan
|
|
|
|
|
let postDeliveryAction = runClientM (tagDeliveryClient tag (Txt.unlines postsToDeliver)) (mkClientEnv (httpMan serv) (BaseUrl Http subHost (fromIntegral subPort) ""))
|
|
|
|
|
-- append relay push job to job list
|
|
|
|
|
pure $ if not (null postsToDeliver)
|
|
|
|
|
then jobAcc' `D.snoc` (do
|
|
|
|
|
deliveryResult <- postDeliveryAction
|
|
|
|
|
either
|
|
|
|
|
(const $ pure ())
|
|
|
|
|
-- on successful push, record that event for statistics
|
|
|
|
|
(const . atomically . writeTQueue (statsQueue serv) $ StatsEvent RelayDeliveryEvent (length postsToDeliver) (hashtagToId tag))
|
|
|
|
|
deliveryResult
|
|
|
|
|
pure deliveryResult
|
|
|
|
|
)
|
|
|
|
|
else jobAcc'
|
|
|
|
|
) jobAcc $ HMap.toList subscriberMap
|
|
|
|
|
) D.empty subscriptionMap
|
|
|
|
|
-- if no relay jobs, then retry
|
|
|
|
|
if null jobList
|
|
|
|
|
then retry
|
|
|
|
|
else pure jobList
|
|
|
|
|
|
|
|
|
|
-- when processing the list, send several deliveries in parallel
|
|
|
|
|
forM_ (chunksOf numParallelDeliveries jobsToProcess) $ \jobset -> do
|
|
|
|
|
runningJobs <- mapM async jobset
|
|
|
|
|
-- so far just dropping failed attempts, TODO: retry mechanism
|
|
|
|
|
results <- mapM waitCatch runningJobs
|
|
|
|
|
let
|
|
|
|
|
successfulResults = rights results
|
|
|
|
|
unsuccessfulResults = lefts results
|
|
|
|
|
unless (null unsuccessfulResults) $ putStrLn ("ERR: " <> show (length unsuccessfulResults) <> " failed deliveries!")
|
|
|
|
|
putStrLn $ "successfully relayed " <> show (length successfulResults)
|
|
|
|
|
pure ()
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-- ======= statistics/measurement and logging =======
|
|
|
|
|
|
|
|
|
|
data StatsEventType = PostPublishEvent
|
|
|
|
|
| RelayReceiveEvent
|
|
|
|
|
| RelayDeliveryEvent
|
|
|
|
|
| IncomingPostFetchEvent
|
|
|
|
|
deriving (Enum, Show, Eq)
|
|
|
|
|
|
|
|
|
|
-- | Represents measurement event of a 'StatsEventType' with a count relevant for a certain key
|
|
|
|
|
data StatsEvent = StatsEvent StatsEventType Int NodeID
|
|
|
|
|
deriving (Show, Eq)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-- | measured rates of relay performance
|
|
|
|
|
-- TODO: maybe include other metrics in here as well, like number of subscribers?
|
|
|
|
|
data RelayStats = RelayStats
|
|
|
|
|
{ relayReceiveRates :: RingMap NodeID Double
|
|
|
|
|
-- ^ rate of incoming posts in the responsibility of this relay
|
|
|
|
|
, relayDeliveryRates :: RingMap NodeID Double
|
|
|
|
|
-- ^ rate of relayed outgoing posts
|
|
|
|
|
, postFetchRate :: Double -- no need to differentiate between tags
|
|
|
|
|
-- ^ number of post-fetches delivered
|
|
|
|
|
, postPublishRate :: Double
|
|
|
|
|
-- ^ rate of initially publishing posts through this instance
|
|
|
|
|
}
|
|
|
|
|
deriving (Show, Eq)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
launchStatsThreads :: PostService d -> IO ()
|
|
|
|
|
launchStatsThreads serv = do
|
|
|
|
|
-- create shared accumulator
|
|
|
|
|
sharedAccum <- newTVarIO emptyStats
|
|
|
|
|
concurrently_
|
|
|
|
|
(accumulateStatsThread sharedAccum $ statsQueue serv)
|
|
|
|
|
(evaluateStatsThread serv sharedAccum)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-- | Read stats events from queue and add them to a shared accumulator.
|
|
|
|
|
-- Instead of letting the events accumulate in the queue and allocate linear memory, immediately fold the result.
|
|
|
|
|
accumulateStatsThread :: TVar RelayStats -> TQueue StatsEvent -> IO ()
|
|
|
|
|
accumulateStatsThread statsAccumulator statsQ = forever $ do
|
|
|
|
|
-- blocks until stats event arrives
|
|
|
|
|
event <- atomically $ readTQueue statsQ
|
|
|
|
|
-- add the event number to current accumulator
|
|
|
|
|
atomically $ modifyTVar' statsAccumulator $ statsAdder event
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-- | add incoming stats events to accumulator value
|
|
|
|
|
statsAdder :: StatsEvent -> RelayStats -> RelayStats
|
|
|
|
|
statsAdder event stats = case event of
|
|
|
|
|
StatsEvent PostPublishEvent num _ ->
|
|
|
|
|
stats {postPublishRate = fromIntegral num + postPublishRate stats}
|
|
|
|
|
StatsEvent RelayReceiveEvent num key ->
|
|
|
|
|
stats {relayReceiveRates = sumIfEntryExists key (fromIntegral num) (relayReceiveRates stats)}
|
|
|
|
|
StatsEvent RelayDeliveryEvent num key ->
|
|
|
|
|
stats {relayDeliveryRates = sumIfEntryExists key (fromIntegral num) (relayDeliveryRates stats)}
|
|
|
|
|
StatsEvent IncomingPostFetchEvent num _ ->
|
|
|
|
|
stats {postFetchRate = fromIntegral num + postFetchRate stats}
|
|
|
|
|
where
|
|
|
|
|
sumIfEntryExists = addRMapEntryWith (\newVal oldVal ->
|
|
|
|
|
let toInsert = fromJust $ extractRingEntry newVal
|
|
|
|
|
in
|
|
|
|
|
case oldVal of
|
|
|
|
|
KeyEntry n -> KeyEntry (n + toInsert)
|
|
|
|
|
ProxyEntry pointer (Just (KeyEntry n)) -> ProxyEntry pointer (Just (KeyEntry $ n + toInsert))
|
|
|
|
|
ProxyEntry pointer Nothing -> ProxyEntry pointer (Just newVal)
|
|
|
|
|
_ -> error "RingMap nested too deeply"
|
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-- Periodically exchange the accumulated statistics with empty ones, evaluate them
|
|
|
|
|
-- and make them the current statistics of the service.
|
|
|
|
|
evaluateStatsThread :: PostService d -> TVar RelayStats -> IO ()
|
|
|
|
|
evaluateStatsThread serv statsAcc = getPOSIXTime >>= loop
|
|
|
|
|
where
|
|
|
|
|
loop previousTs = do
|
|
|
|
|
threadDelay $ confStatsEvalDelay (serviceConf serv)
|
|
|
|
|
-- get and reset the stats accumulator
|
|
|
|
|
summedStats <- atomically $ do
|
|
|
|
|
stats <- readTVar statsAcc
|
|
|
|
|
writeTVar statsAcc emptyStats
|
|
|
|
|
pure stats
|
|
|
|
|
-- as the transaction might retry several times, current time needs to
|
|
|
|
|
-- be read afterwards
|
|
|
|
|
now <- getPOSIXTime
|
|
|
|
|
-- evaluate stats rate and replace server stats
|
|
|
|
|
-- persistently store in a TVar so it can be retrieved later by the DHT
|
|
|
|
|
let timePassed = (now - previousTs) * fromIntegral (confSpeedupFactor $ serviceConf serv)
|
|
|
|
|
rateStats = evaluateStats timePassed summedStats
|
|
|
|
|
atomically $ writeTVar (loadStats serv) rateStats
|
|
|
|
|
-- and now what? write a log to file
|
|
|
|
|
-- format: total relayReceiveRates;total relayDeliveryRates;postFetchRate;postPublishRate; subscriberSum
|
|
|
|
|
-- later: current (reported) load, target load
|
|
|
|
|
subscriberSum <- sumSubscribers
|
|
|
|
|
TxtI.hPutStrLn (logFileHandle serv) $
|
|
|
|
|
format (fixed 9 % ";" % fixed 20 % ";" % fixed 20 % ";" % fixed 20 % ";" % fixed 20 % ";" % int )
|
|
|
|
|
(realToFrac now :: Double)
|
|
|
|
|
(sum . relayReceiveRates $ rateStats)
|
|
|
|
|
(sum . relayDeliveryRates $ rateStats)
|
|
|
|
|
(postPublishRate rateStats)
|
|
|
|
|
(postFetchRate rateStats)
|
|
|
|
|
subscriberSum
|
|
|
|
|
loop now
|
|
|
|
|
|
|
|
|
|
sumSubscribers = do
|
|
|
|
|
tagMap <- readTVarIO $ subscribers serv
|
|
|
|
|
foldM (\subscriberSum (subscriberMapSTM, _, _) -> do
|
|
|
|
|
subscriberMap <- readTVarIO subscriberMapSTM
|
|
|
|
|
pure $ subscriberSum + HMap.size subscriberMap
|
|
|
|
|
)
|
|
|
|
|
0 tagMap
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
-- | Evaluate the accumulated statistic events: Currently mostly calculates the event
|
|
|
|
|
-- rates by dividing through the collection time frame
|
|
|
|
|
evaluateStats :: POSIXTime -> RelayStats -> RelayStats
|
|
|
|
|
evaluateStats timeInterval summedStats =
|
|
|
|
|
-- first sum all event numbers, then divide through number of seconds passed to
|
|
|
|
|
-- get rate per second
|
|
|
|
|
RelayStats
|
|
|
|
|
{ relayReceiveRates = (/ intervalSeconds) <$> relayReceiveRates summedStats
|
|
|
|
|
, relayDeliveryRates = (/ intervalSeconds) <$> relayDeliveryRates summedStats
|
|
|
|
|
, postPublishRate = postPublishRate summedStats / intervalSeconds
|
|
|
|
|
, postFetchRate = postFetchRate summedStats / intervalSeconds
|
|
|
|
|
}
|
|
|
|
|
where
|
|
|
|
|
intervalSeconds = realToFrac timeInterval
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
emptyStats :: RelayStats
|
|
|
|
|
emptyStats = RelayStats
|
|
|
|
|
{ relayReceiveRates = emptyRMap
|
|
|
|
|
, relayDeliveryRates = emptyRMap
|
|
|
|
|
, postFetchRate = 0
|
|
|
|
|
, postPublishRate = 0
|
|
|
|
|
}
|
|
|
|
|