Skip to content

Commit

Permalink
fix potential deadlock in the global watcher callback
Browse files Browse the repository at this point in the history
  • Loading branch information
4eUeP committed May 9, 2024
1 parent 079a558 commit 0695309
Show file tree
Hide file tree
Showing 5 changed files with 63 additions and 12 deletions.
2 changes: 1 addition & 1 deletion .github/workflows/ci.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -12,7 +12,7 @@ jobs:
runs-on: ${{ matrix.os }}
strategy:
matrix:
ghc: ['8.10.7', '9.0.2', '9.2.8', '9.4.5']
ghc: ['8.10.7', '9.0.2', '9.2.8', '9.4.8']
cabal: ['3.8']
os: [ubuntu-latest, macOS-latest]

Expand Down
10 changes: 6 additions & 4 deletions src/ZooKeeper.hs
Original file line number Diff line number Diff line change
Expand Up @@ -76,8 +76,9 @@ zookeeperResInit
-- server. e.g. "127.0.0.1:3000,127.0.0.1:3001,127.0.0.1:3002"
-> Maybe T.WatcherFn
-- ^ the global watcher callback function. When notifications are
-- triggered this function will be invoked. FIXME: Calling any zoo operations
-- (e.g. zooGet) will cause an infinite block.
-- triggered this function will be invoked.
--
-- Note that each callback will be called in a different thread of execution.
-> CInt
-- ^ session expiration time in milliseconds
-> Maybe T.ClientID
Expand Down Expand Up @@ -700,8 +701,9 @@ zookeeperInit
-- server. e.g. "127.0.0.1:3000,127.0.0.1:3001,127.0.0.1:3002"
-> Maybe T.WatcherFn
-- ^ the global watcher callback function. When notifications are
-- triggered this function will be invoked. FIXME: Calling any zoo operations
-- (e.g. zooGet) will cause an infinite block.
-- triggered this function will be invoked.
--
-- Note that each callback will be called in a different thread of execution.
-> CInt
-- ^ session expiration time in milliseconds
-> Maybe T.ClientID
Expand Down
28 changes: 27 additions & 1 deletion src/ZooKeeper/Internal/FFI.hsc
Original file line number Diff line number Diff line change
Expand Up @@ -63,7 +63,33 @@ foreign import ccall "wrapper"
mkWatcherFnPtr :: WatcherFn -> IO (FunPtr CWatcherFn)
mkWatcherFnPtr fn = mkCWatcherFnPtr $ \zh ev st cpath _ctx -> do
path <- CBytes.fromCString cpath
fn zh (ZooEvent ev) (ZooState st) path
-- FIXME: better way
--
-- Here we fork a new thread to run the user's watcher function to avoid
-- blocking the C thread, potential deadlock.
--
-- Without forkIO, the following code will deadlock,
--
-- @
-- gloWatcher :: WatcherFn
-- gloWatcher zh event state path = do
-- print =<< zooGet zh "/node"
--
-- zookeeperResInit "127.0.0.1:2181" (Just gloWatcher) 5000 Nothing 0
-- ...
-- @
--
-- * All zookeeper completions are run by one completion c thread (or likely
-- in one thread).
-- * We are blocking on a MVar and waiting for the callback of zoo_aget
-- return.
-- * gloWatcher will be called by zookeeper library as a c function, which
-- means any blocking in haskell code will block the c thread.
--
-- So, zooGet is waiting for the result of zoo_aget, and blocking on an MVar,
-- which will block the completion c thread here. The result of zoo_aget is
-- returned by this completion c thread, so it will never be called.
void $ forkIO $ fn zh (ZooEvent ev) (ZooState st) path

foreign import ccall safe "zookeeper.h zookeeper_init"
zookeeper_init
Expand Down
30 changes: 26 additions & 4 deletions test/Spec.hs
Original file line number Diff line number Diff line change
Expand Up @@ -21,14 +21,18 @@ import ZooKeeper.Types
recvTimeout :: CInt
recvTimeout = 5000

testZkHost :: CB.CBytes
testZkHost = "127.0.0.1:2182"

client :: Resource ZHandle
client = zookeeperResInit "127.0.0.1:2182" Nothing recvTimeout Nothing 0
client = zookeeperResInit testZkHost Nothing recvTimeout Nothing 0

main :: IO ()
main = withResource client $ \zh -> do
hspec $ opSpec zh
hspec $ multiOpSpec zh
hspec $ propSpec zh
hspec $ miscSpec zh
hspec $ electionSpec1 zh
hspec $ electionSpec2 client
hspec $ lockSpec1 zh
Expand Down Expand Up @@ -91,7 +95,7 @@ opSpec zh = do
-- https://issues.apache.org/jira/browse/ZOOKEEPER-834
it "create children of ephemeral nodes should throw exception" $ do
void $ zooCreate zh "/x" Nothing zooOpenAclUnsafe ZooEphemeral
zooCreate zh "/x/1" Nothing zooOpenAclUnsafe ZooEphemeral `shouldThrow` noChildrenForEphemerals
zooCreate zh "/x/1" Nothing zooOpenAclUnsafe ZooEphemeral `shouldThrow` noChildrenForEphemeralsEx

it "get children of a leaf node should return []" $ do
void $ zooCreate zh "/y" Nothing zooOpenAclUnsafe ZooPersistent
Expand Down Expand Up @@ -186,6 +190,21 @@ electionSpec2 client_ = describe "ZooKeeper.zooElection (multi sessions)" $ do
takeMVar finished4
readMVar leader `shouldReturn` (2 :: Int)

miscSpec :: ZHandle -> Spec
miscSpec zh = describe "Misc" $ do
it "call zooGet in global watcher should not block" $ do
let nodeName = "/test-misc-node"
void $ zooCreate zh nodeName Nothing zooOpenAclUnsafe ZooEphemeral
void $ zooSet zh nodeName (Just "hello") Nothing

mvar <- newEmptyMVar
let gloWatcher zh1 event state path = do

Check warning on line 201 in test/Spec.hs

View workflow job for this annotation

GitHub Actions / ghc-8.10.7 cabal-3.8 on ubuntu-latest

Defined but not used: ‘event’

Check warning on line 201 in test/Spec.hs

View workflow job for this annotation

GitHub Actions / ghc-8.10.7 cabal-3.8 on ubuntu-latest

Defined but not used: ‘state’

Check warning on line 201 in test/Spec.hs

View workflow job for this annotation

GitHub Actions / ghc-8.10.7 cabal-3.8 on ubuntu-latest

Defined but not used: ‘path’

Check warning on line 201 in test/Spec.hs

View workflow job for this annotation

GitHub Actions / ghc-9.0.2 cabal-3.8 on ubuntu-latest

Defined but not used: ‘event’

Check warning on line 201 in test/Spec.hs

View workflow job for this annotation

GitHub Actions / ghc-9.0.2 cabal-3.8 on ubuntu-latest

Defined but not used: ‘state’

Check warning on line 201 in test/Spec.hs

View workflow job for this annotation

GitHub Actions / ghc-9.0.2 cabal-3.8 on ubuntu-latest

Defined but not used: ‘path’

Check warning on line 201 in test/Spec.hs

View workflow job for this annotation

GitHub Actions / ghc-9.2.8 cabal-3.8 on ubuntu-latest

Defined but not used: ‘event’

Check warning on line 201 in test/Spec.hs

View workflow job for this annotation

GitHub Actions / ghc-9.2.8 cabal-3.8 on ubuntu-latest

Defined but not used: ‘state’

Check warning on line 201 in test/Spec.hs

View workflow job for this annotation

GitHub Actions / ghc-9.2.8 cabal-3.8 on ubuntu-latest

Defined but not used: ‘path’

Check warning on line 201 in test/Spec.hs

View workflow job for this annotation

GitHub Actions / ghc-9.4.8 cabal-3.8 on ubuntu-latest

Defined but not used: ‘event’

Check warning on line 201 in test/Spec.hs

View workflow job for this annotation

GitHub Actions / ghc-9.4.8 cabal-3.8 on ubuntu-latest

Defined but not used: ‘state’

Check warning on line 201 in test/Spec.hs

View workflow job for this annotation

GitHub Actions / ghc-9.4.8 cabal-3.8 on ubuntu-latest

Defined but not used: ‘path’
r <- zooGet zh1 nodeName
void $ tryPutMVar mvar r
let client1 = zookeeperResInit testZkHost (Just gloWatcher) recvTimeout Nothing 0
withResource client1 $ \zh1 -> do

Check warning on line 205 in test/Spec.hs

View workflow job for this annotation

GitHub Actions / ghc-8.10.7 cabal-3.8 on ubuntu-latest

Defined but not used: ‘zh1’

Check warning on line 205 in test/Spec.hs

View workflow job for this annotation

GitHub Actions / ghc-9.0.2 cabal-3.8 on ubuntu-latest

Defined but not used: ‘zh1’

Check warning on line 205 in test/Spec.hs

View workflow job for this annotation

GitHub Actions / ghc-9.2.8 cabal-3.8 on ubuntu-latest

Defined but not used: ‘zh1’

Check warning on line 205 in test/Spec.hs

View workflow job for this annotation

GitHub Actions / ghc-9.4.8 cabal-3.8 on ubuntu-latest

Defined but not used: ‘zh1’
(dataCompletionValue <$> takeMVar mvar) `shouldReturn` Just "hello"

lockSpec1 :: ZHandle -> Spec
lockSpec1 zh = describe "ZooKeeper.zooLock (single session)" $ do
it "Test single client situation" $ do
Expand Down Expand Up @@ -225,5 +244,8 @@ lockSpec2 client_ = describe "ZooKeeper.zooLock (multi sessions)" $ do

-------------------------------------------------------------------------------

noChildrenForEphemerals :: Selector ZNOCHILDRENFOREPHEMERALS
noChildrenForEphemerals = const True
noChildrenForEphemeralsEx :: Selector ZNOCHILDRENFOREPHEMERALS
noChildrenForEphemeralsEx = const True

nodeExistsEx :: Selector ZNODEEXISTS
nodeExistsEx = const True
5 changes: 3 additions & 2 deletions zoovisitor.cabal
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
cabal-version: 2.2
name: zoovisitor
version: 0.2.6.1
version: 0.2.7.0
synopsis:
A haskell binding to Apache Zookeeper C library(mt) using Haskell Z project.

Expand All @@ -12,7 +12,7 @@ license-file: LICENSE
copyright: Copyright (c)
author: mu
maintainer: [email protected]
tested-with: GHC ==8.10.7 || ==9.0.2 || ==9.2.8 || ==9.4.5
tested-with: GHC ==8.10.7 || ==9.0.2 || ==9.2.8 || ==9.4.8
category: Database
homepage: https://github.com/ZHaskell/zoovisitor
bug-reports: https://github.com/ZHaskell/zoovisitor/issues
Expand Down Expand Up @@ -72,6 +72,7 @@ library
includes: hs_zk.h
c-sources: cbits/hs_zk.c
include-dirs: include /usr/local/include
c-options: -DTHREADED
build-tool-depends: hsc2hs:hsc2hs
extra-libraries: zookeeper_mt

Expand Down

0 comments on commit 0695309

Please sign in to comment.