hbs2/hbs2-tests/test/NCQ3.hs

{-# Language AllowAmbiguousTypes #-}
{-# Language RecordWildCards #-}
{-# Language MultiWayIf #-}
module NCQ3 where

import HBS2.Prelude.Plated
import HBS2.OrDie
import HBS2.Hash
import HBS2.Data.Types.Refs
import HBS2.Misc.PrettyStuff
import HBS2.Clock
import HBS2.Merkle
import HBS2.Polling
import HBS2.Peer.Proto.AnyRef

import HBS2.Storage
import HBS2.Storage.Simple
import HBS2.Storage.Operations.ByteString
import HBS2.Storage.NCQ3
import HBS2.Storage.NCQ3.Internal.Files
import HBS2.Storage.NCQ3.Internal.Index
import HBS2.Storage.NCQ3.Internal.Fossil
import HBS2.Storage.NCQ3.Internal.State
import HBS2.Storage.NCQ3.Internal.Sweep
import HBS2.Storage.NCQ3.Internal

import HBS2.System.Logger.Simple.ANSI

import HBS2.Data.Log.Structured.SD
import HBS2.Data.Log.Structured.NCQ

import HBS2.CLI.Run.Internal.Merkle

import Data.Config.Suckless.Syntax
import Data.Config.Suckless.Script as SC
import Data.Config.Suckless.System

import NCQTestCommon
import NCQ3.Endurance
import NCQ3.EnduranceInProc

import Data.Generics.Labels
import Lens.Micro.Platform
import Network.ByteOrder qualified as N
import System.TimeIt
import Data.Fixed
import Data.HashSet qualified as HS
import Data.HashPSQ qualified as HPSQ
import Data.HashMap.Strict qualified as HM
import Test.Tasty.HUnit
import Data.ByteString qualified as BS
import Data.ByteString.Lazy qualified as LBS
import Data.Ord
import Data.Set qualified as Set
import System.Random.MWC as MWC
import Control.Concurrent.STM qualified as STM
import Data.List qualified as List
import Control.Monad.Trans.Cont
import Control.Monad.Except
import System.IO.Temp qualified as Temp
import System.Environment (getExecutablePath)
import System.Process.Typed as PT
import System.IO qualified as IO
import System.Posix.IO qualified as Posix
import GHC.IO.Handle qualified as GHC
import System.Random.Stateful
import UnliftIO
import UnliftIO.IO.File
import UnliftIO.IO as IO
import UnliftIO.Directory

import Streaming.Prelude qualified as S

{-HLINT ignore "Functor law"-}


-- | Fail the current HUnit test case, using the rendered document as the
-- failure message.
--
-- The annotation type @a@ is left unconstrained: rendering a 'Doc' with
-- 'show' does not require @Show a@, and demanding it only creates an
-- ambiguous constraint at call sites that pass a string literal.
failure :: forall a m . MonadIO m => Doc a -> m ()
failure = liftIO . assertFailure . show

-- | Script dictionary with the NCQ3 storage test commands.
--
-- Every @entry $ bindMatch "test:ncq3:..."@ statement below registers one
-- command. Commands that use 'runTest' receive a 'TestEnv' whose
-- @testEnvDir@ serves as the storage directory.
ncq3Tests :: forall m . MonadUnliftIO m => MakeDictM C m ()
ncq3Tests = do
  -- test:ncq3:start-stop [N]
  -- Opens a storage and writes N (default 1000) random blocks whose sizes
  -- are drawn from 1024 .. 256*1024.
  entry $ bindMatch "test:ncq3:start-stop" $ nil_ $ \e -> do
      let (_, args) = splitOpts [] e
      let num = headDef 1000 [ fromIntegral n | LitIntVal n <- args ]
      g <- liftIO MWC.createSystemRandom
      runTest $ \TestEnv{..} -> do
        ncqWithStorage testEnvDir $ \sto -> do
           -- log the real block count rather than a hard-coded "1000"
           notice $ "start/stop ncq3 storage / write" <+> pretty num <+> "blocks"
           replicateM_ num do
             n <- liftIO $ uniformRM (1024, 256*1024) g
             bs <- liftIO $ genRandomBS g n
             ncqPutBS sto (Just B) Nothing bs

  -- test:ncq3:write-reopen [N]
  -- Writes N (default 1000) random blocks, appends random bytes to the data
  -- file that has the greatest second component among the state's @PData@
  -- facts, and then opens the storage once more.
  entry $ bindMatch "test:ncq3:write-reopen" $ nil_ $ \syn -> do
      let (_, argz) = splitOpts [] syn
      let total = headDef 1000 [ fromIntegral x | LitIntVal x <- argz ]
      rng <- liftIO MWC.createSystemRandom
      runTest $ \TestEnv{..} -> do

        -- first session: fill the storage and choose the file to damage
        victim <- ncqWithStorage testEnvDir $ \sto -> do
           notice $ "write" <+> pretty total <+> "blocks"
           replicateM_ total do
             len   <- liftIO $ uniformRM (1024, 256*1024) rng
             block <- liftIO $ genRandomBS rng len
             ncqPutBS sto (Just B) Nothing block

           facts <- ncqStateFacts <$> readTVarIO (ncqState sto)

           let dataFiles = [ (ncqGetFileName sto (toFileName k), s)
                           | P (PData k s) <- Set.toList facts
                           ]

           pure (maximumByMay (comparing snd) dataFiles)

        -- append random bytes to that file, if there is one
        for_ victim $ \(dataFile, _) -> do
           junkLen <- liftIO $ uniformRM (1, 16*1024) rng
           junk    <- liftIO $ genRandomBS rng junkLen
           notice $ "CORRUPTING PENDING FILE" <+> pretty junkLen <+> pretty dataFile
           liftIO (BS.appendFile dataFile junk)

        notice "reopen"
        ncqWithStorage testEnvDir $ \_ -> do
          pause @'Seconds 2
          notice "done"


  -- test:ncq3:write:simple [N]
  -- Writes N (default 1000) random blocks, checking after every write that
  -- the new hash can be located; then reopens the storage and verifies that
  -- every written hash is still found.
  entry $ bindMatch "test:ncq3:write:simple" $ nil_ $ \syn -> do
      let (_, argz) = splitOpts [] syn
      let total = headDef 1000 [ fromIntegral x | LitIntVal x <- argz ]
      rng <- liftIO MWC.createSystemRandom

      -- counters: written / found after reopen / missing after reopen
      written <- newTVarIO 0
      hits    <- newTVarIO 0
      misses  <- newTVarIO 0

      runTest $ \TestEnv{..} -> do
        pendingQ <- newTQueueIO

        -- first session: write and look up immediately
        ncqWithStorage testEnvDir $ \sto -> do
           notice $ "write/lookup" <+> pretty total
           replicateM_ total do
             len     <- liftIO $ uniformRM (1024, 256*1024) rng
             block   <- liftIO $ genRandomBS rng len
             href    <- ncqPutBS sto (Just B) Nothing block
             present <- isJust <$> ncqLocate sto href
             liftIO $ assertBool (show $ "found" <+> pretty href) present
             atomically $ writeTQueue pendingQ href >> modifyTVar written succ

        -- second session: each queued hash is looked up after the reopen
        ncqWithStorage testEnvDir $ \sto -> do
          notice $ "reopen/lookup" <+> pretty total
          queued <- atomically $ STM.flushTQueue pendingQ

          for_ queued $ \href -> do
             present <- isJust <$> ncqLocate sto href
             atomically $
               if present
                 then modifyTVar hits succ
                 else modifyTVar misses succ

        nWritten <- readTVarIO written
        nHits    <- readTVarIO hits
        nMisses  <- readTVarIO misses

        notice $ "done" <+> pretty nWritten <+> pretty nHits <+> pretty nMisses

        liftIO $ assertBool (show $ "all-found" <+> pretty nWritten)
                            (nHits == nWritten && nMisses == 0)

  -- test:ncq3:seek DIR HASH
  -- Walks every file in DIR whose base name starts with "i-", maps it
  -- read-only and logs each slot whose key is not 'emptyKey', together with
  -- the unpacked index entry.
  -- NOTE(review): the HASH argument is matched but never used below, so the
  -- command dumps all entries instead of seeking one key — confirm whether
  -- filtering by HASH was intended.
  entry $ bindMatch "test:ncq3:seek" $ nil_ $ \case
    [ StringLike p, HashLike h ] -> do

        files <- dirFiles p  <&> filter (List.isPrefixOf "i-" .takeBaseName)

        for_ files $ \f -> do
          -- a failed mmap aborts the command with a user error
          (bs,nw) <- nwayHashMMapReadOnly f >>= orThrowUser ("Can't mmap" <+> pretty f)

          nwayHashScanAll nw bs $ \_ k v -> do
            unless (coerce k == emptyKey) do
              let e = unpackIndexEntry v
              notice $ "found:" <+> pretty (coerce @_ @HashRef k) <+> viaShow e

    -- any other argument shape is rejected as a bad form
    e -> throwIO $ BadFormException @C (mkList e)


  -- test:ncq3:merge [N]
  -- Writes N (default 1000) random blocks, runs 'ncqIndexCompactStep' until
  -- it reports nothing more to do, and then checks that every written hash
  -- can still be located.
  entry $ bindMatch "test:ncq3:merge" $ nil_ \syn -> do

      let (_, argz) = splitOpts [] syn
      let total = headDef 1000 [ fromIntegral x | LitIntVal x <- argz ]
      rng <- liftIO MWC.createSystemRandom

      runTest $ \TestEnv{..} ->
        ncqWithStorage testEnvDir $ \sto@NCQStorage{..} -> do
           notice $ "write" <+> pretty total
           written <- newTVarIO ( mempty :: HashSet HashRef )
           replicateM_ total do
             len   <- liftIO $ uniformRM (1024, 64*1024) rng
             block <- liftIO $ genRandomBS rng len
             href  <- ncqPutBS sto (Just B) Nothing block
             atomically $ modifyTVar written (HS.insert href)

           -- current index files, taken from the storage state
           indexFiles <- fmap (IndexFile . snd) . ncqStateIndex <$> readTVarIO ncqState

           minPair <- ncqFindMinPairOf sto indexFiles
           notice $ pretty minPair

           -- keep compacting while a step reports that it did something
           let compactAll = do
                 notice "compacting once"
                 again <- ncqIndexCompactStep sto
                 when again compactAll
           compactAll

           finalState <- readTVarIO ncqState

           notice $ "new state" <> line <> pretty finalState

           hashes <- readTVarIO written

           for_ hashes $ \href -> do
              present <- isJust <$> ncqLocate sto href
              liftIO $ assertBool (show $ "found" <+> pretty href) present


  -- test:ncq3:sweep [N]
  -- Writes N (default 1000) random blocks while two background threads run:
  -- a reporter and a prober that keeps looking up random written hashes.
  -- After the writes it waits 180 seconds and then asserts that every
  -- written hash can still be located.
  entry $ bindMatch "test:ncq3:sweep" $ nil_ \e -> do

      t0 <- getTimeCoarse

      let (opts,args) = splitOpts [] e
      let num = headDef 1000 [ fromIntegral n | LitIntVal n <- args ]
      g <- liftIO MWC.createSystemRandom

      runTest $ \TestEnv{..} -> do
        ncqWithStorage testEnvDir $ \sto@NCQStorage{..} -> flip runContT pure do

           -- hst: hashes written so far; lostt: failed lookups; req: lookups made
           hst <- newTVarIO ( mempty :: HashSet HashRef )
           lostt <- newTVarIO 0
           req   <- newTVarIO 0

           -- reporter: every 20 seconds logs elapsed time, the size of
           -- ncqStateUse, the lookup count and the miss count (red if non-zero)
           ContT $ withAsync $ forever do
            pause @'Seconds 20
            t <- getTimeCoarse <&> sec2 . (*1e-9) . realToFrac . toNanoSecs . (+ (-t0))
            l <- readTVarIO lostt
            r <- readTVarIO req
            pp <- readTVarIO ncqStateUse <&> HM.size
            let c = if l > 0 then red else id
            debug $ "Elapsed" <+> pretty t <+> pretty pp <+> pretty r <+> c (pretty l)

           -- prober: after a random pause of up to 0.75 s, looks up one random
           -- hash from the written set and counts misses.
           -- NOTE(review): `g` is also used by the writer loop below; confirm
           -- the generator may be shared between threads.
           ContT $ withAsync $ forever do
            p <- liftIO $ uniformRM (0, 0.75) g
            pause @'Seconds (realToFrac p)
            hh <- readTVarIO hst

            when (HS.size hh > 0) do

              i <- liftIO $ uniformRM (0, HS.size hh - 1) g
              let hi = HS.toList hh !! i
              found <- ncqLocate sto hi <&> isJust
              atomically $ modifyTVar req succ

              unless found do
                err $ red "NOT FOUND" <+> pretty hi
                atomically $ modifyTVar lostt succ

           notice $ "write" <+> pretty num
           replicateM_ num do
             n <- liftIO $ uniformRM (1024, 64*1024) g
             bs <- liftIO $ genRandomBS g n
             h <- lift  $ ncqPutBS sto (Just B) Nothing bs
             atomically $ modifyTVar hst (HS.insert h)

           -- fixed wait before the final check
           -- (presumably to let background sweep/compaction run — TODO confirm)
           pause @'Seconds 180

           notice "check after compaction"

           h1 <- readTVarIO hst

           -- NOTE(review): only this final pass asserts; misses counted in
           -- `lostt` by the prober are logged but never asserted on.
           for_ h1 $ \h -> lift do
              found <- ncqLocate sto h <&> isJust
              liftIO $ assertBool (show $ "found" <+> pretty h) found


  -- test:ncq3:merge:fossil [N]
  -- Writes N (default 1000) random blocks, runs one 'ncqFossilMergeStep',
  -- waits 180 seconds and then checks that every written hash is found.
  entry $ bindMatch "test:ncq3:merge:fossil" $ nil_ \syn -> do

      let (_, argz) = splitOpts [] syn
      let total = headDef 1000 [ fromIntegral x | LitIntVal x <- argz ]
      rng <- liftIO MWC.createSystemRandom

      runTest $ \TestEnv{..} ->
        ncqWithStorage testEnvDir $ \sto@NCQStorage{..} -> flip runContT pure do

           written <- newTVarIO ( mempty :: HashSet HashRef )

           notice $ "write" <+> pretty total
           replicateM_ total do
             len   <- liftIO $ uniformRM (1024, 64*1024) rng
             block <- liftIO $ genRandomBS rng len
             href  <- lift $ ncqPutBS sto (Just B) Nothing block
             atomically $ modifyTVar written (HS.insert href)

           -- the step's result is not needed here
           _ <- lift (ncqFossilMergeStep sto)

           notice "merge done"

           pause @'Seconds 180

           notice "check after compaction"

           hashes <- readTVarIO written

           for_ hashes $ \href -> lift do
              present <- isJust <$> ncqLocate sto href
              liftIO $ assertBool (show $ "found" <+> pretty href) present

  -- test:ncq3:long-write [SECONDS] [PATH]
  -- Writes random blocks into a storage for SECONDS (default 10) and appends
  -- "<hash> <size>" to "written.log" after every successful put.
  -- `test:ncq3:crash-test1` starts this command as a child process.
  entry $ bindMatch "test:ncq3:long-write" $ nil_ $ \e -> lift do
    g <- liftIO MWC.createSystemRandom
    let (opts,args) = splitOpts [] e

    let seconds = headDef 10 [ t0 | LitScientificVal t0 <- args ]

    -- the storage path is taken from the arguments after the first one
    let path' = headMay [ p | StringLike p  <- drop 1 $ args ]

    -- without a path, a fresh temp directory under "." is used
    path <- case path' of
              Just p -> pure p
              Nothing -> liftIO $ Temp.createTempDirectory "." "ncq-long-write-test"


    ncqWithStorage path $ \sto -> do

      let writtenLog = ncqGetFileName sto "written.log"
      touch writtenLog

      -- the timer branch stops the storage after `seconds`; the other branch
      -- writes forever and logs each hash only after ncqPutBS has returned
      race (pause @'Seconds (realToFrac seconds) >> ncqStorageStop sto) $ forever do
        n <- liftIO  $ uniformRM (1, 256*1024) g
        s <- liftIO $ genRandomBS g n
        h <- ncqPutBS sto (Just B) Nothing s
        liftIO $ appendFile writtenLog (show (pretty h <+> pretty n <> line))
        none


  -- test:ncq3:crash-test1 [SECONDS]
  -- Starts this executable as a child process running `test:ncq3:long-write`
  -- in a random sub-directory of the test dir, kills it with `kill -9` after
  -- a random delay, reopens the storage and compares its contents with the
  -- child's "written.log".
  entry $ bindMatch "test:ncq3:crash-test1" $ nil_ \e -> runTest \TestEnv{..} -> do
    g <- liftIO MWC.createSystemRandom
    let (opts,args) = splitOpts [] e

    -- s: duration as a number; seconds: the same value as a syntax literal
    -- (rendered onto the child's command line); both default to 5
    let (s,seconds) = headDef (5.00,mkDouble 5) [ (realToFrac t0,s) | s@(LitScientificVal t0) <- args ]

    let path0 = testEnvDir

    self <- liftIO getExecutablePath

    flip runContT pure do

      -- random Word32 used as the sub-directory name
      p <- liftIO $ uniformM @Word32 g

      let path = path0 </> show p

      -- from here on `p` is the child process handle (shadows the number above)
      p <- ContT $ withProcessWait (proc self ["debug off"
                                              , "and"
                                              , "test:ncq3:long-write", show (pretty seconds), path
                                              ])

      pid <- liftIO (PT.getPid p) `orDie` "oopsie!"

      -- kill delay drawn from 0.25 .. s + 0.10, so it may exceed the child's
      -- own run time
      delta <- liftIO $ uniformRM (0.25, s + 0.10) g

      notice $ "Run" <+> "test:ncq3:long-write"
              <+> green "pid" <+> viaShow pid
              <+> pretty testEnvDir
              <+> pretty (sec2 s)

      pause @'Seconds (realToFrac delta)

      void $ runProcess (proc "kill" ["-9", show pid])

      notice $ "Killed" <+> viaShow pid <+> pretty testEnvDir <+> "at" <+> pretty (sec2 delta)

      pause @'Seconds 2

      -- reopen the child's storage and check every logged hash
      lift $ ncqWithStorage path $ \sto@NCQStorage{..} -> do
        let log = ncqGetFileName sto "written.log"
        hashes <- liftIO (readFile log) <&> fmap words . lines

        -- counts and byte totals of entries that were found intact vs. not
        found       <- newTVarIO 0
        foundBytes  <- newTVarIO 0
        missedN     <- newTVarIO 0
        missedBytes <- newTVarIO 0

        -- NOTE(review): a log line that is not exactly "<hash> <size>" hits
        -- `error "invalid record"` below, and `read` is partial — confirm the
        -- child can never leave a truncated last line behind.
        for_ hashes $ \case
          [hs, slen] -> do

            let h = fromString hs
            let s = read slen :: Int

            what <- ncqLocate sto h >>= mapM (ncqGetEntryBS sto) <&> join

            case what of
              Just bs  -> do

                -- B entries count as ok only when the payload hashes back to
                -- the logged hash; entries that fail to unwrap are not ok;
                -- any other section type is accepted as is
                ok <- case ncqEntryUnwrap bs of
                           (_, Left{}) -> pure False

                           (k, Right (B, bss)) -> do
                             let good = HashRef (hashObject @HbSync bss) == h
                             -- debug $ "WTF?" <+> pretty (coerce @_ @HashRef k)
                             --                 <+> pretty good
                             --                 <+> pretty s
                             --                 <+> pretty (BS.length bss)
                             pure good

                           (_,Right (_, s)) -> pure True

                if ok then do

                  atomically do
                    modifyTVar found succ
                    modifyTVar foundBytes (+s)
                else do
                  atomically do
                    modifyTVar missedN succ
                    modifyTVar missedBytes (+s)
                  -- err $ red "Entry corrupted!"

              Nothing -> do
                atomically do
                  modifyTVar missedN succ
                  modifyTVar missedBytes (+s)


          _ -> error "invalid record"

        f  <- readTVarIO found
        fb <- readTVarIO foundBytes
        mb <- readTVarIO missedBytes
        mn <- readTVarIO missedN

        -- "OK" when the lost byte total does not exceed the storage's ncqFsync
        -- value. NOTE(review): the verdict is only logged, never asserted, so
        -- a "FAIL" here does not fail the test — confirm this is intended.
        let okay = if mb <= ncqFsync then green "OK" else red "FAIL"

        notice $ okay <+> "(found/lost)"
              <+> pretty f <+> pretty fb <+>
              "/"
              <+> pretty mn <+> pretty mb

  -- test:ncq3:concurrent1 THREADS BLOCKS
  -- Runs 'testNCQ3Concurrent1'; both integer arguments are mandatory.
  entry $ bindMatch "test:ncq3:concurrent1" $ nil_ $ \case
    [ LitIntVal threads, LitIntVal blocks ] ->
      runTest (testNCQ3Concurrent1 False (fromIntegral threads) (fromIntegral blocks))
    other -> throwIO (BadFormException @C (mkList other))

  -- test:ncq3:lookup1 ...
  -- Passes the raw argument list on to 'testNCQ3Lookup1'.
  entry $ bindMatch "test:ncq3:lookup1" $ nil_ $ \syn ->
      runTest $ testNCQ3Lookup1 syn


  -- test:ncq3:del1 [N]
  -- Writes N (default 10000) blocks, deleting each one right after the write,
  -- and checks that each hash resolves to a tomb: immediately, again after
  -- all writes, and once more after a full index compaction and reopen.
  entry $ bindMatch "test:ncq3:del1" $ nil_ $ \syn -> do

    runTest $ \TestEnv{..} -> do
      g <- liftIO MWC.createSystemRandom
      let dir = testEnvDir

      let (opts, argz) = splitOpts [("-m",0)] syn
      let n = headDef 10000 [ fromIntegral x | LitIntVal x <- argz ]

      -- NOTE(review): `merge` is parsed from the "-m" option but not used below
      let merge = or [ True | ListVal [StringLike "-m"] <- opts ]

      thashes <- newTVarIO mempty

      ncqWithStorage dir $ \sto -> do

        notice $ "write+immediate delete" <+> pretty n <+> "records"

        hashes <- replicateM n do

          h <- ncqPutBS sto (Just B) Nothing =<< liftIO (genRandomBS g (64*1024))
          ncqDelEntry sto h

          -- the deleted key must still be locatable, as a tomb
          t <- (ncqLocate sto h <&> fmap ncqIsTomb)
                 >>= orThrowUser ("missed" <+> pretty h)

          liftIO $ assertBool (show $ "tomb/1" <+> pretty h) t

          pure h

        atomically $ writeTVar thashes (HS.fromList hashes)

        -- second pass over all hashes; entries whose size differs from
        -- ncqTombEntrySize are logged before the tomb assertion
        flip runContT pure $ callCC \exit -> do

          for_ hashes $ \h -> do
            loc <- lift (ncqLocate sto h)
                     >>= orThrowUser ("missed" <+> pretty h)

            unless (ncqEntrySize loc == ncqTombEntrySize) do
              notice $ pretty h <+> pretty (ncqEntrySize loc) <+> pretty ncqTombEntrySize

            liftIO $ assertBool (show $ "tomb/1" <+> pretty h) (ncqIsTomb loc)

        ncqIndexCompactFull sto

      -- after reopening, a hash may be absent; if present it must be a tomb
      ncqWithStorage dir $ \sto -> do
        -- notice "check deleted"
        hashes  <- readTVarIO  thashes

        for_ hashes $ \h -> do

          ncqLocate sto h >>= \case
            Nothing -> notice $ "not-found" <+> pretty h
            Just loc -> do
             liftIO $ assertBool (show $ "tomb/1" <+> pretty h) (ncqIsTomb loc)


  -- test:ncq3:del2 [N] [P]
  -- Writes N (default 50000) blocks from 16 concurrent workers, deleting each
  -- one with probability P (default 0.55). After a reopen it waits until the
  -- storage tracks at most 3 live keys (or 600 seconds pass) and asserts that
  -- every deleted hash resolves to a tomb.
  entry $ bindMatch "test:ncq3:del2" $ nil_ $ \syn -> do

    runTest $ \TestEnv{..} -> do
      g <- liftIO MWC.createSystemRandom
      let dir = testEnvDir

      let (_, argz) = splitOpts [] syn
      let n = headDef 50000 [ fromIntegral x | LitIntVal x <- argz ]
      let p0 = headDef 0.55  [ realToFrac x   | LitScientificVal x <- drop 1 argz ]

      -- set of hashes that were deleted
      thashes <- newTVarIO mempty

      ncqWithStorage dir $ \sto -> do

        sizes <- replicateM n $ liftIO $ uniformRM (32*1024, 256*1024) g

        notice $ "write" <+> pretty n <+> "blocks"
        -- NOTE(review): `g` is used from all 16 workers at once; confirm the
        -- generator may be shared between threads.
        pooledForConcurrentlyN_ 16 sizes $ \s -> do
          h <- ncqPutBS sto (Just B) Nothing =<< liftIO (genRandomBS g s)

          p1 <- liftIO $ uniformRM @Double (0, 1) g

          when (p1 < p0) do
            ncqDelEntry sto h
            atomically $ modifyTVar thashes (HS.insert h)

        deleted <- readTVarIO thashes

        tombs <- for (HS.toList deleted) $ \d -> do
                   ncqLocate sto d <&>  maybe False ncqIsTomb

        -- number of deleted hashes that currently resolve to a tomb
        let tnum = sum [ 1 | x <- tombs, x ]

        notice $ "should be deleted" <+> pretty (HS.size deleted) <+> "/" <+> pretty tnum <+> "of" <+> pretty n

      ncqWithStorage dir $ \sto@NCQStorage{..} -> do

        notice "wait for compaction"

        flip runContT pure do

          -- background reporter: every 20 seconds logs the number of files in
          -- the work dir and their total size divided by `megabytes`
          void $ ContT $ withAsync $ forever do
            fs <- dirFiles (ncqGetWorkDir sto)
            let n = List.length fs
            ss <- sum <$> mapM getFileSize fs
            notice $ "dir size" <+> pretty n <+> pretty (ss `div` megabytes)
            pause @'Seconds 20

          notice "wait index to compact or 600 sec"

          -- blocks in STM until at most 3 live keys remain, with a 600 s cap;
          -- the result of the race is not inspected
          what <- liftIO $ race (pause @'Seconds 600) do
            atomically do
              ntrack <- ncqLiveKeysSTM sto
              unless (List.length ntrack <= 3) STM.retry

          liftIO do
            deleted <- readTVarIO thashes
            for (HS.toList deleted) $ \d -> do
              tomb <- ncqLocate sto d <&>  maybe False ncqIsTomb
              assertBool (show $ "TOMB" <+> pretty d) tomb

          none

  -- test:ncq3:lock
  -- Opens the same storage directory twice, the second time while the first
  -- session is still open. `w` records progress: 1 after the first open,
  -- 2 only if the code after the second open is reached. The test asserts
  -- that `w` stayed at 1, i.e. the second open did not get that far.
  entry $ bindMatch "test:ncq3:lock" $ nil_ $ \e -> runTest $ \TestEnv{..} -> do

    w <- newTVarIO 0

    -- any exception raised inside is captured in `r` and only logged below
    r <- try @_ @SomeException do
            flip runContT pure do

              notice $ "run 1st storage" <+> pretty testEnvDir
              sto1 <- ContT $ ncqWithStorage testEnvDir

              atomically $ writeTVar w 1

              pause @'Seconds 1

              notice $ "run 2nd storage" <+> pretty testEnvDir
              -- rebinds `sto1`; neither storage handle is used afterwards
              sto1 <- ContT $ ncqWithStorage testEnvDir

              pause @'Seconds 1

              notice "so what?"

              atomically $ writeTVar w 2

              pure 42

    wx <- readTVarIO w

    liftIO $ assertBool "first run, second fail" (wx == 1)

    notice $ "second must fail" <+> pretty wx <+> "=>" <+> viaShow r


  -- test:ncq3:merkle:file FILE
  -- Reads FILE, splits it into chunks with @readChunkedBS _ (256*1024)@ and
  -- stores all chunks concurrently with 'ncqTossBlock'.
  entry $ bindMatch "test:ncq3:merkle:file" $ nil_ $ \syn -> runTest $ \TestEnv{..} -> do

    let (_, argz) = splitOpts [] syn

    path <- orThrowUser "no file given" (headMay [ x | StringLike x <- argz ])

    ncqWithStorage testEnvDir $ \ncq -> do

      contents <- liftIO (LBS.readFile path)

      chunks <- S.toList_ (readChunkedBS contents (256*1024))

      -- a chunk that cannot be saved aborts the command with a user error
      _ <- forConcurrently chunks $ \chunk ->
             ncqTossBlock ncq chunk >>= orThrowUser "can't save"
             -- ncqPutBlock ncq chunk
             -- ncqPutBS ncq (Just B) Nothing (LBS.toStrict chunk

      none

      -- -- FIXME: handle-hardcode
      -- let pt = toPTree (MaxSize 1024) (MaxNum 256) hashes -- FIXME: settings

      -- m <- makeMerkle 0 pt $ \(_,_,bss) -> liftIO do
      --        void $ ncqPutBlock ncq bss >>= orThrowUser "can't save"

      -- notice $ pretty m

  -- test:ncq3:merkle [BYTES]
  -- Generates a random file of BYTES bytes (default 1 * gigabytes) inside the
  -- storage work dir, stores it with 'createTreeWithMetadata', then reads the
  -- tree back three times and asserts that the hash of the contents equals
  -- the hash of the file.
  entry $ bindMatch "test:ncq3:merkle" $ nil_ $ \e -> runTest $ \TestEnv{..} -> do

    let (_, args) = splitOpts [] e
    let n  = headDef (1 * gigabytes) [ fromIntegral x | LitIntVal x <- args ]

    g <- liftIO MWC.createSystemRandom
    ncqWithStorage testEnvDir $ \ncq -> do

      fn <- liftIO $ Temp.emptyTempFile (ncqGetWorkDir ncq) "wtf"

      debug $ "generate file" <+> pretty n <+> pretty fn

      -- fill the file in pieces of at most 1 * megabytes
      flip fix n $ \loop rest -> when (rest > 0) do
          let size = min (1 * megabytes) rest
          block <- liftIO $ genRandomBS g size
          liftIO (BS.appendFile fn block)
          loop (rest - size)


      debug $ "done file" <+> pretty fn

      debug $ "make merkle from" <+> pretty fn

      let sto = AnyStorage ncq

      lbs <- liftIO $ LBS.readFile fn

      t0 <- getTimeCoarse

      tree <- createTreeWithMetadata sto Nothing mempty lbs
                >>= orThrowUser "can't create tree"

      t2 <- getTimeCoarse

      let s = sec2 (1e-9 * realToFrac (toNanoSecs (t2 - t0)))

      notice $ "merkle hash" <+> pretty s <+> pretty tree

      -- reference hash, computed over the whole file
      h0 <- liftIO (LBS.readFile fn) <&> HashRef . hashObject @HbSync

      debug $ pretty h0

      -- NOTE(review): this message announces a full compaction, but the call
      -- below is commented out — confirm which one is intended.
      notice "full compact index first"

      -- ncqIndexCompactFull ncq

      replicateM_ 3 do

        t1 <- getTimeCoarse
        lbs1 <- runExceptT (getTreeContents sto tree)
                  >>= orThrowPassIO
                  <&> HashRef . hashObject @HbSync

        debug $ pretty lbs1

        t3 <- getTimeCoarse

        -- elapsed time goes through toNanoSecs, the same way as for `s` above
        let dt = sec2 (1e-9 * realToFrac (toNanoSecs (t3 - t1)))

        notice $ "found" <+> pretty dt <+> pretty lbs1 <+> pretty h0

        liftIO $ assertBool (show $ "hash eq" <+> pretty h0 <+> pretty lbs1) (h0 == lbs1)

  -- test:ncq3:refs:shape
  -- Stores one random ref -> value pair, reads it back through the API and
  -- then inspects the raw entry: it must be an R section whose payload is the
  -- value bytes followed by the ref bytes (ncqKeyLen each).
  entry $ bindMatch "test:ncq3:refs:shape" $ nil_ $ \_ -> runTest $ \TestEnv{..} ->
    ncqWithStorage testEnvDir $ \sto -> do
      -- random ref and value, ncqKeyLen bytes each
      rng <- liftIO MWC.createSystemRandom
      ref <- fmap (HashRef . coerce) (liftIO (genRandomBS rng ncqKeyLen))
      val <- fmap (HashRef . coerce) (liftIO (genRandomBS rng ncqKeyLen))

      -- round trip through the ref API
      ncqStorageSetRef sto ref val
      stored <- ncqStorageGetRef sto ref
      unless (stored == Just val) $
        failure "refs:shape: getRef mismatch (expected Just val)"

      -- fetch the raw entry stored under the ref's key
      loc <- orThrowUser "refs:shape: locate failed"
               =<< ncqLocate sto (ncqRefHash sto ref)
      entryBytes <- orThrowUser "refs:shape: ncqGetEntryBS failed"
                      =<< ncqGetEntryBS sto loc

      payload <- case ncqEntryUnwrap entryBytes of
                   (_, Right (R, p)) -> pure p
                   _                 -> error "refs:shape: unexpected section type (not R)"

      unless (BS.length payload == 2 * ncqKeyLen) $
        failure "refs:shape: payload length != 64"

      let (valPart, refPart) = BS.splitAt ncqKeyLen payload
      unless (valPart == coerce val) $
        failure "refs:shape: first 32B != VAL_HASH"
      unless (refPart == coerce ref) $
        failure "refs:shape: last 32B != RAW_REF_KEY"


  -- test:ncq3:storage:tails
  -- Writes 100 small random blocks (1..1024 size range) through the generic
  -- storage API, waits 30 seconds, reopens the storage and checks that
  -- 'hasBlock' finds every one of them.
  entry $ bindMatch "test:ncq3:storage:tails" $ nil_ $ \_ -> runTest $ \TestEnv{..} -> do
    rng     <- liftIO MWC.createSystemRandom
    written <- newTVarIO (mempty :: HashSet HashRef)

    -- first session: write the blocks and remember their hashes
    ncqWithStorage testEnvDir $ \sto -> do

        replicateM_ 100 do
          len   <- liftIO $ uniformRM (1,1024) rng
          block <- liftIO $ genRandomBS rng len
          ha    <- putBlock (AnyStorage sto) (LBS.fromStrict block) `orDie` "not written"
          debug $ "written" <+> pretty ha <+> pretty len
          atomically $ modifyTVar written (HS.insert (coerce ha))

        notice "pause 30 sec"
        pause @'Seconds 30

    -- second session: everything written must still be present
    ncqWithStorage testEnvDir $ \sto -> do
      hashes <- readTVarIO written
      for_ hashes $ \href -> do
        size <- hasBlock (AnyStorage sto) (coerce href)
        liftIO $ assertBool (show $ "found" <+> pretty href) (isJust size)

      notice $ "all" <+> pretty (HS.size hashes) <+> "found"

  -- test:ncq3:storage:basic [n] [pD] [pR]
  -- Exercises the generic storage API (putBlock/getBlock/hasBlock/delBlock
  -- and updateRef/getRef/delRef) on n random blocks, recording the expected
  -- final state of each block and ref. The storage is then reopened and the
  -- recorded state is re-verified after every fossil merge step until a step
  -- reports nothing left to merge.
  brief "basic full storage test"
   $ args [ arg "number (def: 100000)" "n"
          , arg "del. probability (def: 0.10)" "pD"
          , arg "ref probability (def: 0.01)" "pR"
          ]

   $ entry $ bindMatch "test:ncq3:storage:basic" $ nil_ $ \e -> do
    let (_, args) = splitOpts [] e
    let n  = headDef 100000 [ fromIntegral x | LitIntVal x <- args ]
    let pD  = headDef 0.10  [ realToFrac  x | LitScientificVal x <- drop 1 args ]
    -- pR is the third positional argument, as advertised in the help above;
    -- it used to be hard-coded to its default
    let pR  = headDef 0.01  [ realToFrac  x | LitScientificVal x <- drop 2 args ]

    -- expected state: Just = must be present with this value, Nothing = deleted
    blkz <- newTVarIO (mempty :: HashMap (Hash HbSync) (Maybe LBS.ByteString))
    refz <- newTVarIO (mempty :: HashMap (SomeRefKey HashRef) (Maybe (Hash HbSync)))

    runTest $ \TestEnv{..} -> do
      g <- liftIO MWC.createSystemRandom

      -- phase 1: write, with immediate read-back checks
      ncqWithStorage testEnvDir $ \sto -> do

        replicateM_ n $ liftIO do
          sz <- uniformRM (1, 64*1024) g
          bs <- genRandomBS g sz <&> LBS.fromStrict
          ha <- putBlock sto bs `orDie`  "Block not stored"
          mb <- getBlock sto ha

          when (mb /= Just bs) do
            assertFailure ("getBlock mismatch for " <> show (pretty ha))

          sz <- hasBlock sto ha `orDie` "block not found"

          assertBool ("hasBlock size mismatch for " <> show (pretty ha)) (sz == fromIntegral (LBS.length bs))

          atomically $ modifyTVar blkz (HM.insert ha (Just bs))

          pd <- uniformRM (0, 1.0) g

          -- with probability pD delete the block and check that it is gone
          when (pd < pD) do
            delBlock sto ha
            atomically $ modifyTVar blkz (HM.insert ha Nothing)
            found <- hasBlock sto ha
            assertBool (show $ "not deleted" <+> pretty ha) (isNothing found)

          pr <- uniformRM (0, 1.0) g

          -- with probability pR point 1..10 random refs at this block;
          -- each of those refs is deleted again with probability 0.10
          when (pr < pR) do
            k <- uniformRM (1,10) g
            replicateM_ k do
              ref <- SomeRefKey . HashRef . coerce <$> genRandomBS g 32
              updateRef sto ref ha
              atomically $ modifyTVar refz (HM.insert ref (Just ha))
              what <- getRef sto ref
              assertBool (show $ "ref not found" <+> pretty ref) (what == Just ha)

              prd <- uniformRM (0, 1.0) g

              when (prd < 0.10) do
                delRef sto ref
                atomically $ modifyTVar refz (HM.insert ref Nothing)

      notice "immediate test done"

      -- phase 2: reopen and verify against the recorded state
      ncqWithStorage testEnvDir $ \sto -> flip runContT pure do

        -- (blocks checked, refs checked), read by the progress reporter
        p <- newTVarIO (0,0)

        void $ ContT $ withAsync $ forever do
          (b,r) <- readTVarIO p
          ema <- readTVarIO (ncqWriteEMA sto)
          pause @'Seconds 2
          notice $ "progress" <+> pretty ema <+> pretty b <+> pretty r

        fix \next -> do

          blokz <- readTVarIO blkz <&> HM.toList
          for_ blokz $ \b -> do
            atomically $ modifyTVar p (over _1 succ)
            case b of
              (h,Nothing) -> liftIO do
                found <- hasBlock sto h
                assertBool (show $ "not deleted" <+> pretty h) (isNothing found)

              (h,Just bs) -> liftIO do
                size <- hasBlock sto h >>= orThrowUser ("not found" <+> pretty h)

                assertBool (show $ "size mismatch" <+> pretty h <+> pretty size <+> pretty (LBS.length bs))
                           (size == fromIntegral (LBS.length bs))

                bs1 <- getBlock sto h >>= orThrowUser ("not found data for" <+> pretty h)
                assertBool (show $ "data mismatch" <+> pretty h) (bs1 == bs)

          refsz <- readTVarIO refz <&> HM.toList
          for_ refsz \r -> do
            atomically $ modifyTVar p (over _2 succ)
            case r of
              (ref, Nothing) -> liftIO do
                what <- getRef sto ref
                assertBool (show $ "ref resurrected" <+> pretty ref) (isNothing what)

              (ref, Just hv) -> liftIO do
                what <- getRef sto ref
                assertBool (show $ "ref mismatch" <+> pretty ref <+> pretty what <+> pretty hv)
                           (what == Just hv)

          -- merge once more; repeat the whole verification if the step did work
          noone <- lift (ncqFossilMergeStep sto) <&> not

          if noone then
            none
          else do
            notice "again"
            next

      notice "re-opened storage test done"


  -- Further dictionary actions that are not defined in this file
  -- (presumably the endurance tests from the imported NCQ3.Endurance and
  -- NCQ3.EnduranceInProc modules — TODO confirm).
  ncq3EnduranceTest
  ncq3EnduranceTestInProc

-- | Write-throughput test.
--
-- First measures a baseline: @n@ random records (hash followed by payload,
-- each prefixed with a 32-bit length) are appended to a plain temp file under
-- @<testEnvDir>/input@ and the elapsed time and size are logged. Then
-- 'testWriteNThreads3' is run for every thread count from 1 to @tn@, using
-- @<testEnvDir>/ncq@ as the base directory.
--
-- The first argument (@noRead@) is not used by this function.
testNCQ3Concurrent1 :: MonadUnliftIO m
         => Bool
         -> Int
         -> Int
         -> TestEnv
         -> m ()

testNCQ3Concurrent1 noRead tn n TestEnv{..} = flip runContT pure do

  let inputDir = testEnvDir </> "input"
  let ncqDir   = testEnvDir </> "ncq"

  debug "preparing"

  mkdir inputDir

  debug $ pretty inputDir

  rng <- liftIO MWC.createSystemRandom

  logFile <- liftIO $ Temp.emptyTempFile inputDir "log-.bin"

  -- baseline: plain appends to a file; the size is read while the handle is
  -- still open
  (elapsed, bytes) <- timeItT $ liftIO $
    withFile logFile IO.AppendMode $ \hOut -> do
      replicateM_ n do
        len     <- MWC.uniformRM (64*1024, 256*1024) rng
        payload <- genRandomBS rng len
        let record = coerce (hashObject @HbSync payload) <> payload
        let prefix = N.bytestring32 (fromIntegral (BS.length record))
        BS.hPut hOut (prefix <> record)
      getFileSize logFile

  let megs  = realToFrac bytes / (1024**2)
  let speed = megs / elapsed
  notice $ "baseline" <+> pretty n
                      <+> pretty (sec3 elapsed)
                      <+> pretty (realToFrac @_ @(Fixed E2) megs)
                      <+> pretty (sec2 speed)

  -- storage runs, one per thread count
  for_ [1..tn] $ \threads ->
    liftIO (testWriteNThreads3 ncqDir threads n)


-- | Writes @n@ random blocks (sizes drawn from 64*1024 .. 256*1024) into a
-- fresh storage at @ncqDir </> show tnn@ using @tnn@ concurrent workers, and
-- logs the thread count, elapsed seconds, total megabytes and megabytes per
-- second.
--
-- The reported volume counts 36 extra bytes per block (32 for the key and 4
-- for the length) on top of the payload sizes. The timed interval spans the
-- whole 'ncqWithStorage' call.
--
-- NOTE(review): the single generator @g@ is used from all workers at once;
-- confirm the generator may be shared between threads.
testWriteNThreads3 :: forall g m . (MonadUnliftIO m)
                  => FilePath
                  -> Int
                  -> Int
                  -> m ()
testWriteNThreads3 ncqDir tnn n = do

    g <- liftIO MWC.createSystemRandom

    t0 <- getTimeCoarse

    w <- ncqWithStorage (ncqDir </> show tnn)  $ \sto -> do
       ss <- liftIO $ replicateM n $ MWC.uniformRM (64*1024, 256*1024) g

       pooledForConcurrentlyN_ tnn ss $ \len -> do
         tbs <- liftIO $ genRandomBS g len
         ncqPutBS sto (Just B) Nothing tbs
         -- atomically $ modifyTVar' tss (+ len)

       -- 32 bytes per key, 4 per len
       pure $ (List.length ss * 36) +  sum ss

    t1 <- getTimeCoarse

    let t = realToFrac (toNanoSecs (t1 - t0)) / 1e9

    let total = realToFrac w

    -- guard against a zero interval from the coarse clock
    let speed = if t > 0 then total / t else 0
    let totMegs = realToFrac @_ @(Fixed E2) $ total / (1024**2)
    let speedMbs = realToFrac @_ @(Fixed E2) $ speed / (1024**2)

    notice $ pretty tnn <+> pretty (sec2 t) <+> pretty totMegs <+> pretty speedMbs


-- | Lookup benchmark.
--
-- Positional arguments: number of blocks (default 100000), number of lookup
-- threads (default 1), number of measurement rounds (default 3).
-- Options: @-m STEP@ runs up to STEP index compaction steps before each
-- measurement and repeats while steps keep reporting work; @-M@ runs one
-- full index compaction before measuring.
--
-- Each round looks up every written hash with 'ncqLocate' and logs the
-- number of index files, the elapsed time and the number of hits; finally
-- the median of all recorded round times is logged.
--
-- NOTE(review): the single generator @g@ is used from all 8 writer threads
-- at once; confirm the generator may be shared between threads.
testNCQ3Lookup1 :: forall c m . (MonadUnliftIO m, IsContext c)
         => [Syntax c]
         -> TestEnv
         -> m ()

testNCQ3Lookup1 syn TestEnv{..} = do
  debug $ "testNCQ3Lookup1" <+> pretty syn
  let ncqDir = testEnvDir

  g <- liftIO MWC.createSystemRandom

  let (opts, argz) = splitOpts [("-m",1),("-M",0)] syn

  let n = headDef 100000 [ fromIntegral x | LitIntVal x <- argz ]
  let nt = headDef 1 $ [ fromIntegral x | LitIntVal x <- drop 1 argz ]
  let nl = headDef 3 $ [ fromIntegral x | LitIntVal x <- drop 2 argz ]
  let r = (64*1024, 256*1024)

  let merge = headDef 0 [ step | ListVal [StringLike "-m", LitIntVal step] <- opts ]
  let mergeFull = headDef False [ True | ListVal [StringLike "-M"] <- opts ]

  notice $ "insert" <+> pretty n <+> "random blocks of size" <+> parens (pretty r) <+> pretty opts

  thashes <- newTQueueIO

  sizes <- liftIO $ replicateM n (uniformRM r g )

  -- round durations, collected for the median
  res <- newTQueueIO

  -- Run `m` at most `n` times, stopping early as soon as it returns False;
  -- yields the last result. (The bound used to be `i > 0`, which allowed
  -- n+1 runs.)
  let ntimes n m = flip fix n $ \loop i -> do
        r <- m
        if r && i > 1 then loop (i - 1) else pure r

  ncqWithStorage ncqDir $ \sto -> liftIO do
    pooledForConcurrentlyN_ 8  sizes $ \size -> do
      z <- genRandomBS g size
      h <- ncqPutBS sto (Just B) Nothing z
      atomically $ writeTQueue thashes h

    hs <- atomically $ STM.flushTQueue thashes

    -- wrap the measurement `m` according to the compaction options
    let wrap m = if | mergeFull -> notice "full merge" >> ncqIndexCompactFull sto >> m
                    | merge > 0 ->
                       fix \next -> do
                          notice $ "run ncqIndexCompactStep" <+> pretty merge
                          left <- ntimes merge (ncqIndexCompactStep sto)
                          m
                          -- measure again while compaction still reports work
                          if left then next else none

                    | otherwise -> m
    wrap do

      idx <- readTVarIO (ncqState sto) <&> List.length . view #ncqStateIndex

      replicateM_ nl do

        tfound <- newTVarIO 0


        t0 <- getTimeCoarse

        liftIO $ pooledForConcurrentlyN_ nt hs $ \h -> do
          found <- ncqLocate sto h <&> isJust
          when found do
            atomically $ modifyTVar' tfound succ

        t1 <- getTimeCoarse

        let dt = realToFrac (toNanoSecs (t1 - t0)) / 1e9 :: Fixed E3
        atomically $ writeTQueue res dt

        found <- readTVarIO tfound

        notice $ "scan all files" <+> pretty idx <+> pretty dt <+> pretty found

      -- median over every round recorded so far (upper middle for even counts)
      m <- atomically (STM.flushTQueue res)
            <&> List.sort
            <&> \x -> atDef 0 x (List.length x `quot` 2)

      notice $ "median" <+> pretty m