Skip to content

Commit

Permalink
database directory configuration (#1128)
Browse files Browse the repository at this point in the history
* run amberdata monitor only when amberdata logging is enabled

* fix database director configuration and remove deprecated NodeId

* hide node-id command line option

* be more lenient when parsing deprecated node-id option

Co-authored-by: Emily Pillmore <[email protected]>
  • Loading branch information
larskuhtz and emilypi authored Aug 7, 2020
1 parent cf61dec commit 512debe
Show file tree
Hide file tree
Showing 17 changed files with 281 additions and 227 deletions.
2 changes: 1 addition & 1 deletion bench/Chainweb/Pact/Backend/ForkingBench.hs
Original file line number Diff line number Diff line change
Expand Up @@ -331,7 +331,7 @@ withResources trunkLength logLevel f = C.envWithCleanup create destroy unwrap
coinAccounts <- newMVar mempty
nonceCounter <- newIORef 1
txPerBlock <- newIORef 10
sqlEnv <- startSqliteDb testVer cid logger (Just tempDir) Nothing False
sqlEnv <- startSqliteDb cid logger tempDir False
pactService <-
startPact testVer logger blockHeaderDb payloadDb (testMemPoolAccess txPerBlock coinAccounts) sqlEnv
mainTrunkBlocks <-
Expand Down
1 change: 0 additions & 1 deletion chainweb.cabal
Original file line number Diff line number Diff line change
Expand Up @@ -193,7 +193,6 @@ library
, Chainweb.Miner.RestAPI
, Chainweb.Miner.RestAPI.Client
, Chainweb.Miner.RestAPI.Server
, Chainweb.NodeId
, Chainweb.NodeVersion
, Chainweb.Payload
, Chainweb.Payload.PayloadStore
Expand Down
2 changes: 1 addition & 1 deletion minimal-config.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -90,4 +90,4 @@ logging:
- key: component
value: local-handler
level: info
default: error
default: error
201 changes: 186 additions & 15 deletions node/ChainwebNode.hs
Original file line number Diff line number Diff line change
Expand Up @@ -5,6 +5,7 @@
{-# LANGUAGE FlexibleContexts #-}
{-# LANGUAGE FlexibleInstances #-}
{-# LANGUAGE LambdaCase #-}
{-# LANGUAGE MultiWayIf #-}
{-# LANGUAGE NumericUnderscores #-}
{-# LANGUAGE OverloadedStrings #-}
{-# LANGUAGE ScopedTypeVariables #-}
Expand Down Expand Up @@ -56,11 +57,13 @@ import Control.Monad.Managed
import Data.CAS
import Data.CAS.RocksDB
import qualified Data.HashSet as HS
import qualified Data.List as L
import qualified Data.Text as T
import Data.Time
import Data.Typeable

import GHC.Generics hiding (from)
import GHC.Stack
import GHC.Stats

import qualified Network.HTTP.Client as HTTP
Expand Down Expand Up @@ -173,6 +176,20 @@ pChainwebNodeConfiguration = id
% long "reset-chain-databases"
<> help "Reset the chain databases for all chains on startup"

getRocksDbDir :: HasCallStack => ChainwebNodeConfiguration -> IO FilePath
getRocksDbDir conf = (<> "/rocksDb") <$> getDbBaseDir conf

getPactDbDir :: HasCallStack => ChainwebNodeConfiguration -> IO FilePath
getPactDbDir conf = (<> "/sqlite") <$> getDbBaseDir conf

getDbBaseDir :: HasCallStack => ChainwebNodeConfiguration -> IO FilePath
getDbBaseDir conf = case _nodeConfigDatabaseDirectory conf of
Nothing -> getXdgDirectory XdgData
$ "chainweb-node/" <> sshow v <> "/0"
Just d -> return (d <> "/0")
where
v = _configChainwebVersion $ _nodeConfigChainweb conf

-- -------------------------------------------------------------------------- --
-- Monitors

Expand Down Expand Up @@ -244,10 +261,19 @@ runBlockUpdateMonitor logger db = L.withLoggerLabel ("component", "block-update-
<*> pure True -- _blockUpdateOrphaned
<*> ((0 -) <$> txCount bh) -- _blockUpdateTxCount

runAmberdataBlockMonitor :: (PayloadCasLookup cas, Logger logger) => Maybe ChainId -> logger -> CutDb cas -> IO ()
runAmberdataBlockMonitor cid logger db
= L.withLoggerLabel ("component", "amberdata-block-monitor") logger $ \l ->
runAmberdataBlockMonitor
:: PayloadCasLookup cas
=> Logger logger
=> EnableConfig AmberdataConfig
-> logger
-> CutDb cas
-> IO ()
runAmberdataBlockMonitor config logger db
| _enableConfigEnabled config = L.withLoggerLabel ("component", "amberdata-block-monitor") logger $ \l ->
runMonitorLoop "Chainweb.Logging.amberdataBlockMonitor" l (amberdataBlockMonitor cid l db)
| otherwise = return ()
where
cid = _amberdataChainId $ _enableConfigConfig config

-- type CutLog = HM.HashMap ChainId (ObjectEncoded BlockHeader)

Expand Down Expand Up @@ -289,30 +315,29 @@ runQueueMonitor logger cutDb = L.withLoggerLabel ("component", "queue-monitor")
-- -------------------------------------------------------------------------- --
-- Run Node

node :: Logger logger => ChainwebNodeConfiguration -> logger -> IO ()
node :: HasCallStack => Logger logger => ChainwebNodeConfiguration -> logger -> IO ()
node conf logger = do
rocksDbDir <- getRocksDbDir
when (_nodeConfigResetChainDbs conf) $ destroyRocksDb rocksDbDir
migrateDbDirectory logger conf
dbBaseDir <- getDbBaseDir conf
when (_nodeConfigResetChainDbs conf) $ removeDirectoryRecursive dbBaseDir
rocksDbDir <- getRocksDbDir conf
pactDbDir <- getPactDbDir conf
withRocksDb rocksDbDir $ \rocksDb -> do
logFunctionText logger Info $ "opened rocksdb in directory " <> sshow rocksDbDir
withChainweb cwConf logger rocksDb (_nodeConfigDatabaseDirectory conf) (_nodeConfigResetChainDbs conf) $ \cw -> mapConcurrently_ id
withChainweb cwConf logger rocksDb pactDbDir (_nodeConfigResetChainDbs conf) $ \cw -> mapConcurrently_ id
[ runChainweb cw
-- we should probably push 'onReady' deeper here but this should be ok
, runCutMonitor (_chainwebLogger cw) (_cutResCutDb $ _chainwebCutResources cw)
, runAmberdataBlockMonitor (amberdataChainId conf) (_chainwebLogger cw) (_cutResCutDb $ _chainwebCutResources cw)
, runAmberdataBlockMonitor (amberdataConfig conf) (_chainwebLogger cw) (_cutResCutDb $ _chainwebCutResources cw)
, runQueueMonitor (_chainwebLogger cw) (_cutResCutDb $ _chainwebCutResources cw)
, runRtsMonitor (_chainwebLogger cw)
, runBlockUpdateMonitor (_chainwebLogger cw) (_cutResCutDb $ _chainwebCutResources cw)
]
where
cwConf = _nodeConfigChainweb conf
nodeText = T.unpack (toText (_configNodeId cwConf))
v = _configChainwebVersion cwConf
getRocksDbDir = case _nodeConfigDatabaseDirectory conf of
Nothing -> getXdgDirectory XdgData
$ "chainweb-node/" <> sshow v <> "/" <> nodeText <> "/rocksDb"
Just d -> return d
amberdataChainId = _amberdataChainId . _enableConfigConfig . _logConfigAmberdataBackend . _nodeConfigLog
amberdataConfig = _logConfigAmberdataBackend . _nodeConfigLog



withNodeLogger
:: LogConfig
Expand Down Expand Up @@ -492,3 +517,149 @@ main = do
node conf logger
where
timeFormat = iso8601DateFormat (Just "%H:%M:%SZ")

-- -------------------------------------------------------------------------- --
-- Database Directory Migration
--
-- TODO: This code can be removed in chainweb-2.2.
--
-- Legacy default locations:
--
-- `$XDGDATA/chainweb-node/$CHAINWEB_VERSION/$NODEID/rocksDb`
-- `$XDGDATA/chainweb-node/$CHAINWEB_VERSION/$NODEID/sqlite`
--
-- New default locations:
--
-- `$XDGDATA/chainweb-node/$CHAINWEB_VERSION/0/rocksDb`
-- `$XDGDATA/chainweb-node/$CHAINWEB_VERSION/0/sqlite`
--
-- Legacy custom locations:
--
-- `${CUSTOM_PATH}`
-- `${CUSTOM_PATH}sqlite` # Note that there is no slash before `sqlite`
--
-- New custom locations:
--
-- `$CUSTOM_PATH/rocksDb`
-- `$CUSTOM_PATH/sqlite`
--
-- Migration scenarios:
--
-- 1. Custom location configured (and directory exists):
--
-- * Log warning
-- * `mkdir -p "$CUSTOM_PATH/rockDb"
-- * `mv "${CUSTOM_PATH}*" "$CUSTOM_PATH/rocksDb"
-- * `mv "${CUSTOM_PATH}slqite "$CUSTOM_PATH/sqlite"`
-- * fail if target directory already exists
--
-- 2. No custom location configured:
--
-- * Log warning if `$XDGDATA/chainweb-node/$CHAINWEB_VERSION/[1-9]*` exists
--
--
-- Migration code can be removed in the next version. We don't need to support
-- longer backwards compatibility, because in those situations it will be faster
-- and more convenient to start over with a fresh db.
--
migrateDbDirectory
:: HasCallStack
=> Logger logger
=> logger
-> ChainwebNodeConfiguration
-> IO ()
migrateDbDirectory logger config = case _nodeConfigDatabaseDirectory config of
Just custom -> do
let legacyCustomRocksDb = custom
newCustomRocksDb <- getRocksDbDir config

let legacyCustomPactDb = custom <> "sqlite"
newCustomPactDb <- getPactDbDir config

logg Warn
$ "Checking database directory layout for new chainweb version"
<> ". Legacy rocks db location: " <> T.pack legacyCustomRocksDb
<> ". New rocks db location: " <> T.pack newCustomRocksDb
<> ". Legacy sqlite db location: " <> T.pack legacyCustomPactDb
<> ". New sqlite db location: " <> T.pack newCustomPactDb
logg Warn
$ "If this operation fails it may be retried"
<> ". If it still fails the database may be corrupted and must be deleted and re-synchronized"

migrateDb "rocks" legacyCustomRocksDb newCustomRocksDb
migrateDb "sqlite" legacyCustomPactDb newCustomPactDb

Nothing -> do
defDir <- getXdgDirectory XdgData $ "chainweb-node/" <> sshow v
whenM (doesDirectoryExist defDir) $ do
dirs <- listDirectory defDir
forM_ (filter (/= defDir <> "/0") dirs) $ \i ->
logg Warn $ "ignoring existing database directory " <> T.pack (defDir <> "/" <> i)
where
logg = logFunctionText (setComponent "database-migration" logger)
v = _configChainwebVersion $ _nodeConfigChainweb config

-- There are many things that can go wrong in here. In particular we don't
-- check for permissions, mounts, hard links, etc. We also don't care about
-- races with other operating system threads.
--
-- However, the worst that can happen is that the database becomes corrupted
-- and must be resynchronized.
--
migrateDb db oldRaw newRaw = do
old <- canonicalizePath oldRaw
new <- canonicalizePath newRaw

oldExists <- doesDirectoryExist old
newExists <- doesDirectoryExist new
oldIsFile <- doesFileExist old
newIsFile <- doesFileExist new

let cpy f = copyFile (old <> "/" <> f) (new <> "/" <> f)
rm dir f = removeFile (dir <> "/" <> f)
ex dir f = doesFileExist (dir <> "/" <> f)

if
| oldIsFile -> do
logg Error
$ "A file with the name of the legacy directory for the " <> db <> " database exists. Terminating chainweb node"
error $ "A file with the name of the legacy directory for the " <> T.unpack db <> " database exists"
| newIsFile -> do
logg Error
$ "A file with the name of the new directory for " <> db <> " database exists. Terminating chainweb node"
error $ "A file with the name of the new directory for " <> T.unpack db <> " database exists"
| old == new -> logg Warn
$ "Legacy and new " <> db <> " directories are the the same. No action needed"
| not oldExists -> logg Warn
$ "Legacy " <> db <> " database directory doesn't exist. No action needed"
| newExists && (old `L.isPrefixOf` new) -> logg Warn
$ "New " <> db <> " database already exists. If an legacy database exists, it is ignored. No action needed"
| newExists -> logg Error
$ "Can't move legacy " <> db <> " database to new location because the database already exists"
<> ". Chainweb node will attempt to use the database at the new location"
| old `L.isPrefixOf` new -> do
logg Warn
$ "moving " <> db <> " database files to new location in sub-directory"
<> ". Legacy location: " <> T.pack old
<> ". New location: " <> T.pack new

fileEntries <- filterM (ex old) =<< listDirectory old

-- This isn't bullet proof. If something goes wrong here, there's a chance for a
-- corrupted database.
(mask_ $ createDirectoryIfMissing True new >> mapM_ cpy fileEntries)
`onException` do
removeDirectoryRecursive new
-- we know that the directory didn't exist before. So, this is safe.
-- (modulo races with other operating system processes)
logg Error $ "failed to create new " <> db <> " database directory " <> T.pack new
logg Info "done moving files. Cleaning up"
mapM_ (rm old) fileEntries
logg Info "done cleaning up"

| otherwise -> do
logg Warn
$ "moving " <> db <> " database:"
<> " Legacy location: " <> T.pack old
<> ". New location: " <> T.pack new
renameDirectory old new
Loading

0 comments on commit 512debe

Please sign in to comment.