X-Git-Url: https://code.grnet.gr/git/ganeti-local/blobdiff_plain/b0517d61247b932bdbd5bd9f54d0be6798e6e9b0..12fa49b3f82ea5c4efc831f4045a62e0ddb27e09:/hbal.hs diff --git a/hbal.hs b/hbal.hs index b6c2d16..3ac9e78 100644 --- a/hbal.hs +++ b/hbal.hs @@ -1,4 +1,25 @@ -{-| Solver for N+1 cluster errors +{-| Cluster rebalancer + +-} + +{- + +Copyright (C) 2009 Google Inc. + +This program is free software; you can redistribute it and/or modify +it under the terms of the GNU General Public License as published by +the Free Software Foundation; either version 2 of the License, or +(at your option) any later version. + +This program is distributed in the hope that it will be useful, but +WITHOUT ANY WARRANTY; without even the implied warranty of +MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +General Public License for more details. + +You should have received a copy of the GNU General Public License +along with this program; if not, write to the Free Software +Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA +02110-1301, USA. -} @@ -6,102 +27,42 @@ module Main (main) where import Data.List import Data.Function -import Data.Maybe (isJust, fromJust, fromMaybe) +import Data.Maybe (isJust, fromJust) import Monad import System import System.IO -import System.Console.GetOpt import qualified System -import Text.Printf (printf) +import Text.Printf (printf, hPrintf) import qualified Ganeti.HTools.Container as Container import qualified Ganeti.HTools.Cluster as Cluster import qualified Ganeti.HTools.Node as Node -import qualified Ganeti.HTools.CLI as CLI -import Ganeti.HTools.Rapi -import Ganeti.HTools.Utils --- | Command line options structure. -data Options = Options - { optShowNodes :: Bool -- ^ Whether to show node status - , optShowCmds :: Maybe FilePath -- ^ Whether to show the command list - , optOneline :: Bool -- ^ Switch output to a single line - , optNodef :: FilePath -- ^ Path to the nodes file - , optNodeSet :: Bool -- ^ The nodes have been set by options - , optInstf :: FilePath -- ^ Path to the instances file - , optInstSet :: Bool -- ^ The insts have been set by options - , optMaxLength :: Int -- ^ Stop after this many steps - , optMaster :: String -- ^ Collect data from RAPI - , optVerbose :: Int -- ^ Verbosity level - , optOffline :: [String] -- ^ Names of offline nodes - , optMinScore :: Cluster.Score -- ^ The minimum score we aim for - , optShowVer :: Bool -- ^ Just show the program version - , optShowHelp :: Bool -- ^ Just show the help - } deriving Show - --- | Default values for the command line options. -defaultOptions :: Options -defaultOptions = Options - { optShowNodes = False - , optShowCmds = Nothing - , optOneline = False - , optNodef = "nodes" - , optNodeSet = False - , optInstf = "instances" - , optInstSet = False - , optMaxLength = -1 - , optMaster = "" - , optVerbose = 0 - , optOffline = [] - , optMinScore = 1e-9 - , optShowVer = False - , optShowHelp = False - } +import Ganeti.HTools.CLI +import Ganeti.HTools.ExtLoader +import Ganeti.HTools.Utils -- | Options list and functions -options :: [OptDescr (Options -> Options)] +options :: [OptType] options = - [ Option ['p'] ["print-nodes"] - (NoArg (\ opts -> opts { optShowNodes = True })) - "print the final node list" - , Option ['C'] ["print-commands"] - (OptArg ((\ f opts -> opts { optShowCmds = Just f }) . fromMaybe "-") - "FILE") - "print the ganeti command list for reaching the solution,\ - \if an argument is passed then write the commands to a file named\ - \ as such" - , Option ['o'] ["oneline"] - (NoArg (\ opts -> opts { optOneline = True })) - "print the ganeti command list for reaching the solution" - , Option ['n'] ["nodes"] - (ReqArg (\ f opts -> opts { optNodef = f, optNodeSet = True }) "FILE") - "the node list FILE" - , Option ['i'] ["instances"] - (ReqArg (\ f opts -> opts { optInstf = f, optInstSet = True }) "FILE") - "the instance list FILE" - , Option ['m'] ["master"] - (ReqArg (\ m opts -> opts { optMaster = m }) "ADDRESS") - "collect data via RAPI at the given ADDRESS" - , Option ['l'] ["max-length"] - (ReqArg (\ i opts -> opts { optMaxLength = (read i)::Int }) "N") - "cap the solution at this many moves (useful for very unbalanced \ - \clusters)" - , Option ['v'] ["verbose"] - (NoArg (\ opts -> opts { optVerbose = (optVerbose opts) + 1 })) - "increase the verbosity level" - , Option ['O'] ["offline"] - (ReqArg (\ n opts -> opts { optOffline = n:optOffline opts }) "NODE") - " set node as offline" - , Option ['e'] ["min-score"] - (ReqArg (\ e opts -> opts { optMinScore = read e }) "EPSILON") - " mininum score to aim for" - , Option ['V'] ["version"] - (NoArg (\ opts -> opts { optShowVer = True})) - "show the version of the program" - , Option ['h'] ["help"] - (NoArg (\ opts -> opts { optShowHelp = True})) - "show help" + [ oPrintNodes + , oPrintCommands + , oOneline + , oNodeFile + , oInstFile + , oRapiMaster + , oLuxiSocket + , oMaxSolLength + , oVerbose + , oQuiet + , oOfflineNode + , oMinScore + , oMaxCpu + , oMinDisk + , oDiskMoves + , oShowVer + , oShowHelp ] {- | Start computing the solution at the given depth and recurse until @@ -110,115 +71,102 @@ we find a valid solution or we exceed the maximum depth. -} iterateDepth :: Cluster.Table -- ^ The starting table -> Int -- ^ Remaining length - -> Cluster.NameList -- ^ Node idx to name list - -> Cluster.NameList -- ^ Inst idx to name list + -> Bool -- ^ Allow disk moves -> Int -- ^ Max node name len -> Int -- ^ Max instance name len -> [[String]] -- ^ Current command list - -> Bool -- ^ Wheter to be silent + -> Bool -- ^ Whether to be silent -> Cluster.Score -- ^ Score at which to stop -> IO (Cluster.Table, [[String]]) -- ^ The resulting table and -- commands -iterateDepth ini_tbl max_rounds ktn kti nmlen imlen +iterateDepth ini_tbl max_rounds disk_moves nmlen imlen cmd_strs oneline min_score = - let Cluster.Table ini_nl ini_il ini_cv ini_plc = ini_tbl - all_inst = Container.elems ini_il - node_idx = map Node.idx . filter (not . Node.offline) $ - Container.elems ini_nl - fin_tbl = Cluster.checkMove node_idx ini_tbl all_inst - (Cluster.Table _ _ fin_cv fin_plc) = fin_tbl - ini_plc_len = length ini_plc - fin_plc_len = length fin_plc - allowed_next = (max_rounds < 0 || length fin_plc < max_rounds) + let Cluster.Table ini_nl ini_il _ _ = ini_tbl + m_fin_tbl = Cluster.tryBalance ini_tbl max_rounds disk_moves min_score in - do - let - (sol_line, cmds) = Cluster.printSolutionLine ini_il ktn kti - nmlen imlen (head fin_plc) fin_plc_len - upd_cmd_strs = cmds:cmd_strs - unless (oneline || fin_plc_len == ini_plc_len) $ do - putStrLn sol_line - hFlush stdout - (if fin_cv < ini_cv then -- this round made success, try deeper - if allowed_next && fin_cv > min_score - then iterateDepth fin_tbl max_rounds ktn kti - nmlen imlen upd_cmd_strs oneline min_score - -- don't go deeper, but return the better solution - else return (fin_tbl, upd_cmd_strs) - else - return (ini_tbl, cmd_strs)) + case m_fin_tbl of + Just fin_tbl -> + do + let + (Cluster.Table _ _ _ fin_plc) = fin_tbl + fin_plc_len = length fin_plc + (sol_line, cmds) = Cluster.printSolutionLine ini_nl ini_il + nmlen imlen (head fin_plc) fin_plc_len + upd_cmd_strs = cmds:cmd_strs + unless oneline $ do + putStrLn sol_line + hFlush stdout + iterateDepth fin_tbl max_rounds disk_moves + nmlen imlen upd_cmd_strs oneline min_score + Nothing -> return (ini_tbl, cmd_strs) + +-- | Formats the solution for the oneline display +formatOneline :: Double -> Int -> Double -> String +formatOneline ini_cv plc_len fin_cv = + printf "%.8f %d %.8f %8.3f" ini_cv plc_len fin_cv + (if fin_cv == 0 then 1 else ini_cv / fin_cv) -- | Main function. main :: IO () main = do cmd_args <- System.getArgs - (opts, args) <- CLI.parseOpts cmd_args "hbal" options - defaultOptions optShowHelp + (opts, args) <- parseOpts cmd_args "hbal" options unless (null args) $ do hPutStrLn stderr "Error: this program doesn't take any arguments." exitWith $ ExitFailure 1 - when (optShowVer opts) $ do - putStr $ CLI.showVersion "hbal" - exitWith ExitSuccess - - (env_node, env_inst) <- CLI.parseEnv () - let nodef = if optNodeSet opts then optNodef opts - else env_node - instf = if optInstSet opts then optInstf opts - else env_inst - oneline = optOneline opts + let oneline = optOneline opts verbose = optVerbose opts - (node_data, inst_data) = - case optMaster opts of - "" -> (readFile nodef, - readFile instf) - host -> (readData getNodes host, - readData getInstances host) - (loaded_nl, il, csf, ktn, kti) <- liftM2 Cluster.loadData node_data inst_data - let (fix_msgs, fixed_nl) = Cluster.checkData loaded_nl il ktn kti - - unless (null fix_msgs) $ do - putStrLn "Warning: cluster has inconsistent data:" - putStrLn . unlines . map (\s -> printf " - %s" s) $ fix_msgs + (fixed_nl, il, csf) <- loadExternalData opts let offline_names = optOffline opts - all_names = snd . unzip $ ktn - offline_wrong = filter (\n -> not $ elem n all_names) offline_names - offline_indices = fst . unzip . - filter (\(_, n) -> elem n offline_names) $ ktn + all_nodes = Container.elems fixed_nl + all_names = map Node.name all_nodes + offline_wrong = filter (flip notElem all_names) offline_names + offline_indices = map Node.idx $ + filter (\n -> elem (Node.name n) offline_names) + all_nodes + m_cpu = optMcpu opts + m_dsk = optMdsk opts when (length offline_wrong > 0) $ do - printf "Wrong node name(s) set as offline: %s\n" - (commaJoin offline_wrong) + hPrintf stderr "Wrong node name(s) set as offline: %s\n" + (commaJoin offline_wrong) exitWith $ ExitFailure 1 - let nl = Container.map (\n -> if elem (Node.idx n) offline_indices + let nm = Container.map (\n -> if elem (Node.idx n) offline_indices then Node.setOffline n True else n) fixed_nl + nl = Container.map (flip Node.setMdsk m_dsk . flip Node.setMcpu m_cpu) + nm + + when (Container.size il == 0) $ do + (if oneline then putStrLn $ formatOneline 0 0 0 + else printf "Cluster is empty, exiting.\n") + exitWith ExitSuccess unless oneline $ printf "Loaded %d nodes, %d instances\n" (Container.size nl) (Container.size il) - when (length csf > 0 && not oneline && verbose > 0) $ do - printf "Note: Stripping common suffix of '%s' from names\n" csf + when (length csf > 0 && not oneline && verbose > 1) $ + printf "Note: Stripping common suffix of '%s' from names\n" csf let (bad_nodes, bad_instances) = Cluster.computeBadItems nl il unless (oneline || verbose == 0) $ printf "Initial check done: %d bad nodes, %d bad instances.\n" (length bad_nodes) (length bad_instances) - when (length bad_nodes > 0) $ do + when (length bad_nodes > 0) $ putStrLn "Cluster is not N+1 happy, continuing but no guarantee \ \that the cluster will end N+1 happy." when (optShowNodes opts) $ do putStrLn "Initial cluster status:" - putStrLn $ Cluster.printNodes ktn nl + putStrLn $ Cluster.printNodes nl let ini_cv = Cluster.compCV nl ini_tbl = Cluster.Table nl il ini_cv [] @@ -226,36 +174,35 @@ main = do when (ini_cv < min_cv) $ do (if oneline then - printf "%.8f %d %.8f %8.3f\n" - ini_cv (0::Integer) ini_cv (1::Double) + putStrLn $ formatOneline ini_cv 0 ini_cv else printf "Cluster is already well balanced (initial score %.6g,\n\ \minimum score %.6g).\nNothing to do, exiting\n" ini_cv min_cv) exitWith ExitSuccess - unless oneline (if verbose > 1 then + unless oneline (if verbose > 2 then printf "Initial coefficients: overall %.8f, %s\n" ini_cv (Cluster.printStats nl) else printf "Initial score: %.8f\n" ini_cv) unless oneline $ putStrLn "Trying to minimize the CV..." - let mlen_fn = maximum . (map length) . snd . unzip - imlen = mlen_fn kti - nmlen = mlen_fn ktn + let imlen = Container.maxNameLen il + nmlen = Container.maxNameLen nl (fin_tbl, cmd_strs) <- iterateDepth ini_tbl (optMaxLength opts) - ktn kti nmlen imlen [] oneline min_cv + (optDiskMoves opts) + nmlen imlen [] oneline min_cv let (Cluster.Table fin_nl _ fin_cv fin_plc) = fin_tbl ord_plc = reverse fin_plc sol_msg = if null fin_plc then printf "No solution found\n" - else (if verbose > 1 - then printf "Final coefficients: overall %.8f, %s\n" - fin_cv (Cluster.printStats fin_nl) - else printf "Cluster score improved from %.8f to %.8f\n" - ini_cv fin_cv - ) + else if verbose > 2 + then printf "Final coefficients: overall %.8f, %s\n" + fin_cv (Cluster.printStats fin_nl) + else printf "Cluster score improved from %.8f to %.8f\n" + ini_cv fin_cv + ::String unless oneline $ putStr sol_msg @@ -274,20 +221,21 @@ main = do filter (/= "check") . lines $ cmd_data) else do - writeFile out_path (CLI.shTemplate ++ cmd_data) + writeFile out_path (shTemplate ++ cmd_data) printf "The commands have been written to file '%s'\n" out_path) when (optShowNodes opts) $ do - let (orig_mem, orig_disk) = Cluster.totalResources nl - (final_mem, final_disk) = Cluster.totalResources fin_nl + let ini_cs = Cluster.totalResources nl + fin_cs = Cluster.totalResources fin_nl putStrLn "" putStrLn "Final cluster status:" - putStrLn $ Cluster.printNodes ktn fin_nl - when (verbose > 2) $ + putStrLn $ Cluster.printNodes fin_nl + when (verbose > 3) $ do - printf "Original: mem=%d disk=%d\n" orig_mem orig_disk - printf "Final: mem=%d disk=%d\n" final_mem final_disk - when oneline $ do - printf "%.8f %d %.8f %8.3f\n" - ini_cv (length ord_plc) fin_cv (ini_cv / fin_cv) + printf "Original: mem=%d disk=%d\n" + (Cluster.cs_fmem ini_cs) (Cluster.cs_fdsk ini_cs) + printf "Final: mem=%d disk=%d\n" + (Cluster.cs_fmem fin_cs) (Cluster.cs_fdsk fin_cs) + when oneline $ + putStrLn $ formatOneline ini_cv (length ord_plc) fin_cv