From 18e91937cd94ea199acff95c2e25015482d82005 Mon Sep 17 00:00:00 2001
From: Julien Dessaux
Date: Wed, 8 Jan 2020 10:51:59 +0100
Subject: Initial import

---
 go.mod   |   3 +
 main.go  | 152 ++++++++++++++++++++++++++++++++++++++++++++++++++++
 spool.go |  72 ++++++++++++++++++++++++
 state.go | 188 ++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
 4 files changed, 415 insertions(+)
 create mode 100644 go.mod
 create mode 100644 main.go
 create mode 100644 spool.go
 create mode 100644 state.go

diff --git a/go.mod b/go.mod
new file mode 100644
index 0000000..505d991
--- /dev/null
+++ b/go.mod
@@ -0,0 +1,3 @@
+module bareos-zabbix-check
+
+go 1.13
diff --git a/main.go b/main.go
new file mode 100644
index 0000000..10a0d63
--- /dev/null
+++ b/main.go
@@ -0,0 +1,152 @@
+package main
+
+import (
+	"flag"
+	"fmt"
+	"log"
+	"os"
+	"path"
+	"time"
+)
+
+const (
+	bareosWorkDir   = "/var/lib/bareos"
+	bareosStateFile = "bareos-fd.9102.state"
+	baculaWorkDir   = "/var/lib/bacula"
+	baculaStateFile = "bacula-fd.9102.state"
+	spoolFile       = "bareos-zabbix-check.spool"
+)
+
+// We declare globally the variables that will hold the command line arguments
+var (
+	verbose   bool
+	quiet     bool
+	stateFile string
+	workDir   string
+)
+
+func main() {
+	var (
+		info           os.FileInfo
+		err            error
+		successfulJobs jobs
+		errorJobs      jobs
+		spoolJobs      jobs
+		jobName        string
+		ts             uint64
+		now            uint64
+		errorString    string
+		missingString  string
+	)
+
+	// command line arguments parsing
+	flag.BoolVar(&verbose, "v", false, "Activates verbose debugging output, defaults to false.")
+	flag.BoolVar(&quiet, "q", false, "Suppress all output, suitable to force a silent update of the spool file.")
+	flag.StringVar(&stateFile, "f", "", "Force the state file to use, defaults to "+bareosStateFile+" if it exists else "+baculaStateFile+".")
+	flag.StringVar(&workDir, "w", "", "Force the work directory to use, defaults to "+bareosWorkDir+" if it exists else "+baculaWorkDir+".")
+	flag.Parse()
+
+	// Determine the work directory to use.
+	if workDir != "" {
+		info, err = os.Stat(workDir)
+		if os.IsNotExist(err) || !info.IsDir() {
+			fmt.Printf("INFO Invalid work directory %s : it does not exist or is not a directory.\n", workDir)
+			os.Exit(0)
+		}
+	} else {
+		workDir = "/var/lib/bareos"
+		info, err = os.Stat(workDir)
+		if os.IsNotExist(err) || !info.IsDir() {
+			workDir = "/var/lib/bacula"
+			info, err := os.Stat(workDir)
+			if os.IsNotExist(err) || !info.IsDir() {
+				fmt.Println("INFO Could not find a suitable work directory. Is bareos or bacula installed?")
+				os.Exit(0)
+			}
+		}
+	}
+	workDir = path.Clean(workDir)
+	if verbose {
+		log.Println("Setting work directory to ", workDir)
+	}
+
+	// Finds the state file to parse
+	if stateFile != "" {
+		stateFile = path.Join(workDir, stateFile)
+		info, err = os.Stat(stateFile)
+		if os.IsNotExist(err) || info.IsDir() {
+			fmt.Printf("INFO The state file %s does not exist.\n", stateFile)
+			os.Exit(0)
+		}
+	} else {
+		stateFile = path.Join(workDir, bareosStateFile)
+		info, err = os.Stat(stateFile)
+		if os.IsNotExist(err) || info.IsDir() {
+			stateFile = path.Join(workDir, baculaStateFile)
+			info, err = os.Stat(stateFile)
+			if os.IsNotExist(err) || info.IsDir() {
+				fmt.Println("INFO Could not find a suitable state file. Has a job ever run?")
+				os.Exit(0)
+			}
+		}
+	}
+	if verbose {
+		log.Println("Using state file ", stateFile)
+	}
+
+	successfulJobs, errorJobs, err = parseStateFile()
+	if err != nil {
+		fmt.Print(err)
+		os.Exit(0)
+	}
+	// We will check for errors in loading the spool file only if necessary. If all jobs ran successfully without errors in the state file and we manage to write
+	// a new spool file without errors, then we will ignore any error here to avoid false positives during backup bootstrap
+	spoolJobs, err = loadSpool()
+
+	// if we have jobs in the spool we merge this list with successful jobs from the state file
+	if err == nil {
+		for jobName, ts = range spoolJobs {
+			var (
+				current uint64
+				ok      bool
+			)
+			current, ok = successfulJobs[jobName]
+			if !ok || current < ts {
+				successfulJobs[jobName] = ts
+			}
+		}
+	}
+	// we write this new spool
+	if err2 := saveSpool(successfulJobs); err2 != nil {
+		fmt.Printf("AVERAGE: Couldn't save spool : %s\n", err2)
+		os.Exit(0)
+	}
+
+	// We build the error string listing the jobs in error
+	for jobName, ts = range errorJobs {
+		if errorString == "" {
+			errorString = fmt.Sprintf("errors: %s", jobName)
+		} else {
+			errorString = fmt.Sprintf("%s, %s", errorString, jobName)
+		}
+	}
+	now = uint64(time.Now().Unix())
+	// Next we check if all jobs ran recently and build the missing string
+	for jobName, ts = range successfulJobs {
+		if ts < now-24*3600 {
+			if missingString == "" {
+				missingString = fmt.Sprintf("missing: %s", jobName)
+			} else {
+				missingString = fmt.Sprintf("%s, %s", missingString, jobName)
+			}
+		}
+	}
+	if errorString != "" || missingString != "" {
+		fmt.Printf("AVERAGE: %s %s", errorString, missingString)
+		if err != nil {
+			fmt.Printf(" additional errors: %s", err)
+		}
+	} else {
+		fmt.Printf("OK")
+	}
+}
diff --git a/spool.go b/spool.go
new file mode 100644
index 0000000..e3d00d9
--- /dev/null
+++ b/spool.go
@@ -0,0 +1,72 @@
+package main
+
+import (
+	"encoding/csv"
+	"fmt"
+	"log"
+	"os"
+	"path"
+	"strconv"
+)
+
+// jobs is a map that matches a job name string to its last successful run timestamp
+type jobs map[string]uint64
+
+func loadSpool() (entries jobs, err error) {
+	var (
+		file  *os.File
+		lines [][]string
+	)
+	// We read the spool
+	file, err = os.Open(path.Join(workDir, spoolFile))
+	if err != nil {
+		return nil, fmt.Errorf("INFO Couldn't open spool file: %s", err)
+	}
+	defer file.Close()
+	lines, err = csv.NewReader(file).ReadAll()
+	if err != nil {
+		return nil, fmt.Errorf("INFO Corrupted spool file : %s", err)
+	}
+	if verbose {
+		log.Printf("Spool file content : %v\n", lines)
+	}
+
+	entries = make(map[string]uint64)
+	for _, line := range lines {
+		var (
+			i int
+		)
+		i, err = strconv.Atoi(line[1])
+		if err != nil {
+			return nil, fmt.Errorf("INFO Corrupted spool file : couldn't parse timestamp entry")
+		}
+		entries[line[0]] = uint64(i)
+	}
+	return
+}
+
+func saveSpool(entries jobs) (err error) {
+	var (
+		file    *os.File
+		lines   [][]string
+		jobName string
+		ts      uint64
+		i       int
+	)
+	file, err = os.Create(path.Join(workDir, spoolFile))
+	if err != nil {
+		return fmt.Errorf("INFO Couldn't open spool file for writing : %s", err)
+	}
+	defer file.Close()
+
+	lines = make([][]string, len(entries))
+	i = 0
+	for jobName, ts = range entries {
+		lines[i] = make([]string, 2)
+		lines[i][0] = jobName
+		lines[i][1] = fmt.Sprintf("%d", ts)
+		i++
+	}
+	err = csv.NewWriter(file).WriteAll(lines)
+	return
+}
diff --git a/state.go b/state.go
new file mode 100644
index 0000000..2cfb5df
--- /dev/null
+++ b/state.go
@@ -0,0 +1,188 @@
+package main
+
+import (
+	"bytes"
+	"encoding/binary"
+	"fmt"
+	"log"
+	"os"
+	"regexp"
+)
+
+// stateFileHeader : A structure to hold the header of the state file. It is statically aligned for amd64 architecture
+type stateFileHeader struct {
+	ID                        [14]byte
+	_                         int16
+	Version                   int32
+	_                         int32
+	LastJobsAddr              uint64
+	EndOfRecentJobResultsList uint64
+	Reserved                  [19]uint64
+}
+
+func (sfh stateFileHeader) String() string {
+	return fmt.Sprintf("ID: \"%s\", Version: %d, LastJobsAddr: %d, EndOfRecentJobResultsList: %d", sfh.ID[:len(sfh.ID)-2], sfh.Version, sfh.LastJobsAddr, sfh.EndOfRecentJobResultsList)
+}
+
+// jobEntry : A structure to hold a job result from the state file
+type jobEntry struct {
+	Pad            [16]byte
+	Errors         int32
+	JobType        int32
+	JobStatus      int32
+	JobLevel       int32
+	JobID          uint32
+	VolSessionID   uint32
+	VolSessionTime uint32
+	JobFiles       uint32
+	JobBytes       uint64
+	StartTime      uint64
+	EndTime        uint64
+	Job            [maxNameLength]byte
+}
+
+func (je jobEntry) String() string {
+	var matches = jobNameRegex.FindSubmatchIndex(je.Job[:])
+	var jobNameLen int
+	if len(matches) >= 4 {
+		jobNameLen = matches[3]
+	}
+	return fmt.Sprintf("Errors: %d, JobType: %c, JobStatus: %c, JobLevel: %c, JobID: %d, VolSessionID: %d, VolSessionTime: %d, JobFiles: %d, JobBytes: %d, StartTime: %d, EndTime: %d, Job: %s",
+		je.Errors, je.JobType, je.JobStatus, je.JobLevel, je.JobID, je.VolSessionID, je.VolSessionTime, je.JobFiles, je.JobBytes, je.StartTime, je.EndTime, je.Job[:jobNameLen])
+}
+
+const (
+	// maxNameLength : the maximum length of a string, hard coded in bareos
+	maxNameLength = 128
+	// stateFileHeaderLength : the length of the state file header struct
+	stateFileHeaderLength = 14 + 2 + 4 + 4 + 8 + 8 + 19*8
+	// jobResultLength : the length of the job result struct
+	jobResultLength = 16 + 4 + 4 + 4 + 4 + 4 + 4 + 4 + 4 + 8 + 8 + 8 + maxNameLength
+)
+
+var jobNameRegex = regexp.MustCompilePOSIX(`^([-A-Za-z0-9_]+)\.[0-9]{4}-[0-9]{2}-[0-9]{2}.*`)
+
+// readNextBytes : Reads the next "number" bytes from a "file", returns the number of bytes actually read as well as the bytes read
+func readNextBytes(file *os.File, number int) (int, []byte) {
+	var bytes = make([]byte, number)
+
+	var n, err = file.Read(bytes)
+	if err != nil {
+		fmt.Printf("INFO Corrupted state file : file.Read failed in %s : %s\n", stateFile, err)
+	}
+
+	return n, bytes
+}
+
+func parseStateFile() (successfulJobs jobs, errorJobs jobs, err error) {
+	var (
+		n               int
+		stateFileHandle *os.File
+		data            []byte
+		buffer          *bytes.Buffer
+		numberOfJobs    uint32
+		matches         []int
+	)
+	// Open the state file
+	stateFileHandle, err = os.Open(stateFile)
+	if err != nil {
+		return nil, nil, fmt.Errorf("INFO Couldn't open state file : %s", err)
+	}
+	defer stateFileHandle.Close()
+
+	// Parsing the state file header
+	var header stateFileHeader
+	n, data = readNextBytes(stateFileHandle, stateFileHeaderLength)
+	if n != stateFileHeaderLength {
+		return nil, nil, fmt.Errorf("INFO Corrupted state file : invalid header length in %s", stateFile)
+	}
+	buffer = bytes.NewBuffer(data)
+	err = binary.Read(buffer, binary.LittleEndian, &header)
+	if err != nil {
+		return nil, nil, fmt.Errorf("INFO Corrupted state file : binary.Read failed on header in %s : %s", stateFile, err)
+	}
+	if verbose {
+		log.Printf("Parsed header: %+s\n", header)
+	}
+	if id := string(header.ID[:len(header.ID)-1]); id != "Bareos State\n" && id != "Bacula State\n" {
+		return nil, nil, fmt.Errorf("INFO Corrupted state file : Not a bareos or bacula state file %s", stateFile)
+	}
+	if header.Version != 4 {
+		return nil, nil, fmt.Errorf("INFO Invalid state file : This script only supports bareos state file version 4, got %d", header.Version)
+	}
+	if header.LastJobsAddr == 0 {
+		return nil, nil, fmt.Errorf("INFO No jobs exist in the state file")
+	}
+
+	// We seek to the jobs position in the state file
+	stateFileHandle.Seek(int64(header.LastJobsAddr), 0)
+
+	// We read how many jobs there are in the state file
+	n, data = readNextBytes(stateFileHandle, 4)
+	if n != 4 {
+		return nil, nil, fmt.Errorf("INFO Corrupted state file : invalid numberOfJobs read length in %s", stateFile)
+	}
+	buffer = bytes.NewBuffer(data)
+	err = binary.Read(buffer, binary.LittleEndian, &numberOfJobs)
+	if err != nil {
+		return nil, nil, fmt.Errorf("INFO Corrupted state file : binary.Read failed on numberOfJobs in %s : %s", stateFile, err)
+	}
+	if verbose {
+		log.Printf("%d jobs found in state file\n", numberOfJobs)
+	}
+
+	// We parse the job entries
+	successfulJobs = make(map[string]uint64)
+	errorJobs = make(map[string]uint64)
+	for ; numberOfJobs > 0; numberOfJobs-- {
+		var (
+			jobResult jobEntry
+			jobName   string
+		)
+		n, data = readNextBytes(stateFileHandle, jobResultLength)
+		if n != jobResultLength {
+			return nil, nil, fmt.Errorf("INFO Corrupted state file : invalid job entry in %s", stateFile)
+		}
+		buffer = bytes.NewBuffer(data)
+		err = binary.Read(buffer, binary.LittleEndian, &jobResult)
+		if err != nil {
+			return nil, nil, fmt.Errorf("INFO Corrupted state file : binary.Read failed on job entry in %s : %s", stateFile, err)
+		}
+		matches = jobNameRegex.FindSubmatchIndex(jobResult.Job[:])
+		if len(matches) >= 4 {
+			jobName = string(jobResult.Job[:matches[3]])
+		} else {
+			return nil, nil, fmt.Errorf("INFO Couldn't parse job name, this shouldn't happen : %s", jobResult.Job[:])
+		}
+		if verbose {
+			log.Printf("Parsed job entry: %s\n", jobResult)
+		}
+		// If the job is of type backup (B == ascii 66)
+		if jobResult.JobType == 66 {
+			var (
+				successExists  bool
+				errorExists    bool
+				currentSuccess uint64
+				currentError   uint64
+			)
+			currentSuccess, successExists = successfulJobs[jobName]
+			currentError, errorExists = errorJobs[jobName]
+			// If the job is of status success (T == ascii 84)
+			if jobResult.JobStatus == 84 {
+				// if there is an older entry in errorJobs we delete it
+				if errorExists && jobResult.StartTime > currentError {
+					delete(errorJobs, jobName)
+				}
+				// if there are no entries more recent in successfulJobs we add this one
+				if !successExists || successExists && jobResult.StartTime > currentSuccess {
+					successfulJobs[jobName] = jobResult.StartTime
+				}
+			} else {
+				if !errorExists || jobResult.StartTime > currentError {
+					errorJobs[jobName] = jobResult.StartTime
+				}
+			}
+		}
+	}
+	return
+}
--
cgit v1.2.3