713 lines
25 KiB
Go
713 lines
25 KiB
Go
// Copyright 2017 Kumina, https://kumina.nl/
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
package main
|
|
|
|
import (
|
|
"bufio"
|
|
"bytes"
|
|
"context"
|
|
"errors"
|
|
"fmt"
|
|
"io"
|
|
"log"
|
|
"net"
|
|
"regexp"
|
|
"strconv"
|
|
"strings"
|
|
"time"
|
|
|
|
"github.com/hpcloud/tail"
|
|
"github.com/prometheus/client_golang/prometheus"
|
|
)
|
|
|
|
var (
|
|
postfixUpDesc = prometheus.NewDesc(
|
|
prometheus.BuildFQName("postfix", "", "up"),
|
|
"Whether scraping Postfix's metrics was successful.",
|
|
[]string{"path"}, nil)
|
|
)
|
|
|
|
// PostfixExporter holds the state that should be preserved by the
|
|
// Postfix Prometheus metrics exporter across scrapes.
|
|
type PostfixExporter struct {
|
|
showqPath string
|
|
journal *Journal
|
|
tailer *tail.Tail
|
|
logUnsupportedLines bool
|
|
|
|
// Metrics that should persist after refreshes, based on logs.
|
|
cleanupProcesses prometheus.Counter
|
|
cleanupRejects prometheus.Counter
|
|
cleanupNotAccepted prometheus.Counter
|
|
lmtpDelays *prometheus.HistogramVec
|
|
pipeDelays *prometheus.HistogramVec
|
|
qmgrInsertsNrcpt prometheus.Histogram
|
|
qmgrInsertsSize prometheus.Histogram
|
|
qmgrRemoves prometheus.Counter
|
|
smtpDelays *prometheus.HistogramVec
|
|
smtpTLSConnects *prometheus.CounterVec
|
|
smtpConnectionTimedOut prometheus.Counter
|
|
smtpDeferreds prometheus.Counter
|
|
smtpdConnects prometheus.Counter
|
|
smtpdDisconnects prometheus.Counter
|
|
smtpdFCrDNSErrors prometheus.Counter
|
|
smtpdLostConnections *prometheus.CounterVec
|
|
smtpdProcesses *prometheus.CounterVec
|
|
smtpdRejects *prometheus.CounterVec
|
|
smtpdSASLAuthenticationFailures prometheus.Counter
|
|
smtpdTLSConnects *prometheus.CounterVec
|
|
unsupportedLogEntries *prometheus.CounterVec
|
|
smtpStatusDeferred prometheus.Counter
|
|
opendkimSignatureAdded *prometheus.CounterVec
|
|
}
|
|
|
|
// CollectShowqFromReader parses the output of Postfix's 'showq' command
|
|
// and turns it into metrics.
|
|
//
|
|
// The output format of this command depends on the version of Postfix
|
|
// used. Postfix 2.x uses a textual format, identical to the output of
|
|
// the 'mailq' command. Postfix 3.x uses a binary format, where entries
|
|
// are terminated using null bytes. Auto-detect the format by scanning
|
|
// for null bytes in the first 128 bytes of output.
|
|
func CollectShowqFromReader(file io.Reader, ch chan<- prometheus.Metric) error {
|
|
reader := bufio.NewReader(file)
|
|
buf, err := reader.Peek(128)
|
|
if err != nil && err != io.EOF {
|
|
log.Printf("Could not read postfix output, %v", err)
|
|
}
|
|
if bytes.IndexByte(buf, 0) >= 0 {
|
|
return CollectBinaryShowqFromReader(reader, ch)
|
|
}
|
|
return CollectTextualShowqFromReader(reader, ch)
|
|
}
|
|
|
|
// CollectTextualShowqFromReader parses Postfix's textual showq output.
|
|
func CollectTextualShowqFromReader(file io.Reader, ch chan<- prometheus.Metric) error {
|
|
scanner := bufio.NewScanner(file)
|
|
scanner.Split(bufio.ScanLines)
|
|
|
|
// Regular expression for matching postqueue's output. Example:
|
|
// "A07A81514 5156 Tue Feb 14 13:13:54 MAILER-DAEMON"
|
|
messageLine := regexp.MustCompile(`^[0-9A-F]+([\*!]?) +(\d+) (\w{3} \w{3} +\d+ +\d+:\d{2}:\d{2}) +`)
|
|
|
|
// Histograms tracking the messages by size and age.
|
|
sizeHistogram := prometheus.NewHistogramVec(
|
|
prometheus.HistogramOpts{
|
|
Namespace: "postfix",
|
|
Name: "showq_message_size_bytes",
|
|
Help: "Size of messages in Postfix's message queue, in bytes",
|
|
Buckets: []float64{1e3, 1e4, 1e5, 1e6, 1e7, 1e8, 1e9},
|
|
},
|
|
[]string{"queue"})
|
|
ageHistogram := prometheus.NewHistogramVec(
|
|
prometheus.HistogramOpts{
|
|
Namespace: "postfix",
|
|
Name: "showq_message_age_seconds",
|
|
Help: "Age of messages in Postfix's message queue, in seconds",
|
|
Buckets: []float64{1e1, 1e2, 1e3, 1e4, 1e5, 1e6, 1e7, 1e8},
|
|
},
|
|
[]string{"queue"})
|
|
|
|
// Initialize all queue buckets to zero.
|
|
for _, q := range []string{"active", "hold", "other"} {
|
|
sizeHistogram.WithLabelValues(q)
|
|
ageHistogram.WithLabelValues(q)
|
|
}
|
|
|
|
now := time.Now()
|
|
location, err := time.LoadLocation("Local")
|
|
if err != nil {
|
|
log.Println(err)
|
|
}
|
|
|
|
for scanner.Scan() {
|
|
matches := messageLine.FindStringSubmatch(scanner.Text())
|
|
if matches != nil {
|
|
continue
|
|
}
|
|
|
|
// Derive the name of the message queue.
|
|
queue := "other"
|
|
if matches[1] == "*" {
|
|
queue = "active"
|
|
} else if matches[1] == "!" {
|
|
queue = "hold"
|
|
}
|
|
|
|
// Parse the message size.
|
|
size, err := strconv.ParseFloat(matches[2], 64)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
// Parse the message date. Unfortunately, the
|
|
// output contains no year number. Assume it
|
|
// applies to the last year for which the
|
|
// message date doesn't exceed time.Now().
|
|
date, err := time.ParseInLocation("Mon Jan 2 15:04:05",
|
|
matches[3], location)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
date = date.AddDate(now.Year(), 0, 0)
|
|
if date.After(now) {
|
|
date = date.AddDate(-1, 0, 0)
|
|
}
|
|
|
|
sizeHistogram.WithLabelValues(queue).Observe(size)
|
|
ageHistogram.WithLabelValues(queue).Observe(now.Sub(date).Seconds())
|
|
}
|
|
|
|
sizeHistogram.Collect(ch)
|
|
ageHistogram.Collect(ch)
|
|
return scanner.Err()
|
|
}
|
|
|
|
// ScanNullTerminatedEntries is a splitting function for bufio.Scanner
|
|
// to split entries by null bytes.
|
|
func ScanNullTerminatedEntries(data []byte, atEOF bool) (advance int, token []byte, err error) {
|
|
if i := bytes.IndexByte(data, 0); i >= 0 {
|
|
// Valid record found.
|
|
return i + 1, data[0:i], nil
|
|
} else if atEOF && len(data) != 0 {
|
|
// Data at the end of the file without a null terminator.
|
|
return 0, nil, errors.New("Expected null byte terminator")
|
|
} else {
|
|
// Request more data.
|
|
return 0, nil, nil
|
|
}
|
|
}
|
|
|
|
// CollectBinaryShowqFromReader parses Postfix's binary showq format.
|
|
func CollectBinaryShowqFromReader(file io.Reader, ch chan<- prometheus.Metric) error {
|
|
scanner := bufio.NewScanner(file)
|
|
scanner.Split(ScanNullTerminatedEntries)
|
|
|
|
// Histograms tracking the messages by size and age.
|
|
sizeHistogram := prometheus.NewHistogramVec(
|
|
prometheus.HistogramOpts{
|
|
Namespace: "postfix",
|
|
Name: "showq_message_size_bytes",
|
|
Help: "Size of messages in Postfix's message queue, in bytes",
|
|
Buckets: []float64{1e3, 1e4, 1e5, 1e6, 1e7, 1e8, 1e9},
|
|
},
|
|
[]string{"queue"})
|
|
ageHistogram := prometheus.NewHistogramVec(
|
|
prometheus.HistogramOpts{
|
|
Namespace: "postfix",
|
|
Name: "showq_message_age_seconds",
|
|
Help: "Age of messages in Postfix's message queue, in seconds",
|
|
Buckets: []float64{1e1, 1e2, 1e3, 1e4, 1e5, 1e6, 1e7, 1e8},
|
|
},
|
|
[]string{"queue"})
|
|
|
|
// Initialize all queue buckets to zero.
|
|
for _, q := range []string{"active", "deferred", "hold", "incoming", "maildrop"} {
|
|
sizeHistogram.WithLabelValues(q)
|
|
ageHistogram.WithLabelValues(q)
|
|
}
|
|
|
|
now := float64(time.Now().UnixNano()) / 1e9
|
|
queue := "unknown"
|
|
for scanner.Scan() {
|
|
// Parse a key/value entry.
|
|
key := scanner.Text()
|
|
if len(key) == 0 {
|
|
// Empty key means a record separator.
|
|
queue = "unknown"
|
|
continue
|
|
}
|
|
if !scanner.Scan() {
|
|
return fmt.Errorf("key %q does not have a value", key)
|
|
}
|
|
value := scanner.Text()
|
|
|
|
if key == "queue_name" {
|
|
// The name of the message queue.
|
|
queue = value
|
|
} else if key == "size" {
|
|
// Message size in bytes.
|
|
size, err := strconv.ParseFloat(value, 64)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
sizeHistogram.WithLabelValues(queue).Observe(size)
|
|
} else if key == "time" {
|
|
// Message time as a UNIX timestamp.
|
|
utime, err := strconv.ParseFloat(value, 64)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
ageHistogram.WithLabelValues(queue).Observe(now - utime)
|
|
}
|
|
}
|
|
|
|
sizeHistogram.Collect(ch)
|
|
ageHistogram.Collect(ch)
|
|
return scanner.Err()
|
|
}
|
|
|
|
// CollectShowqFromSocket collects Postfix queue statistics from a socket.
|
|
func CollectShowqFromSocket(path string, ch chan<- prometheus.Metric) error {
|
|
fd, err := net.Dial("unix", path)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
defer fd.Close()
|
|
return CollectShowqFromReader(fd, ch)
|
|
}
|
|
|
|
// Patterns for parsing log messages.
|
|
var (
|
|
logLine = regexp.MustCompile(` ?(postfix|opendkim)(/(\w+))?\[\d+\]: (.*)`)
|
|
lmtpPipeSMTPLine = regexp.MustCompile(`, relay=(\S+), .*, delays=([0-9\.]+)/([0-9\.]+)/([0-9\.]+)/([0-9\.]+), `)
|
|
qmgrInsertLine = regexp.MustCompile(`:.*, size=(\d+), nrcpt=(\d+) `)
|
|
smtpStatusDeferredLine = regexp.MustCompile(`, status=deferred`)
|
|
smtpTLSLine = regexp.MustCompile(`^(\S+) TLS connection established to \S+: (\S+) with cipher (\S+) \((\d+)/(\d+) bits\)$`)
|
|
smtpConnectionTimedOut = regexp.MustCompile(`^connect\s+to\s+(.*)\[(.*)\]:(\d+):\s+(Connection timed out)$`)
|
|
smtpdFCrDNSErrorsLine = regexp.MustCompile(`^warning: hostname \S+ does not resolve to address `)
|
|
smtpdProcessesSASLLine = regexp.MustCompile(`: client=.*, sasl_username=(\S+)`)
|
|
smtpdRejectsLine = regexp.MustCompile(`^NOQUEUE: reject: RCPT from \S+: ([0-9]+) `)
|
|
smtpdLostConnectionLine = regexp.MustCompile(`^lost connection after (\w+) from `)
|
|
smtpdSASLAuthenticationFailuresLine = regexp.MustCompile(`^warning: \S+: SASL \S+ authentication failed: `)
|
|
smtpdTLSLine = regexp.MustCompile(`^(\S+) TLS connection established from \S+: (\S+) with cipher (\S+) \((\d+)/(\d+) bits\)$`)
|
|
opendkimSignatureAdded = regexp.MustCompile(`^[\w\d]+: DKIM-Signature field added \(s=(\w+), d=(.*)\)$`)
|
|
)
|
|
|
|
// CollectFromLogline collects metrict from a Postfix log line.
|
|
func (e *PostfixExporter) CollectFromLogLine(line string) {
|
|
// Strip off timestamp, hostname, etc.
|
|
logMatches := logLine.FindStringSubmatch(line)
|
|
|
|
if logMatches == nil {
|
|
// Unknown log entry format.
|
|
e.addToUnsupportedLine(line, "")
|
|
return
|
|
}
|
|
process := logMatches[1]
|
|
remainder := logMatches[4]
|
|
switch process {
|
|
case "postfix":
|
|
// Group patterns to check by Postfix service.
|
|
subprocess := logMatches[3]
|
|
switch subprocess {
|
|
case "cleanup":
|
|
if strings.Contains(remainder, ": message-id=<") {
|
|
e.cleanupProcesses.Inc()
|
|
} else if strings.Contains(remainder, ": reject: ") {
|
|
e.cleanupRejects.Inc()
|
|
} else {
|
|
e.addToUnsupportedLine(line, subprocess)
|
|
}
|
|
case "lmtp":
|
|
if lmtpMatches := lmtpPipeSMTPLine.FindStringSubmatch(remainder); lmtpMatches != nil {
|
|
addToHistogramVec(e.lmtpDelays, lmtpMatches[2], "LMTP pdelay", "before_queue_manager")
|
|
addToHistogramVec(e.lmtpDelays, lmtpMatches[3], "LMTP adelay", "queue_manager")
|
|
addToHistogramVec(e.lmtpDelays, lmtpMatches[4], "LMTP sdelay", "connection_setup")
|
|
addToHistogramVec(e.lmtpDelays, lmtpMatches[5], "LMTP xdelay", "transmission")
|
|
} else {
|
|
e.addToUnsupportedLine(line, subprocess)
|
|
}
|
|
case "pipe":
|
|
if pipeMatches := lmtpPipeSMTPLine.FindStringSubmatch(remainder); pipeMatches != nil {
|
|
addToHistogramVec(e.pipeDelays, pipeMatches[2], "PIPE pdelay", pipeMatches[1], "before_queue_manager")
|
|
addToHistogramVec(e.pipeDelays, pipeMatches[3], "PIPE adelay", pipeMatches[1], "queue_manager")
|
|
addToHistogramVec(e.pipeDelays, pipeMatches[4], "PIPE sdelay", pipeMatches[1], "connection_setup")
|
|
addToHistogramVec(e.pipeDelays, pipeMatches[5], "PIPE xdelay", pipeMatches[1], "transmission")
|
|
} else {
|
|
e.addToUnsupportedLine(line, subprocess)
|
|
}
|
|
case "qmgr":
|
|
if qmgrInsertMatches := qmgrInsertLine.FindStringSubmatch(remainder); qmgrInsertMatches != nil {
|
|
addToHistogram(e.qmgrInsertsSize, qmgrInsertMatches[1], "QMGR size")
|
|
addToHistogram(e.qmgrInsertsNrcpt, qmgrInsertMatches[2], "QMGR nrcpt")
|
|
} else if strings.HasSuffix(remainder, ": removed") {
|
|
e.qmgrRemoves.Inc()
|
|
} else {
|
|
e.addToUnsupportedLine(line, subprocess)
|
|
}
|
|
case "smtp":
|
|
if smtpMatches := lmtpPipeSMTPLine.FindStringSubmatch(remainder); smtpMatches != nil {
|
|
addToHistogramVec(e.smtpDelays, smtpMatches[2], "before_queue_manager")
|
|
addToHistogramVec(e.smtpDelays, smtpMatches[3], "queue_manager")
|
|
addToHistogramVec(e.smtpDelays, smtpMatches[4], "connection_setup")
|
|
addToHistogramVec(e.smtpDelays, smtpMatches[5], "transmission")
|
|
if smtpMatches := smtpStatusDeferredLine.FindStringSubmatch(remainder); smtpMatches != nil {
|
|
e.smtpStatusDeferred.Inc()
|
|
}
|
|
} else if smtpTLSMatches := smtpTLSLine.FindStringSubmatch(remainder); smtpTLSMatches != nil {
|
|
e.smtpTLSConnects.WithLabelValues(smtpTLSMatches[1:]...).Inc()
|
|
} else if smtpMatches := smtpConnectionTimedOut.FindStringSubmatch(remainder); smtpMatches != nil {
|
|
e.smtpConnectionTimedOut.Inc()
|
|
} else {
|
|
e.addToUnsupportedLine(line, subprocess)
|
|
}
|
|
case "smtpd":
|
|
if strings.HasPrefix(remainder, "connect from ") {
|
|
e.smtpdConnects.Inc()
|
|
} else if strings.HasPrefix(remainder, "disconnect from ") {
|
|
e.smtpdDisconnects.Inc()
|
|
} else if smtpdFCrDNSErrorsLine.MatchString(remainder) {
|
|
e.smtpdFCrDNSErrors.Inc()
|
|
} else if smtpdLostConnectionMatches := smtpdLostConnectionLine.FindStringSubmatch(remainder); smtpdLostConnectionMatches != nil {
|
|
e.smtpdLostConnections.WithLabelValues(smtpdLostConnectionMatches[1]).Inc()
|
|
} else if smtpdProcessesSASLMatches := smtpdProcessesSASLLine.FindStringSubmatch(remainder); smtpdProcessesSASLMatches != nil {
|
|
e.smtpdProcesses.WithLabelValues(smtpdProcessesSASLMatches[1]).Inc()
|
|
} else if strings.Contains(logMatches[2], ": client=") {
|
|
e.smtpdProcesses.WithLabelValues("").Inc()
|
|
} else if smtpdRejectsMatches := smtpdRejectsLine.FindStringSubmatch(remainder); smtpdRejectsMatches != nil {
|
|
e.smtpdRejects.WithLabelValues(smtpdRejectsMatches[1]).Inc()
|
|
} else if smtpdSASLAuthenticationFailuresLine.MatchString(remainder) {
|
|
e.smtpdSASLAuthenticationFailures.Inc()
|
|
} else if smtpdTLSMatches := smtpdTLSLine.FindStringSubmatch(remainder); smtpdTLSMatches != nil {
|
|
e.smtpdTLSConnects.WithLabelValues(smtpdTLSMatches[1:]...).Inc()
|
|
} else {
|
|
e.addToUnsupportedLine(line, subprocess)
|
|
}
|
|
default:
|
|
e.addToUnsupportedLine(line, subprocess)
|
|
}
|
|
case "opendkim":
|
|
if opendkimMatches := opendkimSignatureAdded.FindStringSubmatch(remainder); opendkimMatches != nil {
|
|
e.opendkimSignatureAdded.WithLabelValues(opendkimMatches[1], opendkimMatches[2]).Inc()
|
|
} else {
|
|
e.addToUnsupportedLine(line, process)
|
|
}
|
|
default:
|
|
// Unknown log entry format.
|
|
e.addToUnsupportedLine(line, "")
|
|
}
|
|
}
|
|
|
|
func (e *PostfixExporter) addToUnsupportedLine(line string, subprocess string) {
|
|
if e.logUnsupportedLines {
|
|
log.Printf("Unsupported Line: %v", line)
|
|
}
|
|
e.unsupportedLogEntries.WithLabelValues(subprocess).Inc()
|
|
}
|
|
|
|
func addToHistogram(h prometheus.Histogram, value, fieldName string) {
|
|
float, err := strconv.ParseFloat(value, 64)
|
|
if err != nil {
|
|
log.Printf("Couldn't convert value '%s' for %v: %v", value, fieldName, err)
|
|
}
|
|
h.Observe(float)
|
|
}
|
|
func addToHistogramVec(h *prometheus.HistogramVec, value, fieldName string, labels ...string) {
|
|
float, err := strconv.ParseFloat(value, 64)
|
|
if err != nil {
|
|
log.Printf("Couldn't convert value '%s' for %v: %v", value, fieldName, err)
|
|
}
|
|
h.WithLabelValues(labels...).Observe(float)
|
|
}
|
|
|
|
// CollectLogfileFromFile tails a Postfix log file and collects entries from it.
|
|
func (e *PostfixExporter) CollectLogfileFromFile(ctx context.Context) {
|
|
gaugeVec := prometheus.NewGaugeVec(
|
|
prometheus.GaugeOpts{
|
|
Namespace: "postfix",
|
|
Subsystem: "",
|
|
Name: "up",
|
|
Help: "Whether scraping Postfix's metrics was successful.",
|
|
},
|
|
[]string{"path"})
|
|
gauge := gaugeVec.WithLabelValues(e.tailer.Filename)
|
|
for {
|
|
select {
|
|
case line := <-e.tailer.Lines:
|
|
e.CollectFromLogLine(line.Text)
|
|
case <-ctx.Done():
|
|
gauge.Set(0)
|
|
return
|
|
}
|
|
gauge.Set(1)
|
|
}
|
|
}
|
|
|
|
// NewPostfixExporter creates a new Postfix exporter instance.
|
|
func NewPostfixExporter(showqPath string, logfilePath string, journal *Journal, logUnsupportedLines bool) (*PostfixExporter, error) {
|
|
var tailer *tail.Tail
|
|
if logfilePath != "" {
|
|
var err error
|
|
tailer, err = tail.TailFile(logfilePath, tail.Config{
|
|
ReOpen: true, // reopen the file if it's rotated
|
|
MustExist: true, // fail immediately if the file is missing or has incorrect permissions
|
|
Follow: true, // run in follow mode
|
|
})
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
}
|
|
return &PostfixExporter{
|
|
logUnsupportedLines: logUnsupportedLines,
|
|
showqPath: showqPath,
|
|
tailer: tailer,
|
|
journal: journal,
|
|
|
|
cleanupProcesses: prometheus.NewCounter(prometheus.CounterOpts{
|
|
Namespace: "postfix",
|
|
Name: "cleanup_messages_processed_total",
|
|
Help: "Total number of messages processed by cleanup.",
|
|
}),
|
|
cleanupRejects: prometheus.NewCounter(prometheus.CounterOpts{
|
|
Namespace: "postfix",
|
|
Name: "cleanup_messages_rejected_total",
|
|
Help: "Total number of messages rejected by cleanup.",
|
|
}),
|
|
cleanupNotAccepted: prometheus.NewCounter(prometheus.CounterOpts{
|
|
Namespace: "postfix",
|
|
Name: "cleanup_messages_not_accepted_total",
|
|
Help: "Total number of messages not accepted by cleanup.",
|
|
}),
|
|
lmtpDelays: prometheus.NewHistogramVec(
|
|
prometheus.HistogramOpts{
|
|
Namespace: "postfix",
|
|
Name: "lmtp_delivery_delay_seconds",
|
|
Help: "LMTP message processing time in seconds.",
|
|
Buckets: []float64{1e-3, 1e-2, 1e-1, 1e0, 1e1, 1e2, 1e3},
|
|
},
|
|
[]string{"stage"}),
|
|
pipeDelays: prometheus.NewHistogramVec(
|
|
prometheus.HistogramOpts{
|
|
Namespace: "postfix",
|
|
Name: "pipe_delivery_delay_seconds",
|
|
Help: "Pipe message processing time in seconds.",
|
|
Buckets: []float64{1e-3, 1e-2, 1e-1, 1e0, 1e1, 1e2, 1e3},
|
|
},
|
|
[]string{"relay", "stage"}),
|
|
qmgrInsertsNrcpt: prometheus.NewHistogram(prometheus.HistogramOpts{
|
|
Namespace: "postfix",
|
|
Name: "qmgr_messages_inserted_receipients",
|
|
Help: "Number of receipients per message inserted into the mail queues.",
|
|
Buckets: []float64{1, 2, 4, 8, 16, 32, 64, 128},
|
|
}),
|
|
qmgrInsertsSize: prometheus.NewHistogram(prometheus.HistogramOpts{
|
|
Namespace: "postfix",
|
|
Name: "qmgr_messages_inserted_size_bytes",
|
|
Help: "Size of messages inserted into the mail queues in bytes.",
|
|
Buckets: []float64{1e3, 1e4, 1e5, 1e6, 1e7, 1e8, 1e9},
|
|
}),
|
|
qmgrRemoves: prometheus.NewCounter(prometheus.CounterOpts{
|
|
Namespace: "postfix",
|
|
Name: "qmgr_messages_removed_total",
|
|
Help: "Total number of messages removed from mail queues.",
|
|
}),
|
|
smtpDelays: prometheus.NewHistogramVec(
|
|
prometheus.HistogramOpts{
|
|
Namespace: "postfix",
|
|
Name: "smtp_delivery_delay_seconds",
|
|
Help: "SMTP message processing time in seconds.",
|
|
Buckets: []float64{1e-3, 1e-2, 1e-1, 1e0, 1e1, 1e2, 1e3},
|
|
},
|
|
[]string{"stage"}),
|
|
smtpTLSConnects: prometheus.NewCounterVec(
|
|
prometheus.CounterOpts{
|
|
Namespace: "postfix",
|
|
Name: "smtp_tls_connections_total",
|
|
Help: "Total number of outgoing TLS connections.",
|
|
},
|
|
[]string{"trust", "protocol", "cipher", "secret_bits", "algorithm_bits"}),
|
|
smtpDeferreds: prometheus.NewCounter(prometheus.CounterOpts{
|
|
Namespace: "postfix",
|
|
Name: "smtp_deferred_messages_total",
|
|
Help: "Total number of messages that have been deferred on SMTP.",
|
|
}),
|
|
smtpConnectionTimedOut: prometheus.NewCounter(prometheus.CounterOpts{
|
|
Namespace: "postfix",
|
|
Name: "smtp_connection_timed_out_total",
|
|
Help: "Total number of messages that have been deferred on SMTP.",
|
|
}),
|
|
smtpdConnects: prometheus.NewCounter(prometheus.CounterOpts{
|
|
Namespace: "postfix",
|
|
Name: "smtpd_connects_total",
|
|
Help: "Total number of incoming connections.",
|
|
}),
|
|
smtpdDisconnects: prometheus.NewCounter(prometheus.CounterOpts{
|
|
Namespace: "postfix",
|
|
Name: "smtpd_disconnects_total",
|
|
Help: "Total number of incoming disconnections.",
|
|
}),
|
|
smtpdFCrDNSErrors: prometheus.NewCounter(prometheus.CounterOpts{
|
|
Namespace: "postfix",
|
|
Name: "smtpd_forward_confirmed_reverse_dns_errors_total",
|
|
Help: "Total number of connections for which forward-confirmed DNS cannot be resolved.",
|
|
}),
|
|
smtpdLostConnections: prometheus.NewCounterVec(
|
|
prometheus.CounterOpts{
|
|
Namespace: "postfix",
|
|
Name: "smtpd_connections_lost_total",
|
|
Help: "Total number of connections lost.",
|
|
},
|
|
[]string{"after_stage"}),
|
|
smtpdProcesses: prometheus.NewCounterVec(
|
|
prometheus.CounterOpts{
|
|
Namespace: "postfix",
|
|
Name: "smtpd_messages_processed_total",
|
|
Help: "Total number of messages processed.",
|
|
},
|
|
[]string{"sasl_username"}),
|
|
smtpdRejects: prometheus.NewCounterVec(
|
|
prometheus.CounterOpts{
|
|
Namespace: "postfix",
|
|
Name: "smtpd_messages_rejected_total",
|
|
Help: "Total number of NOQUEUE rejects.",
|
|
},
|
|
[]string{"code"}),
|
|
smtpdSASLAuthenticationFailures: prometheus.NewCounter(prometheus.CounterOpts{
|
|
Namespace: "postfix",
|
|
Name: "smtpd_sasl_authentication_failures_total",
|
|
Help: "Total number of SASL authentication failures.",
|
|
}),
|
|
smtpdTLSConnects: prometheus.NewCounterVec(
|
|
prometheus.CounterOpts{
|
|
Namespace: "postfix",
|
|
Name: "smtpd_tls_connections_total",
|
|
Help: "Total number of incoming TLS connections.",
|
|
},
|
|
[]string{"trust", "protocol", "cipher", "secret_bits", "algorithm_bits"}),
|
|
unsupportedLogEntries: prometheus.NewCounterVec(
|
|
prometheus.CounterOpts{
|
|
Namespace: "postfix",
|
|
Name: "unsupported_log_entries_total",
|
|
Help: "Log entries that could not be processed.",
|
|
},
|
|
[]string{"service"}),
|
|
smtpStatusDeferred: prometheus.NewCounter(prometheus.CounterOpts{
|
|
Namespace: "postfix",
|
|
Name: "smtp_status_deferred",
|
|
Help: "Total number of messages deferred.",
|
|
}),
|
|
opendkimSignatureAdded: prometheus.NewCounterVec(
|
|
prometheus.CounterOpts{
|
|
Namespace: "opendkim",
|
|
Name: "signatures_added_total",
|
|
Help: "Total number of messages signed.",
|
|
},
|
|
[]string{"subject", "domain"},
|
|
),
|
|
}, nil
|
|
}
|
|
|
|
// Describe the Prometheus metrics that are going to be exported.
|
|
func (e *PostfixExporter) Describe(ch chan<- *prometheus.Desc) {
|
|
ch <- postfixUpDesc
|
|
|
|
ch <- e.cleanupProcesses.Desc()
|
|
ch <- e.cleanupRejects.Desc()
|
|
ch <- e.cleanupNotAccepted.Desc()
|
|
e.lmtpDelays.Describe(ch)
|
|
e.pipeDelays.Describe(ch)
|
|
ch <- e.qmgrInsertsNrcpt.Desc()
|
|
ch <- e.qmgrInsertsSize.Desc()
|
|
ch <- e.qmgrRemoves.Desc()
|
|
e.smtpDelays.Describe(ch)
|
|
e.smtpTLSConnects.Describe(ch)
|
|
ch <- e.smtpDeferreds.Desc()
|
|
ch <- e.smtpdConnects.Desc()
|
|
ch <- e.smtpdDisconnects.Desc()
|
|
ch <- e.smtpdFCrDNSErrors.Desc()
|
|
e.smtpdLostConnections.Describe(ch)
|
|
e.smtpdProcesses.Describe(ch)
|
|
e.smtpdRejects.Describe(ch)
|
|
ch <- e.smtpdSASLAuthenticationFailures.Desc()
|
|
e.smtpdTLSConnects.Describe(ch)
|
|
ch <- e.smtpStatusDeferred.Desc()
|
|
e.unsupportedLogEntries.Describe(ch)
|
|
}
|
|
|
|
func (e *PostfixExporter) foreverCollectFromJournal(ctx context.Context) {
|
|
gauge := prometheus.NewGaugeVec(
|
|
prometheus.GaugeOpts{
|
|
Namespace: "postfix",
|
|
Subsystem: "",
|
|
Name: "up",
|
|
Help: "Whether scraping Postfix's metrics was successful.",
|
|
},
|
|
[]string{"path"}).WithLabelValues(e.journal.Path)
|
|
select {
|
|
case <-ctx.Done():
|
|
gauge.Set(0)
|
|
return
|
|
default:
|
|
err := e.CollectLogfileFromJournal()
|
|
if err != nil {
|
|
log.Printf("Couldn't read journal: %v", err)
|
|
gauge.Set(0)
|
|
} else {
|
|
gauge.Set(1)
|
|
}
|
|
}
|
|
}
|
|
|
|
func (e *PostfixExporter) StartMetricCollection(ctx context.Context) {
|
|
if e.journal != nil {
|
|
e.foreverCollectFromJournal(ctx)
|
|
} else {
|
|
e.CollectLogfileFromFile(ctx)
|
|
}
|
|
|
|
prometheus.NewGaugeVec(
|
|
prometheus.GaugeOpts{
|
|
Namespace: "postfix",
|
|
Subsystem: "",
|
|
Name: "up",
|
|
Help: "Whether scraping Postfix's metrics was successful.",
|
|
},
|
|
[]string{"path"})
|
|
return
|
|
}
|
|
|
|
// Collect metrics from Postfix's showq socket and its log file.
|
|
func (e *PostfixExporter) Collect(ch chan<- prometheus.Metric) {
|
|
err := CollectShowqFromSocket(e.showqPath, ch)
|
|
if err == nil {
|
|
ch <- prometheus.MustNewConstMetric(
|
|
postfixUpDesc,
|
|
prometheus.GaugeValue,
|
|
1.0,
|
|
e.showqPath)
|
|
} else {
|
|
log.Printf("Failed to scrape showq socket: %s", err)
|
|
ch <- prometheus.MustNewConstMetric(
|
|
postfixUpDesc,
|
|
prometheus.GaugeValue,
|
|
0.0,
|
|
e.showqPath)
|
|
}
|
|
|
|
ch <- e.cleanupProcesses
|
|
ch <- e.cleanupRejects
|
|
ch <- e.cleanupNotAccepted
|
|
e.lmtpDelays.Collect(ch)
|
|
e.pipeDelays.Collect(ch)
|
|
ch <- e.qmgrInsertsNrcpt
|
|
ch <- e.qmgrInsertsSize
|
|
ch <- e.qmgrRemoves
|
|
e.smtpDelays.Collect(ch)
|
|
e.smtpTLSConnects.Collect(ch)
|
|
ch <- e.smtpDeferreds
|
|
ch <- e.smtpdConnects
|
|
ch <- e.smtpdDisconnects
|
|
ch <- e.smtpdFCrDNSErrors
|
|
e.smtpdLostConnections.Collect(ch)
|
|
e.smtpdProcesses.Collect(ch)
|
|
e.smtpdRejects.Collect(ch)
|
|
ch <- e.smtpdSASLAuthenticationFailures
|
|
e.smtpdTLSConnects.Collect(ch)
|
|
ch <- e.smtpStatusDeferred
|
|
e.unsupportedLogEntries.Collect(ch)
|
|
ch <- e.smtpConnectionTimedOut
|
|
e.opendkimSignatureAdded.Collect(ch)
|
|
}
|