Node_Exporter/collector/tapestats_linux.go
Luiz Angelo Daros de Luca 00aa2f34ce Add tapestats to collect tape devices statistics
It is based on diskstats to allow metrics reuse by simply
s/disk/tape/ the query.

Signed-off-by: Luiz Angelo Daros de Luca <luizluca@gmail.com>
2021-07-09 21:01:08 -03:00

152 lines
6.4 KiB
Go

// Copyright 2015 The Prometheus Authors
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// +build !notapestats
package collector
import (
"fmt"
"os"
"regexp"
"github.com/go-kit/log"
"github.com/go-kit/log/level"
"github.com/prometheus/client_golang/prometheus"
"github.com/prometheus/procfs/sysfs"
"gopkg.in/alecthomas/kingpin.v2"
)
// ignoredTapeDevices is the value of the collector.tapestats.ignored-devices
// command-line flag: a regular expression selecting tape devices that the
// tapestats collector should skip. It defaults to "^$".
var ignoredTapeDevices = kingpin.Flag(
	"collector.tapestats.ignored-devices",
	"Regexp of devices to ignore for tapestats.",
).Default("^$").String()
type tapestatsCollector struct {
ignoredDevicesPattern *regexp.Regexp
ioNow *prometheus.Desc
ioTimeSeconds *prometheus.Desc
othersCompletedTotal *prometheus.Desc
readByteTotal *prometheus.Desc
readsCompletedTotal *prometheus.Desc
readTimeSeconds *prometheus.Desc
writtenByteTotal *prometheus.Desc
writesCompletedTotal *prometheus.Desc
writeTimeSeconds *prometheus.Desc
residualTotal *prometheus.Desc
fs sysfs.FS
logger log.Logger
}
// init registers the tapestats collector under its name, using the
// package's defaultEnabled setting and NewTapestatsCollector as factory.
func init() {
	const collectorName = "tapestats"

	registerCollector(collectorName, defaultEnabled, NewTapestatsCollector)
}
// NewTapestatsCollector returns a new Collector exposing tape device stats.
// Docs from https://www.kernel.org/doc/html/latest/scsi/st.html#sysfs-and-statistics-for-tape-devices
//
// It opens sysfs at *sysPath and compiles the ignored-devices flag value.
// An error is returned when sysfs cannot be opened or when the flag value is
// not a valid regular expression. Every metric descriptor carries a single
// "device" label.
func NewTapestatsCollector(logger log.Logger) (Collector, error) {
	var tapeLabelNames = []string{"device"}

	fs, err := sysfs.NewFS(*sysPath)
	if err != nil {
		return nil, fmt.Errorf("failed to open sysfs: %w", err)
	}

	// The pattern comes from a command-line flag, so a malformed value is a
	// configuration error to report to the caller rather than a panic.
	ignoredDevicesPattern, err := regexp.Compile(*ignoredTapeDevices)
	if err != nil {
		return nil, fmt.Errorf("invalid collector.tapestats.ignored-devices pattern %q: %w", *ignoredTapeDevices, err)
	}

	tapeSubsystem := "tape"

	return &tapestatsCollector{
		ignoredDevicesPattern: ignoredDevicesPattern,

		ioNow: prometheus.NewDesc(
			prometheus.BuildFQName(namespace, tapeSubsystem, "io_now"),
			"The number of I/Os currently outstanding to this device.",
			tapeLabelNames, nil,
		),

		ioTimeSeconds: prometheus.NewDesc(
			prometheus.BuildFQName(namespace, tapeSubsystem, "io_time_seconds_total"),
			"The amount of time spent waiting for all I/O to complete (including read and write). This includes tape movement commands such as seeking between file or set marks and implicit tape movement such as when rewind on close tape devices are used.",
			tapeLabelNames, nil,
		),

		othersCompletedTotal: prometheus.NewDesc(
			prometheus.BuildFQName(namespace, tapeSubsystem, "io_others_total"),
			"The number of I/Os issued to the tape drive other than read or write commands. The time taken to complete these commands uses the following calculation io_time_seconds_total-read_time_seconds_total-write_time_seconds_total",
			tapeLabelNames, nil,
		),

		readByteTotal: prometheus.NewDesc(
			prometheus.BuildFQName(namespace, tapeSubsystem, "read_bytes_total"),
			"The number of bytes read from the tape drive.",
			tapeLabelNames, nil,
		),

		readsCompletedTotal: prometheus.NewDesc(
			prometheus.BuildFQName(namespace, tapeSubsystem, "reads_completed_total"),
			"The number of read requests issued to the tape drive.",
			tapeLabelNames, nil,
		),

		readTimeSeconds: prometheus.NewDesc(
			prometheus.BuildFQName(namespace, tapeSubsystem, "read_time_seconds_total"),
			"The amount of time spent waiting for read requests to complete.",
			tapeLabelNames, nil,
		),

		writtenByteTotal: prometheus.NewDesc(
			prometheus.BuildFQName(namespace, tapeSubsystem, "written_bytes_total"),
			"The number of bytes written to the tape drive.",
			tapeLabelNames, nil,
		),

		writesCompletedTotal: prometheus.NewDesc(
			prometheus.BuildFQName(namespace, tapeSubsystem, "writes_completed_total"),
			"The number of write requests issued to the tape drive.",
			tapeLabelNames, nil,
		),

		writeTimeSeconds: prometheus.NewDesc(
			prometheus.BuildFQName(namespace, tapeSubsystem, "write_time_seconds_total"),
			"The amount of time spent waiting for write requests to complete.",
			tapeLabelNames, nil,
		),

		// NOTE(review): "thean" below is a typo for "than". It is left
		// untouched because the help text is passed verbatim to the metric
		// descriptor; fix it together with any expected-output fixtures.
		residualTotal: prometheus.NewDesc(
			prometheus.BuildFQName(namespace, tapeSubsystem, "residual_total"),
			"The number of times during a read or write we found the residual amount to be non-zero. This should mean that a program is issuing a read larger thean the block size on tape. For write not all data made it to tape.",
			tapeLabelNames, nil,
		),

		logger: logger,
		fs:     fs,
	}, nil
}
// Update reads the SCSI tape class from sysfs and sends one sample per
// metric descriptor on ch for every tape device whose name does not match
// the ignored-devices pattern.
//
// It returns ErrNoData when the tape class does not exist, and otherwise
// wraps any error from reading the class so callers can inspect the cause.
func (c *tapestatsCollector) Update(ch chan<- prometheus.Metric) error {
	// The counters used for the *_seconds_total metrics are in nanoseconds.
	const secondsPerNanosecond = 0.000000001

	tapes, err := c.fs.SCSITapeClass()
	if err != nil {
		if os.IsNotExist(err) {
			level.Debug(c.logger).Log("msg", "scsi_tape stats not found, skipping")
			return ErrNoData
		}
		// %w (not %s) keeps the underlying error reachable via errors.Is/As.
		return fmt.Errorf("error obtaining SCSITape class info: %w", err)
	}

	for _, tape := range tapes {
		if c.ignoredDevicesPattern.MatchString(tape.Name) {
			level.Debug(c.logger).Log("msg", "Ignoring device", "device", tape.Name)
			continue
		}

		ch <- prometheus.MustNewConstMetric(c.ioNow, prometheus.GaugeValue, float64(tape.Counters.InFlight), tape.Name)
		ch <- prometheus.MustNewConstMetric(c.ioTimeSeconds, prometheus.CounterValue, float64(tape.Counters.IoNs)*secondsPerNanosecond, tape.Name)
		ch <- prometheus.MustNewConstMetric(c.othersCompletedTotal, prometheus.CounterValue, float64(tape.Counters.OtherCnt), tape.Name)
		ch <- prometheus.MustNewConstMetric(c.readByteTotal, prometheus.CounterValue, float64(tape.Counters.ReadByteCnt), tape.Name)
		ch <- prometheus.MustNewConstMetric(c.readsCompletedTotal, prometheus.CounterValue, float64(tape.Counters.ReadCnt), tape.Name)
		ch <- prometheus.MustNewConstMetric(c.readTimeSeconds, prometheus.CounterValue, float64(tape.Counters.ReadNs)*secondsPerNanosecond, tape.Name)
		ch <- prometheus.MustNewConstMetric(c.residualTotal, prometheus.CounterValue, float64(tape.Counters.ResidCnt), tape.Name)
		ch <- prometheus.MustNewConstMetric(c.writtenByteTotal, prometheus.CounterValue, float64(tape.Counters.WriteByteCnt), tape.Name)
		ch <- prometheus.MustNewConstMetric(c.writesCompletedTotal, prometheus.CounterValue, float64(tape.Counters.WriteCnt), tape.Name)
		ch <- prometheus.MustNewConstMetric(c.writeTimeSeconds, prometheus.CounterValue, float64(tape.Counters.WriteNs)*secondsPerNanosecond, tape.Name)
	}

	return nil
}