394 lines
9.1 KiB
Go
394 lines
9.1 KiB
Go
package mongodb
|
|
|
|
import (
|
|
"context"
|
|
"errors"
|
|
"fmt"
|
|
"strconv"
|
|
"strings"
|
|
"time"
|
|
|
|
"go.mongodb.org/mongo-driver/bson"
|
|
"go.mongodb.org/mongo-driver/bson/primitive"
|
|
"go.mongodb.org/mongo-driver/mongo"
|
|
"go.mongodb.org/mongo-driver/mongo/options"
|
|
|
|
"github.com/influxdata/telegraf"
|
|
)
|
|
|
|
type Server struct {
|
|
client *mongo.Client
|
|
hostname string
|
|
lastResult *MongoStatus
|
|
|
|
Log telegraf.Logger
|
|
}
|
|
|
|
func (s *Server) getDefaultTags() map[string]string {
|
|
tags := make(map[string]string)
|
|
tags["hostname"] = s.hostname
|
|
return tags
|
|
}
|
|
|
|
type oplogEntry struct {
|
|
Timestamp primitive.Timestamp `bson:"ts"`
|
|
}
|
|
|
|
func IsAuthorization(err error) bool {
|
|
return strings.Contains(err.Error(), "not authorized")
|
|
}
|
|
|
|
func (s *Server) ping() error {
|
|
ctx, cancel := context.WithTimeout(context.Background(), 1*time.Second)
|
|
defer cancel()
|
|
|
|
return s.client.Ping(ctx, nil)
|
|
}
|
|
|
|
func (s *Server) authLog(err error) {
|
|
if IsAuthorization(err) {
|
|
s.Log.Debug(err.Error())
|
|
} else {
|
|
s.Log.Error(err.Error())
|
|
}
|
|
}
|
|
|
|
func (s *Server) runCommand(database string, cmd interface{}, result interface{}) error {
|
|
r := s.client.Database(database).RunCommand(context.Background(), cmd)
|
|
if r.Err() != nil {
|
|
return r.Err()
|
|
}
|
|
return r.Decode(result)
|
|
}
|
|
|
|
func (s *Server) gatherServerStatus() (*ServerStatus, error) {
|
|
serverStatus := &ServerStatus{}
|
|
err := s.runCommand("admin", bson.D{
|
|
{
|
|
Key: "serverStatus",
|
|
Value: 1,
|
|
},
|
|
{
|
|
Key: "recordStats",
|
|
Value: 0,
|
|
},
|
|
}, serverStatus)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
return serverStatus, nil
|
|
}
|
|
|
|
func (s *Server) gatherReplSetStatus() (*ReplSetStatus, error) {
|
|
replSetStatus := &ReplSetStatus{}
|
|
err := s.runCommand("admin", bson.D{
|
|
{
|
|
Key: "replSetGetStatus",
|
|
Value: 1,
|
|
},
|
|
}, replSetStatus)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
return replSetStatus, nil
|
|
}
|
|
|
|
func (s *Server) gatherTopStatData() (*TopStats, error) {
|
|
var dest map[string]interface{}
|
|
err := s.runCommand("admin", bson.D{
|
|
{
|
|
Key: "top",
|
|
Value: 1,
|
|
},
|
|
}, &dest)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("failed running admin cmd: %w", err)
|
|
}
|
|
|
|
totals, ok := dest["totals"].(map[string]interface{})
|
|
if !ok {
|
|
return nil, errors.New("collection totals not found or not a map")
|
|
}
|
|
delete(totals, "note")
|
|
|
|
recorded, err := bson.Marshal(totals)
|
|
if err != nil {
|
|
return nil, errors.New("unable to marshal totals")
|
|
}
|
|
|
|
topInfo := make(map[string]TopStatCollection)
|
|
if err := bson.Unmarshal(recorded, &topInfo); err != nil {
|
|
return nil, fmt.Errorf("failed unmarshalling records: %w", err)
|
|
}
|
|
|
|
return &TopStats{Totals: topInfo}, nil
|
|
}
|
|
|
|
func (s *Server) gatherClusterStatus() (*ClusterStatus, error) {
|
|
chunkCount, err := s.client.Database("config").Collection("chunks").CountDocuments(context.Background(), bson.M{"jumbo": true})
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return &ClusterStatus{
|
|
JumboChunksCount: chunkCount,
|
|
}, nil
|
|
}
|
|
|
|
func poolStatsCommand(version string) (string, error) {
|
|
majorPart := string(version[0])
|
|
major, err := strconv.ParseInt(majorPart, 10, 64)
|
|
if err != nil {
|
|
return "", err
|
|
}
|
|
|
|
if major >= 5 {
|
|
return "connPoolStats", nil
|
|
}
|
|
return "shardConnPoolStats", nil
|
|
}
|
|
|
|
func (s *Server) gatherShardConnPoolStats(version string) (*ShardStats, error) {
|
|
command, err := poolStatsCommand(version)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
shardStats := &ShardStats{}
|
|
err = s.runCommand("admin", bson.D{
|
|
{
|
|
Key: command,
|
|
Value: 1,
|
|
},
|
|
}, &shardStats)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
return shardStats, nil
|
|
}
|
|
|
|
func (s *Server) gatherDBStats(name string) (*Db, error) {
|
|
stats := &DbStatsData{}
|
|
err := s.runCommand(name, bson.D{
|
|
{
|
|
Key: "dbStats",
|
|
Value: 1,
|
|
},
|
|
}, stats)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return &Db{
|
|
Name: name,
|
|
DbStatsData: stats,
|
|
}, nil
|
|
}
|
|
|
|
func (s *Server) getOplogReplLag(collection string) (*OplogStats, error) {
|
|
query := bson.M{"ts": bson.M{"$exists": true}}
|
|
|
|
var first oplogEntry
|
|
firstResult := s.client.Database("local").Collection(collection).FindOne(context.Background(), query, options.FindOne().SetSort(bson.M{"$natural": 1}))
|
|
if firstResult.Err() != nil {
|
|
return nil, firstResult.Err()
|
|
}
|
|
if err := firstResult.Decode(&first); err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
var last oplogEntry
|
|
lastResult := s.client.Database("local").Collection(collection).FindOne(context.Background(), query, options.FindOne().SetSort(bson.M{"$natural": -1}))
|
|
if lastResult.Err() != nil {
|
|
return nil, lastResult.Err()
|
|
}
|
|
if err := lastResult.Decode(&last); err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
firstTime := time.Unix(int64(first.Timestamp.T), 0)
|
|
lastTime := time.Unix(int64(last.Timestamp.T), 0)
|
|
stats := &OplogStats{
|
|
TimeDiff: int64(lastTime.Sub(firstTime).Seconds()),
|
|
}
|
|
return stats, nil
|
|
}
|
|
|
|
// The "oplog.rs" collection is stored on all replica set members.
|
|
//
|
|
// The "oplog.$main" collection is created on the master node of a
|
|
// master-slave replicated deployment. As of MongoDB 3.2, master-slave
|
|
// replication has been deprecated.
|
|
func (s *Server) gatherOplogStats() (*OplogStats, error) {
|
|
stats, err := s.getOplogReplLag("oplog.rs")
|
|
if err == nil {
|
|
return stats, nil
|
|
}
|
|
|
|
return s.getOplogReplLag("oplog.$main")
|
|
}
|
|
|
|
func (s *Server) gatherCollectionStats(colStatsDbs []string) (*ColStats, error) {
|
|
names, err := s.client.ListDatabaseNames(context.Background(), bson.D{})
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
results := &ColStats{}
|
|
for _, dbName := range names {
|
|
if stringInSlice(dbName, colStatsDbs) || len(colStatsDbs) == 0 {
|
|
// skip views as they fail on collStats below
|
|
filter := bson.M{"type": bson.M{"$in": bson.A{"collection", "timeseries"}}}
|
|
|
|
var colls []string
|
|
colls, err = s.client.Database(dbName).ListCollectionNames(context.Background(), filter)
|
|
if err != nil {
|
|
s.Log.Errorf("Error getting collection names: %s", err.Error())
|
|
continue
|
|
}
|
|
for _, colName := range colls {
|
|
colStatLine := &ColStatsData{}
|
|
err = s.runCommand(dbName, bson.D{
|
|
{
|
|
Key: "collStats",
|
|
Value: colName,
|
|
},
|
|
}, colStatLine)
|
|
if err != nil {
|
|
s.authLog(fmt.Errorf("error getting col stats from %q: %w", colName, err))
|
|
continue
|
|
}
|
|
collection := &Collection{
|
|
Name: colName,
|
|
DbName: dbName,
|
|
ColStatsData: colStatLine,
|
|
}
|
|
results.Collections = append(results.Collections, *collection)
|
|
}
|
|
}
|
|
}
|
|
return results, nil
|
|
}
|
|
|
|
func (s *Server) gatherData(
|
|
acc telegraf.Accumulator,
|
|
gatherClusterStatus bool,
|
|
gatherDbStats bool,
|
|
gatherColStats bool,
|
|
gatherTopStat bool,
|
|
colStatsDbs []string,
|
|
) error {
|
|
serverStatus, err := s.gatherServerStatus()
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
// Get replica set status, an error indicates that the server is not a
|
|
// member of a replica set.
|
|
replSetStatus, err := s.gatherReplSetStatus()
|
|
if err != nil {
|
|
s.Log.Debugf("Unable to gather replica set status: %s", err.Error())
|
|
}
|
|
|
|
// Gather the oplog if we are a member of a replica set. Non-replica set
|
|
// members do not have the oplog collections.
|
|
var oplogStats *OplogStats
|
|
if replSetStatus != nil {
|
|
oplogStats, err = s.gatherOplogStats()
|
|
if err != nil {
|
|
s.authLog(fmt.Errorf("unable to get oplog stats: %w", err))
|
|
}
|
|
}
|
|
|
|
var clusterStatus *ClusterStatus
|
|
if gatherClusterStatus {
|
|
status, err := s.gatherClusterStatus()
|
|
if err != nil {
|
|
s.Log.Debugf("Unable to gather cluster status: %s", err.Error())
|
|
}
|
|
clusterStatus = status
|
|
}
|
|
|
|
shardStats, err := s.gatherShardConnPoolStats(serverStatus.Version)
|
|
if err != nil {
|
|
s.authLog(fmt.Errorf("unable to gather shard connection pool stats: %w", err))
|
|
}
|
|
|
|
var collectionStats *ColStats
|
|
if gatherColStats {
|
|
stats, err := s.gatherCollectionStats(colStatsDbs)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
collectionStats = stats
|
|
}
|
|
|
|
dbStats := &DbStats{}
|
|
if gatherDbStats {
|
|
names, err := s.client.ListDatabaseNames(context.Background(), bson.D{})
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
for _, name := range names {
|
|
db, err := s.gatherDBStats(name)
|
|
if err != nil {
|
|
s.Log.Debugf("Error getting db stats from %q: %s", name, err.Error())
|
|
}
|
|
dbStats.Dbs = append(dbStats.Dbs, *db)
|
|
}
|
|
}
|
|
|
|
topStatData := &TopStats{}
|
|
if gatherTopStat {
|
|
topStats, err := s.gatherTopStatData()
|
|
if err != nil {
|
|
s.Log.Debugf("Unable to gather top stat data: %s", err.Error())
|
|
return err
|
|
}
|
|
topStatData = topStats
|
|
}
|
|
|
|
result := &MongoStatus{
|
|
ServerStatus: serverStatus,
|
|
ReplSetStatus: replSetStatus,
|
|
ClusterStatus: clusterStatus,
|
|
DbStats: dbStats,
|
|
ColStats: collectionStats,
|
|
ShardStats: shardStats,
|
|
OplogStats: oplogStats,
|
|
TopStats: topStatData,
|
|
}
|
|
|
|
result.SampleTime = time.Now()
|
|
if s.lastResult != nil && result != nil {
|
|
duration := result.SampleTime.Sub(s.lastResult.SampleTime)
|
|
durationInSeconds := int64(duration.Seconds())
|
|
if durationInSeconds == 0 {
|
|
durationInSeconds = 1
|
|
}
|
|
data := NewMongodbData(
|
|
NewStatLine(*s.lastResult, *result, s.hostname, true, durationInSeconds),
|
|
s.getDefaultTags(),
|
|
)
|
|
data.AddDefaultStats()
|
|
data.AddDbStats()
|
|
data.AddColStats()
|
|
data.AddShardHostStats()
|
|
data.AddTopStats()
|
|
data.flush(acc)
|
|
}
|
|
|
|
s.lastResult = result
|
|
return nil
|
|
}
|
|
|
|
func stringInSlice(a string, list []string) bool {
|
|
for _, b := range list {
|
|
if b == a {
|
|
return true
|
|
}
|
|
}
|
|
return false
|
|
}
|