mirror of
https://gitee.com/rainbond/Rainbond.git
synced 2024-12-03 04:07:51 +08:00
200 lines
6.3 KiB
Go
200 lines
6.3 KiB
Go
// Copyright (C) 2014-2018 Goodrain Co., Ltd.
// RAINBOND, Application Management Platform

// This program is free software: you can redistribute it and/or modify
// it under the terms of the GNU General Public License as published by
// the Free Software Foundation, either version 3 of the License, or
// (at your option) any later version. For any non-GPL usage of Rainbond,
// one or multiple Commercial Licenses authorized by Goodrain Co., Ltd.
// must be obtained first.

// This program is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU General Public License for more details.

// You should have received a copy of the GNU General Public License
// along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
package collector
|
|
|
|
import (
|
|
"os"
|
|
"strings"
|
|
"time"
|
|
|
|
"github.com/goodrain/rainbond/db/model"
|
|
|
|
"github.com/Sirupsen/logrus"
|
|
status "github.com/goodrain/rainbond/appruntimesync/client"
|
|
"github.com/goodrain/rainbond/db"
|
|
"github.com/prometheus/client_golang/prometheus"
|
|
"github.com/goodrain/rainbond/worker/discover"
|
|
)
|
|
|
|
//Exporter 收集器
|
|
type Exporter struct {
|
|
dsn string
|
|
error prometheus.Gauge
|
|
totalScrapes prometheus.Counter
|
|
scrapeErrors *prometheus.CounterVec
|
|
memoryUse *prometheus.GaugeVec
|
|
fsUse *prometheus.GaugeVec
|
|
workerUp prometheus.Gauge
|
|
dbmanager db.Manager
|
|
statusManager *status.AppRuntimeSyncClient
|
|
healthStatus prometheus.Gauge
|
|
taskNum prometheus.Gauge
|
|
taskError prometheus.Gauge
|
|
}
|
|
|
|
var scrapeDurationDesc = prometheus.NewDesc(
|
|
prometheus.BuildFQName(namespace, "exporter", "collector_duration_seconds"),
|
|
"Collector time duration.",
|
|
[]string{"collector"}, nil,
|
|
)
|
|
|
|
//Describe Describe
|
|
func (e *Exporter) Describe(ch chan<- *prometheus.Desc) {
|
|
metricCh := make(chan prometheus.Metric)
|
|
doneCh := make(chan struct{})
|
|
|
|
go func() {
|
|
for m := range metricCh {
|
|
ch <- m.Desc()
|
|
}
|
|
close(doneCh)
|
|
}()
|
|
|
|
e.Collect(metricCh)
|
|
close(metricCh)
|
|
<-doneCh
|
|
}
|
|
|
|
// Collect implements prometheus.Collector.
|
|
func (e *Exporter) Collect(ch chan<- prometheus.Metric) {
|
|
e.scrape(ch)
|
|
|
|
ch <- e.totalScrapes
|
|
ch <- e.error
|
|
e.fsUse.Collect(ch)
|
|
e.memoryUse.Collect(ch)
|
|
e.scrapeErrors.Collect(ch)
|
|
ch <- e.workerUp
|
|
}
|
|
|
|
func (e *Exporter) scrape(ch chan<- prometheus.Metric) {
|
|
e.totalScrapes.Inc()
|
|
var err error
|
|
scrapeTime := time.Now()
|
|
services, err := e.dbmanager.TenantServiceDao().GetAllServices()
|
|
if err != nil {
|
|
logrus.Errorln("Error scraping for tenant service when select db :", err)
|
|
e.scrapeErrors.WithLabelValues("db.getservices").Inc()
|
|
e.error.Set(1)
|
|
}
|
|
status, err := e.statusManager.GetNeedBillingStatus()
|
|
if err != nil {
|
|
logrus.Errorln("Error scraping for tenant service when select db :", err)
|
|
e.scrapeErrors.WithLabelValues("db.getservices").Inc()
|
|
e.error.Set(1)
|
|
}
|
|
localPath := os.Getenv("LOCAL_DATA_PATH")
|
|
sharePath := os.Getenv("SHARE_DATA_PATH")
|
|
if localPath == "" {
|
|
localPath = "/grlocaldata"
|
|
}
|
|
if sharePath == "" {
|
|
sharePath = "/grdata"
|
|
}
|
|
//获取内存使用情况
|
|
for _, service := range services {
|
|
if _, ok := status[service.ServiceID]; ok {
|
|
e.memoryUse.WithLabelValues(service.TenantID, service.ServiceID, "running").Set(float64(service.ContainerMemory * service.Replicas))
|
|
}
|
|
}
|
|
ch <- prometheus.MustNewConstMetric(scrapeDurationDesc, prometheus.GaugeValue, time.Since(scrapeTime).Seconds(), "collect.memory")
|
|
scrapeTime = time.Now()
|
|
diskcache := e.statusManager.GetAppDisk()
|
|
for k, v := range diskcache {
|
|
key := strings.Split(k, "_")
|
|
if len(key) == 2 {
|
|
e.fsUse.WithLabelValues(key[1], key[0], string(model.ShareFileVolumeType)).Set(v)
|
|
}
|
|
}
|
|
ch <- prometheus.MustNewConstMetric(scrapeDurationDesc, prometheus.GaugeValue, time.Since(scrapeTime).Seconds(), "collect.fs")
|
|
|
|
healthInfo := discover.HealthCheck()
|
|
healthStatus := healthInfo["status"]
|
|
var val float64
|
|
if healthStatus == "health" {
|
|
val = 1
|
|
} else {
|
|
val = 0
|
|
}
|
|
ch <- prometheus.MustNewConstMetric(e.healthStatus.Desc(), prometheus.GaugeValue, val)
|
|
ch <- prometheus.MustNewConstMetric(e.taskNum.Desc(), prometheus.GaugeValue, discover.TaskNum)
|
|
ch <- prometheus.MustNewConstMetric(e.taskError.Desc(), prometheus.GaugeValue, discover.TaskError)
|
|
}
|
|
|
|
// namespace is the metric namespace used for every metric defined in this
// file.
var namespace = "app_resource"
|
|
|
|
//New 创建一个收集器
|
|
func New(statusManager *status.AppRuntimeSyncClient) *Exporter {
|
|
return &Exporter{
|
|
totalScrapes: prometheus.NewCounter(prometheus.CounterOpts{
|
|
Namespace: namespace,
|
|
Subsystem: "exporter",
|
|
Name: "scrapes_total",
|
|
Help: "Total number of times Worker was scraped for metrics.",
|
|
}),
|
|
scrapeErrors: prometheus.NewCounterVec(prometheus.CounterOpts{
|
|
Namespace: namespace,
|
|
Subsystem: "exporter",
|
|
Name: "scrape_errors_total",
|
|
Help: "Total number of times an error occurred scraping a Worker.",
|
|
}, []string{"collector"}),
|
|
error: prometheus.NewGauge(prometheus.GaugeOpts{
|
|
Namespace: namespace,
|
|
Subsystem: "exporter",
|
|
Name: "last_scrape_error",
|
|
Help: "Whether the last scrape of metrics from Worker resulted in an error (1 for error, 0 for success).",
|
|
}),
|
|
workerUp: prometheus.NewGauge(prometheus.GaugeOpts{
|
|
Namespace: namespace,
|
|
Name: "up",
|
|
Help: "Whether the Worker server is up.",
|
|
}),
|
|
memoryUse: prometheus.NewGaugeVec(prometheus.GaugeOpts{
|
|
Namespace: namespace,
|
|
Name: "appmemory",
|
|
Help: "tenant service memory used.",
|
|
}, []string{"tenant_id", "service_id", "service_status"}),
|
|
fsUse: prometheus.NewGaugeVec(prometheus.GaugeOpts{
|
|
Namespace: namespace,
|
|
Name: "appfs",
|
|
Help: "tenant service fs used.",
|
|
}, []string{"tenant_id", "service_id", "volume_type"}),
|
|
healthStatus: prometheus.NewGauge(prometheus.GaugeOpts{
|
|
Namespace: namespace,
|
|
Subsystem: "exporter",
|
|
Name: "worker_health_status",
|
|
Help: "worker component health status.",
|
|
}),
|
|
taskNum: prometheus.NewGauge(prometheus.GaugeOpts{
|
|
Namespace: namespace,
|
|
Subsystem: "exporter",
|
|
Name: "worker_task_number",
|
|
Help: "worker total number of tasks.",
|
|
}),
|
|
taskError: prometheus.NewGauge(prometheus.GaugeOpts{
|
|
Namespace: namespace,
|
|
Subsystem: "exporter",
|
|
Name: "worker_task_error",
|
|
Help: "worker number of task errors.",
|
|
}),
|
|
dbmanager: db.GetManager(),
|
|
statusManager: statusManager,
|
|
}
|
|
}
|