// Copyright (C) 2019-2020 Zilliz. All rights reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software distributed under the License // is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express // or implied. See the License for the specific language governing permissions and limitations under the License. package querycoord import ( "context" "os" "github.com/milvus-io/milvus/internal/util/uniquegenerator" "github.com/milvus-io/milvus/internal/util/typeutil" "go.uber.org/zap" "github.com/milvus-io/milvus/internal/log" "github.com/milvus-io/milvus/internal/proto/commonpb" "github.com/milvus-io/milvus/internal/proto/milvuspb" "github.com/milvus-io/milvus/internal/util/metricsinfo" ) // TODO(dragondriver): add more detail metrics func getSystemInfoMetrics( ctx context.Context, req *milvuspb.GetMetricsRequest, qc *QueryCoord, ) (*milvuspb.GetMetricsResponse, error) { clusterTopology := metricsinfo.QueryClusterTopology{ Self: metricsinfo.QueryCoordInfos{ BaseComponentInfos: metricsinfo.BaseComponentInfos{ Name: metricsinfo.ConstructComponentName(typeutil.QueryCoordRole, Params.QueryCoordID), HardwareInfos: metricsinfo.HardwareMetrics{ IP: qc.session.Address, CPUCoreCount: metricsinfo.GetCPUCoreCount(false), CPUCoreUsage: metricsinfo.GetCPUUsage(), Memory: metricsinfo.GetMemoryCount(), MemoryUsage: metricsinfo.GetUsedMemoryCount(), Disk: metricsinfo.GetDiskCount(), DiskUsage: metricsinfo.GetDiskUsage(), }, SystemInfo: metricsinfo.DeployMetrics{ SystemVersion: os.Getenv(metricsinfo.GitCommitEnvKey), DeployMode: os.Getenv(metricsinfo.DeployModeEnvKey), }, CreatedTime: Params.CreatedTime.String(), UpdatedTime: Params.UpdatedTime.String(), Type: typeutil.QueryCoordRole, ID: qc.session.ServerID, }, SystemConfigurations: metricsinfo.QueryCoordConfiguration{ SearchChannelPrefix: Params.SearchChannelPrefix, SearchResultChannelPrefix: Params.SearchResultChannelPrefix, }, }, ConnectedNodes: make([]metricsinfo.QueryNodeInfos, 0), } nodesMetrics := qc.cluster.getMetrics(ctx, req) for _, nodeMetrics := range nodesMetrics { if nodeMetrics.err != nil { log.Warn("invalid metrics of query node was found", zap.Error(nodeMetrics.err)) clusterTopology.ConnectedNodes = append(clusterTopology.ConnectedNodes, metricsinfo.QueryNodeInfos{ BaseComponentInfos: metricsinfo.BaseComponentInfos{ HasError: true, ErrorReason: nodeMetrics.err.Error(), // Name doesn't matter here cause we can't get it when error occurs, using address as the Name? Name: "", ID: int64(uniquegenerator.GetUniqueIntGeneratorIns().GetInt()), }, }) continue } if nodeMetrics.resp.Status.ErrorCode != commonpb.ErrorCode_Success { log.Warn("invalid metrics of query node was found", zap.Any("error_code", nodeMetrics.resp.Status.ErrorCode), zap.Any("error_reason", nodeMetrics.resp.Status.Reason)) clusterTopology.ConnectedNodes = append(clusterTopology.ConnectedNodes, metricsinfo.QueryNodeInfos{ BaseComponentInfos: metricsinfo.BaseComponentInfos{ HasError: true, ErrorReason: nodeMetrics.resp.Status.Reason, Name: nodeMetrics.resp.ComponentName, ID: int64(uniquegenerator.GetUniqueIntGeneratorIns().GetInt()), }, }) continue } infos := metricsinfo.QueryNodeInfos{} err := metricsinfo.UnmarshalComponentInfos(nodeMetrics.resp.Response, &infos) if err != nil { log.Warn("invalid metrics of query node was found", zap.Error(err)) clusterTopology.ConnectedNodes = append(clusterTopology.ConnectedNodes, metricsinfo.QueryNodeInfos{ BaseComponentInfos: metricsinfo.BaseComponentInfos{ HasError: true, ErrorReason: err.Error(), Name: nodeMetrics.resp.ComponentName, ID: int64(uniquegenerator.GetUniqueIntGeneratorIns().GetInt()), }, }) continue } clusterTopology.ConnectedNodes = append(clusterTopology.ConnectedNodes, infos) } coordTopology := metricsinfo.QueryCoordTopology{ Cluster: clusterTopology, Connections: metricsinfo.ConnTopology{ Name: metricsinfo.ConstructComponentName(typeutil.QueryCoordRole, Params.QueryCoordID), // TODO(dragondriver): fill ConnectedComponents if necessary ConnectedComponents: []metricsinfo.ConnectionInfo{}, }, } resp, err := metricsinfo.MarshalTopology(coordTopology) if err != nil { return &milvuspb.GetMetricsResponse{ Status: &commonpb.Status{ ErrorCode: commonpb.ErrorCode_UnexpectedError, Reason: err.Error(), }, Response: "", ComponentName: metricsinfo.ConstructComponentName(typeutil.QueryCoordRole, Params.QueryCoordID), }, nil } return &milvuspb.GetMetricsResponse{ Status: &commonpb.Status{ ErrorCode: commonpb.ErrorCode_Success, Reason: "", }, Response: resp, ComponentName: metricsinfo.ConstructComponentName(typeutil.QueryCoordRole, Params.QueryCoordID), }, nil }