414 lines
11 KiB
Go
Raw Normal View History

2024-07-26 11:50:02 +05:30
package kafka
import (
"fmt"
"github.com/SigNoz/signoz/pkg/query-service/common"
"github.com/SigNoz/signoz/pkg/query-service/constants"
v3 "github.com/SigNoz/signoz/pkg/query-service/model/v3"
2024-07-26 11:50:02 +05:30
)
// defaultStepInterval is the Step value assigned to every QueryRangeParamsV3
// built in this file.
// NOTE(review): the unit is not visible here (presumably seconds) — confirm.
var defaultStepInterval = int64(60)
func BuildQueryRangeParams(messagingQueue *MessagingQueue, queryContext string) (*v3.QueryRangeParamsV3, error) {
if constants.KafkaSpanEval == "false" && queryContext == "producer-consumer-eval" {
return nil, fmt.Errorf("span evaluation feature is disabled and is experimental")
}
2024-07-26 13:02:45 +05:30
// ToDo: propagate this through APIs when there are different handlers
queueType := KafkaQueue
2024-07-26 13:02:45 +05:30
chq, err := BuildClickHouseQuery(messagingQueue, queueType, queryContext)
2024-07-26 15:23:31 +05:30
if err != nil {
return nil, err
2024-07-26 11:50:02 +05:30
}
cq, err := buildCompositeQuery(chq, queryContext)
if err != nil {
return nil, err
}
2024-07-26 15:23:31 +05:30
2024-07-26 11:50:02 +05:30
queryRangeParams := &v3.QueryRangeParamsV3{
Start: messagingQueue.Start,
End: messagingQueue.End,
Step: defaultStepInterval,
CompositeQuery: cq,
Version: "v4",
FormatForWeb: true,
}
return queryRangeParams, nil
}
2024-08-07 13:51:00 +05:30
func buildClickHouseQueryNetwork(messagingQueue *MessagingQueue, queueType string) (*v3.ClickHouseQuery, error) {
start := messagingQueue.Start
end := messagingQueue.End
2024-08-07 13:51:00 +05:30
consumerGroup, ok := messagingQueue.Variables["consumer_group"]
if !ok {
return nil, fmt.Errorf("consumer_group not found in the request")
}
2024-08-27 18:27:44 +05:30
partitionID, ok := messagingQueue.Variables["partition"]
if !ok {
return nil, fmt.Errorf("partition not found in the request")
}
query := generateNetworkLatencyThroughputSQL(start, end, consumerGroup, partitionID, queueType)
2024-08-07 13:51:00 +05:30
return &v3.ClickHouseQuery{
Query: query,
}, nil
}
func buildBuilderQueriesProducerBytes(
unixMilliStart, unixMilliEnd int64,
attributeCache *Clients,
) (map[string]*v3.BuilderQuery, error) {
bq := make(map[string]*v3.BuilderQuery)
queryName := "byte_rate"
chq := &v3.BuilderQuery{
QueryName: queryName,
StepInterval: common.MinAllowedStepInterval(unixMilliStart, unixMilliEnd),
DataSource: v3.DataSourceMetrics,
AggregateAttribute: v3.AttributeKey{
Key: "kafka_producer_byte_rate",
DataType: v3.AttributeKeyDataTypeFloat64,
Type: v3.AttributeKeyType("Gauge"),
IsColumn: true,
},
AggregateOperator: v3.AggregateOperatorAvg,
Temporality: v3.Unspecified,
TimeAggregation: v3.TimeAggregationAvg,
SpaceAggregation: v3.SpaceAggregationAvg,
Filters: &v3.FilterSet{
Operator: "AND",
Items: []v3.FilterItem{
{
Key: v3.AttributeKey{
Key: "service_name",
Type: v3.AttributeKeyTypeTag,
DataType: v3.AttributeKeyDataTypeString,
},
Operator: v3.FilterOperatorIn,
Value: attributeCache.ServiceName,
},
{
Key: v3.AttributeKey{
Key: "topic",
Type: v3.AttributeKeyTypeTag,
DataType: v3.AttributeKeyDataTypeString,
},
Operator: v3.FilterOperatorIn,
Value: attributeCache.TopicName,
},
},
},
Expression: queryName,
ReduceTo: v3.ReduceToOperatorAvg,
GroupBy: []v3.AttributeKey{
{
Key: "service_name",
DataType: v3.AttributeKeyDataTypeString,
Type: v3.AttributeKeyTypeTag,
},
{
Key: "topic",
DataType: v3.AttributeKeyDataTypeString,
Type: v3.AttributeKeyTypeTag,
},
},
2024-08-27 18:27:44 +05:30
}
bq[queryName] = chq
return bq, nil
2024-08-27 18:27:44 +05:30
}
2024-08-26 17:56:03 +05:30
func buildBuilderQueriesNetwork(
unixMilliStart, unixMilliEnd int64,
attributeCache *Clients,
) (map[string]*v3.BuilderQuery, error) {
2024-08-27 18:27:44 +05:30
bq := make(map[string]*v3.BuilderQuery)
queryName := "latency"
2024-08-27 18:27:44 +05:30
chq := &v3.BuilderQuery{
QueryName: queryName,
StepInterval: common.MinAllowedStepInterval(unixMilliStart, unixMilliEnd),
DataSource: v3.DataSourceMetrics,
AggregateAttribute: v3.AttributeKey{
Key: "kafka_consumer_fetch_latency_avg",
},
AggregateOperator: v3.AggregateOperatorAvg,
Temporality: v3.Unspecified,
TimeAggregation: v3.TimeAggregationAvg,
SpaceAggregation: v3.SpaceAggregationAvg,
Filters: &v3.FilterSet{
Operator: "AND",
Items: []v3.FilterItem{
{
Key: v3.AttributeKey{
Key: "service_name",
Type: v3.AttributeKeyTypeTag,
DataType: v3.AttributeKeyDataTypeString,
2024-08-26 17:56:03 +05:30
},
2024-08-27 18:27:44 +05:30
Operator: v3.FilterOperatorIn,
Value: attributeCache.ServiceName,
},
{
Key: v3.AttributeKey{
Key: "client_id",
Type: v3.AttributeKeyTypeTag,
DataType: v3.AttributeKeyDataTypeString,
2024-08-26 17:56:03 +05:30
},
2024-08-27 18:27:44 +05:30
Operator: v3.FilterOperatorIn,
Value: attributeCache.ClientID,
},
{
Key: v3.AttributeKey{
Key: "service_instance_id",
Type: v3.AttributeKeyTypeTag,
DataType: v3.AttributeKeyDataTypeString,
2024-08-26 17:56:03 +05:30
},
2024-08-27 18:27:44 +05:30
Operator: v3.FilterOperatorIn,
Value: attributeCache.ServiceInstanceID,
2024-08-26 17:56:03 +05:30
},
},
2024-08-27 18:27:44 +05:30
},
Expression: queryName,
ReduceTo: v3.ReduceToOperatorAvg,
GroupBy: []v3.AttributeKey{
{
Key: "service_name",
DataType: v3.AttributeKeyDataTypeString,
Type: v3.AttributeKeyTypeTag,
},
2024-08-27 18:27:44 +05:30
{
Key: "client_id",
2024-08-26 17:56:03 +05:30
DataType: v3.AttributeKeyDataTypeString,
Type: v3.AttributeKeyTypeTag,
},
2024-08-27 18:27:44 +05:30
{
Key: "service_instance_id",
DataType: v3.AttributeKeyDataTypeString,
Type: v3.AttributeKeyTypeTag,
2024-08-26 17:56:03 +05:30
},
2024-08-27 18:27:44 +05:30
},
2024-08-07 13:51:00 +05:30
}
2024-08-27 18:27:44 +05:30
bq[queryName] = chq
2024-08-26 17:56:03 +05:30
return bq, nil
2024-08-07 13:51:00 +05:30
}
// BuildBuilderQueriesKafkaOnboarding builds a table-panel query-range request
// containing two metrics builder queries: "fetch_latency" over
// kafka_consumer_fetch_latency_avg and "consumer_lag" over
// kafka_consumer_group_lag. Both use count time-aggregation and sum
// space-aggregation.
//
// Start and End of the result are messagingQueue.Start and messagingQueue.End
// divided by 1000000. The error result is always nil.
func BuildBuilderQueriesKafkaOnboarding(messagingQueue *MessagingQueue) (*v3.QueryRangeParamsV3, error) {
	// NOTE(review): the divisor suggests a nanosecond -> millisecond conversion;
	// confirm against the MessagingQueue definition.
	startMilli := messagingQueue.Start / 1000000
	endMilli := messagingQueue.End / 1000000

	// Both queries share the same aggregation and differ only in their name
	// and in the metric they read.
	newCountQuery := func(name, metric string) *v3.BuilderQuery {
		return &v3.BuilderQuery{
			QueryName:    name,
			StepInterval: common.MinAllowedStepInterval(startMilli, endMilli),
			DataSource:   v3.DataSourceMetrics,
			AggregateAttribute: v3.AttributeKey{
				Key: metric,
			},
			AggregateOperator: v3.AggregateOperatorCount,
			Temporality:       v3.Unspecified,
			TimeAggregation:   v3.TimeAggregationCount,
			SpaceAggregation:  v3.SpaceAggregationSum,
			Expression:        name,
		}
	}

	builderQueries := map[string]*v3.BuilderQuery{
		"fetch_latency": newCountQuery("fetch_latency", "kafka_consumer_fetch_latency_avg"),
		"consumer_lag":  newCountQuery("consumer_lag", "kafka_consumer_group_lag"),
	}

	return &v3.QueryRangeParamsV3{
		Start: startMilli,
		End:   endMilli,
		Step:  defaultStepInterval,
		CompositeQuery: &v3.CompositeQuery{
			QueryType:      v3.QueryTypeBuilder,
			BuilderQueries: builderQueries,
			PanelType:      v3.PanelTypeTable,
		},
		Version:      "v4",
		FormatForWeb: true,
	}, nil
}
func BuildQRParamsWithCache(
messagingQueue *MessagingQueue,
queryContext string,
attributeCache *Clients,
) (*v3.QueryRangeParamsV3, error) {
2024-08-07 13:51:00 +05:30
queueType := KafkaQueue
2024-08-07 13:51:00 +05:30
2024-08-27 14:04:00 +05:30
unixMilliStart := messagingQueue.Start / 1000000
unixMilliEnd := messagingQueue.End / 1000000
2024-08-07 13:51:00 +05:30
var cq *v3.CompositeQuery
var err error
2024-08-07 13:51:00 +05:30
if queryContext == "throughput" {
chq, err := buildClickHouseQueryNetwork(messagingQueue, queueType)
if err != nil {
return nil, err
}
cq, err = buildCompositeQuery(chq, queryContext)
2024-08-26 17:56:03 +05:30
2024-08-07 13:51:00 +05:30
} else if queryContext == "fetch-latency" {
2024-08-27 14:04:00 +05:30
bhq, err := buildBuilderQueriesNetwork(unixMilliStart, unixMilliEnd, attributeCache)
2024-08-07 13:51:00 +05:30
if err != nil {
return nil, err
}
cq = &v3.CompositeQuery{
2024-08-26 17:56:03 +05:30
QueryType: v3.QueryTypeBuilder,
BuilderQueries: bhq,
PanelType: v3.PanelTypeTable,
2024-08-07 13:51:00 +05:30
}
} else if queryContext == "producer-throughput-overview" {
start := messagingQueue.Start
end := messagingQueue.End
query := generateProducerPartitionThroughputSQL(start, end, queueType)
cq, err = buildCompositeQuery(&v3.ClickHouseQuery{
Query: query,
}, queryContext)
} else if queryContext == "producer-throughput-overview-byte-rate" {
bhq, err := buildBuilderQueriesProducerBytes(unixMilliStart, unixMilliEnd, attributeCache)
if err != nil {
return nil, err
}
cq = &v3.CompositeQuery{
QueryType: v3.QueryTypeBuilder,
BuilderQueries: bhq,
PanelType: v3.PanelTypeTable,
FillGaps: false,
}
2024-08-07 13:51:00 +05:30
}
queryRangeParams := &v3.QueryRangeParamsV3{
2024-08-27 14:04:00 +05:30
Start: unixMilliStart,
End: unixMilliEnd,
2024-08-07 13:51:00 +05:30
Step: defaultStepInterval,
CompositeQuery: cq,
Version: "v4",
FormatForWeb: true,
}
return queryRangeParams, err
2024-08-07 13:51:00 +05:30
}
func BuildClickHouseQuery(
messagingQueue *MessagingQueue,
queueType string,
queryContext string,
) (*v3.ClickHouseQuery, error) {
2024-07-26 11:50:02 +05:30
start := messagingQueue.Start
end := messagingQueue.End
2024-09-30 18:13:39 +05:30
var topic, partition string
if queryContext == "producer" ||
queryContext == "consumer" ||
queryContext == "consumer_partition_latency" ||
queryContext == "producer-throughput-details" ||
queryContext == "consumer-throughput-details" {
2024-09-30 18:13:39 +05:30
var ok bool
topic, ok = messagingQueue.Variables["topic"]
if !ok {
return nil, fmt.Errorf("invalid type for Topic")
}
if !(queryContext == "consumer-throughput-details" ||
queryContext == "producer-throughput-details") {
partition, ok = messagingQueue.Variables["partition"]
if !ok {
return nil, fmt.Errorf("invalid type for Partition")
}
2024-09-30 18:13:39 +05:30
}
2024-07-26 11:50:02 +05:30
}
2024-07-26 15:23:31 +05:30
var query string
switch queryContext {
case "producer":
2024-07-26 15:23:31 +05:30
query = generateProducerSQL(start, end, topic, partition, queueType)
case "consumer":
consumerGroup, ok := messagingQueue.Variables["consumer_group"]
if !ok {
return nil, fmt.Errorf("invalid type for consumer group")
}
2024-07-31 17:55:13 +05:30
query = generateConsumerSQL(start, end, topic, partition, consumerGroup, queueType)
case "producer-topic-throughput":
query = generatePartitionLatencySQL(start, end, queueType)
case "consumer_partition_latency":
query = generateConsumerPartitionLatencySQL(start, end, topic, partition, queueType)
case "producer-throughput-details":
svcName, ok := messagingQueue.Variables["service_name"]
if !ok {
return nil, fmt.Errorf("invalid type for service")
}
query = generateProducerTopicLatencySQL(start, end, topic, svcName, queueType)
case "consumer-throughput-overview":
query = generateConsumerLatencySQL(start, end, queueType)
case "consumer-throughput-details":
svcName, ok := messagingQueue.Variables["service_name"]
if !ok {
return nil, fmt.Errorf("invalid type for service")
}
query = generateConsumerServiceLatencySQL(start, end, topic, svcName, queueType)
case "producer-consumer-eval":
query = generateProducerConsumerEvalSQL(start, end, queueType, messagingQueue.EvalTime)
case "onboard_producers":
2024-09-30 18:13:39 +05:30
query = onboardProducersSQL(start, end, queueType)
case "onboard_consumers":
2024-09-30 18:13:39 +05:30
query = onboardConsumerSQL(start, end, queueType)
2024-07-26 11:50:02 +05:30
}
2024-07-26 11:50:02 +05:30
return &v3.ClickHouseQuery{
Query: query,
}, nil
}
2024-07-26 15:23:31 +05:30
func buildCompositeQuery(chq *v3.ClickHouseQuery, queryContext string) (*v3.CompositeQuery, error) {
if queryContext == "producer-consumer-eval" {
return &v3.CompositeQuery{
QueryType: v3.QueryTypeClickHouseSQL,
ClickHouseQueries: map[string]*v3.ClickHouseQuery{queryContext: chq},
PanelType: v3.PanelTypeList,
}, nil
}
2024-07-26 11:50:02 +05:30
return &v3.CompositeQuery{
QueryType: v3.QueryTypeClickHouseSQL,
2024-07-26 15:23:31 +05:30
ClickHouseQueries: map[string]*v3.ClickHouseQuery{queryContext: chq},
2024-07-26 11:50:02 +05:30
PanelType: v3.PanelTypeTable,
}, nil
}