// Mirror of https://github.com/SigNoz/signoz.git (synced 2025-12-18 07:56:56 +00:00).
// 754 lines, 20 KiB, Go.
package telemetrytraces
|
|
|
|
import (
|
|
"context"
|
|
"fmt"
|
|
"github.com/SigNoz/signoz/pkg/errors"
|
|
"github.com/SigNoz/signoz/pkg/querybuilder"
|
|
qbtypes "github.com/SigNoz/signoz/pkg/types/querybuildertypes/querybuildertypesv5"
|
|
"github.com/SigNoz/signoz/pkg/types/telemetrytypes"
|
|
"github.com/huandu/go-sqlbuilder"
|
|
"strings"
|
|
)
|
|
|
|
// cteNode is a single named common table expression queued for the final
// statement, together with the arguments its SQL text consumes.
type cteNode struct {
	// name is the CTE identifier; sql is the body rendered inside "name AS (...)".
	name, sql string
	// args are the values bound to the placeholders in sql.
	args []any
	// dependsOn holds the names of the CTEs this one was built from.
	dependsOn []string
}
|
|
|
|
type traceOperatorCTEBuilder struct {
|
|
ctx context.Context
|
|
start uint64
|
|
end uint64
|
|
operator *qbtypes.QueryBuilderTraceOperator
|
|
stmtBuilder *traceOperatorStatementBuilder
|
|
queries map[string]*qbtypes.QueryBuilderQuery[qbtypes.TraceAggregation]
|
|
ctes []cteNode // Ordered list of CTEs
|
|
cteNameToIndex map[string]int
|
|
queryToCTEName map[string]string
|
|
compositeQuery *qbtypes.CompositeQuery
|
|
}
|
|
|
|
func (b *traceOperatorCTEBuilder) collectQueries() error {
|
|
referencedQueries := b.operator.CollectReferencedQueries(b.operator.ParsedExpression)
|
|
|
|
for _, queryEnv := range b.compositeQuery.Queries {
|
|
if queryEnv.Type == qbtypes.QueryTypeBuilder {
|
|
if traceQuery, ok := queryEnv.Spec.(qbtypes.QueryBuilderQuery[qbtypes.TraceAggregation]); ok {
|
|
for _, refName := range referencedQueries {
|
|
if traceQuery.Name == refName {
|
|
queryCopy := traceQuery // Make a copy
|
|
b.queries[refName] = &queryCopy
|
|
break
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
for _, refName := range referencedQueries {
|
|
if _, found := b.queries[refName]; !found {
|
|
return errors.NewInvalidInputf(errors.CodeInvalidInput, "referenced query '%s' not found", refName)
|
|
}
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
func (b *traceOperatorCTEBuilder) build(requestType qbtypes.RequestType) (*qbtypes.Statement, error) {
|
|
|
|
err := b.buildBaseSpansCTE()
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
// Build CTEs for the expression tree
|
|
rootCTEName, err := b.buildExpressionCTEs(b.operator.ParsedExpression)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
// Determine which CTE to select from
|
|
selectFromCTE := rootCTEName
|
|
if b.operator.ReturnSpansFrom != "" {
|
|
// Find the CTE that corresponds to this query
|
|
selectFromCTE = b.queryToCTEName[b.operator.ReturnSpansFrom]
|
|
if selectFromCTE == "" {
|
|
return nil, errors.NewInvalidInputf(errors.CodeInvalidInput,
|
|
"returnSpansFrom references query '%s' which has no corresponding CTE",
|
|
b.operator.ReturnSpansFrom)
|
|
}
|
|
}
|
|
|
|
// Build the final SELECT based on request type
|
|
finalStmt, err := b.buildFinalQuery(selectFromCTE, requestType)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
// Combine all CTEs
|
|
var cteFragments []string
|
|
var cteArgs [][]any
|
|
|
|
// Add time constants
|
|
timeConstantsCTE := b.buildTimeConstantsCTE()
|
|
cteFragments = append(cteFragments, timeConstantsCTE)
|
|
|
|
// Add all CTEs in order
|
|
for _, cte := range b.ctes {
|
|
cteFragments = append(cteFragments, fmt.Sprintf("%s AS (%s)", cte.name, cte.sql))
|
|
cteArgs = append(cteArgs, cte.args)
|
|
}
|
|
|
|
finalSQL := querybuilder.CombineCTEs(cteFragments) + finalStmt.Query
|
|
finalArgs := querybuilder.PrependArgs(cteArgs, finalStmt.Args)
|
|
|
|
return &qbtypes.Statement{
|
|
Query: finalSQL,
|
|
Args: finalArgs,
|
|
Warnings: finalStmt.Warnings,
|
|
}, nil
|
|
}
|
|
|
|
func (b *traceOperatorCTEBuilder) buildTimeConstantsCTE() string {
|
|
startBucket := b.start/querybuilder.NsToSeconds - querybuilder.BucketAdjustment
|
|
endBucket := b.end / querybuilder.NsToSeconds
|
|
|
|
return fmt.Sprintf(`
|
|
toDateTime64(%d, 9) AS t_from,
|
|
toDateTime64(%d, 9) AS t_to,
|
|
%d AS bucket_from,
|
|
%d AS bucket_to`,
|
|
b.start, b.end, startBucket, endBucket)
|
|
}
|
|
|
|
func (b *traceOperatorCTEBuilder) buildBaseSpansCTE() error {
|
|
sb := sqlbuilder.NewSelectBuilder()
|
|
|
|
// Select core span columns
|
|
sb.Select(
|
|
"trace_id",
|
|
"span_id",
|
|
"parent_span_id",
|
|
"name",
|
|
"timestamp",
|
|
"duration_nano AS durationNano",
|
|
sqlbuilder.Escape("resource_string_service$$name")+" AS serviceName",
|
|
sqlbuilder.Escape("resource_string_service$$name"), // Original column name for filters
|
|
sqlbuilder.Escape("resource_string_service$$name_exists"), // Exists flag column for filters
|
|
)
|
|
|
|
// Add any additional fields requested by the user
|
|
for _, field := range b.operator.SelectFields {
|
|
colExpr, err := b.stmtBuilder.fm.ColumnExpressionFor(b.ctx, &field, nil)
|
|
if err != nil {
|
|
return errors.NewInvalidInputf(
|
|
errors.CodeInvalidInput,
|
|
"failed to map select field '%s': %v",
|
|
field.Name,
|
|
err,
|
|
)
|
|
}
|
|
sb.SelectMore(sqlbuilder.Escape(colExpr))
|
|
}
|
|
|
|
// Set the table to query from
|
|
sb.From(fmt.Sprintf("%s.%s", DBName, SpanIndexV3TableName))
|
|
|
|
// Calculate bucket ranges for time-based partitioning
|
|
startBucket := b.start/querybuilder.NsToSeconds - querybuilder.BucketAdjustment
|
|
endBucket := b.end / querybuilder.NsToSeconds
|
|
|
|
// Add time and bucket filters
|
|
sb.Where(
|
|
sb.GE("timestamp", fmt.Sprintf("%d", b.start)),
|
|
sb.L("timestamp", fmt.Sprintf("%d", b.end)),
|
|
sb.GE("ts_bucket_start", startBucket),
|
|
sb.LE("ts_bucket_start", endBucket),
|
|
)
|
|
|
|
// Build the SQL and add as CTE
|
|
sql, args := sb.BuildWithFlavor(sqlbuilder.ClickHouse)
|
|
b.addCTE("base_spans", sql, args, nil)
|
|
return nil
|
|
}
|
|
|
|
func (b *traceOperatorCTEBuilder) buildExpressionCTEs(expr *qbtypes.TraceOperand) (string, error) {
|
|
if expr == nil {
|
|
return "", errors.NewInvalidInputf(errors.CodeInvalidInput, "expression is nil")
|
|
}
|
|
|
|
if expr.QueryRef != nil {
|
|
// Leaf node - build CTE for the query
|
|
return b.buildQueryCTE(expr.QueryRef.Name)
|
|
}
|
|
|
|
// Operator node - build CTEs for children first
|
|
var leftCTE, rightCTE string
|
|
var err error
|
|
|
|
if expr.Left != nil {
|
|
leftCTE, err = b.buildExpressionCTEs(expr.Left)
|
|
if err != nil {
|
|
return "", err
|
|
}
|
|
}
|
|
|
|
if expr.Right != nil {
|
|
rightCTE, err = b.buildExpressionCTEs(expr.Right)
|
|
if err != nil {
|
|
return "", err
|
|
}
|
|
}
|
|
|
|
// Build CTE for this operator
|
|
return b.buildOperatorCTE(*expr.Operator, leftCTE, rightCTE)
|
|
}
|
|
|
|
func (b *traceOperatorCTEBuilder) buildQueryCTE(queryName string) (string, error) {
|
|
query, exists := b.queries[queryName]
|
|
if !exists {
|
|
return "", errors.NewInvalidInputf(errors.CodeInvalidInput, "query %s not found", queryName)
|
|
}
|
|
|
|
cteName := queryName
|
|
b.queryToCTEName[queryName] = cteName
|
|
|
|
// Check if already built
|
|
if _, exists := b.cteNameToIndex[cteName]; exists {
|
|
return cteName, nil
|
|
}
|
|
|
|
// Get key selectors for the query
|
|
keySelectors := getKeySelectors(*query)
|
|
keys, _, err := b.stmtBuilder.metadataStore.GetKeysMulti(b.ctx, keySelectors)
|
|
if err != nil {
|
|
return "", err
|
|
}
|
|
|
|
sb := sqlbuilder.NewSelectBuilder()
|
|
sb.Select(
|
|
"trace_id",
|
|
"span_id",
|
|
"parent_span_id",
|
|
"name",
|
|
"timestamp",
|
|
"durationNano",
|
|
"serviceName",
|
|
fmt.Sprintf("'%s' AS level", cteName),
|
|
)
|
|
sb.From("base_spans AS s")
|
|
|
|
// Add filter conditions if present
|
|
if query.Filter != nil && query.Filter.Expression != "" {
|
|
filterWhereClause, err := querybuilder.PrepareWhereClause(
|
|
query.Filter.Expression,
|
|
querybuilder.FilterExprVisitorOpts{
|
|
FieldMapper: b.stmtBuilder.fm,
|
|
ConditionBuilder: b.stmtBuilder.cb,
|
|
FieldKeys: keys,
|
|
},
|
|
)
|
|
if err != nil {
|
|
return "", err
|
|
}
|
|
if filterWhereClause != nil {
|
|
sb.AddWhereClause(filterWhereClause.WhereClause)
|
|
}
|
|
}
|
|
|
|
sql, args := sb.BuildWithFlavor(sqlbuilder.ClickHouse)
|
|
b.addCTE(cteName, sql, args, []string{"base_spans"})
|
|
|
|
return cteName, nil
|
|
}
|
|
|
|
// operatorNameReplacer rewrites trace operator symbols and spaces into tokens
// that can be embedded in a CTE name. It is built once and, like every
// strings.Replacer, is safe for concurrent use.
var operatorNameReplacer = strings.NewReplacer(
	"=>", "DIRECT_DESC",
	"->", "INDIRECT_DESC",
	"&&", "AND",
	"||", "OR",
	" ", "_",
)

// sanitizeForSQL returns s with the operator symbols "=>", "->", "&&" and "||"
// replaced by DIRECT_DESC, INDIRECT_DESC, AND and OR respectively, and every
// space replaced by an underscore. All other text, including the word NOT, is
// returned unchanged.
//
// The replacement runs in a single left-to-right pass, so the result does not
// depend on map iteration order.
func sanitizeForSQL(s string) string {
	return operatorNameReplacer.Replace(s)
}
|
|
|
|
func (b *traceOperatorCTEBuilder) buildOperatorCTE(op qbtypes.TraceOperatorType, leftCTE, rightCTE string) (string, error) {
|
|
sanitizedOp := sanitizeForSQL(op.StringValue())
|
|
cteName := fmt.Sprintf("%s_%s_%s", leftCTE, sanitizedOp, rightCTE)
|
|
|
|
if _, exists := b.cteNameToIndex[cteName]; exists {
|
|
return cteName, nil
|
|
}
|
|
|
|
var sql string
|
|
var args []any
|
|
var dependsOn []string
|
|
|
|
switch op {
|
|
case qbtypes.TraceOperatorDirectDescendant:
|
|
sql, args, dependsOn = b.buildDirectDescendantCTE(leftCTE, rightCTE)
|
|
case qbtypes.TraceOperatorAnd:
|
|
sql, args, dependsOn = b.buildAndCTE(leftCTE, rightCTE)
|
|
case qbtypes.TraceOperatorOr:
|
|
sql, dependsOn = b.buildOrCTE(leftCTE, rightCTE)
|
|
args = nil // OR operations don't need args
|
|
case qbtypes.TraceOperatorNot, qbtypes.TraceOperatorExclude:
|
|
sql, args, dependsOn = b.buildNotCTE(leftCTE, rightCTE)
|
|
default:
|
|
return "", errors.NewInvalidInputf(errors.CodeInvalidInput, "unsupported operator: %s", op.StringValue())
|
|
}
|
|
|
|
b.addCTE(cteName, sql, args, dependsOn)
|
|
return cteName, nil
|
|
}
|
|
|
|
func (b *traceOperatorCTEBuilder) buildDirectDescendantCTE(parentCTE, childCTE string) (string, []any, []string) {
|
|
sb := sqlbuilder.NewSelectBuilder()
|
|
sb.Select(
|
|
"c.trace_id",
|
|
"c.span_id",
|
|
"c.parent_span_id",
|
|
"c.name",
|
|
"c.timestamp",
|
|
"c.durationNano",
|
|
"c.serviceName",
|
|
fmt.Sprintf("'%s' AS level", childCTE),
|
|
)
|
|
sb.From(fmt.Sprintf("%s AS c", childCTE))
|
|
sb.JoinWithOption(
|
|
sqlbuilder.InnerJoin,
|
|
fmt.Sprintf("%s AS p", parentCTE),
|
|
"p.trace_id = c.trace_id AND p.span_id = c.parent_span_id",
|
|
)
|
|
|
|
sql, args := sb.BuildWithFlavor(sqlbuilder.ClickHouse)
|
|
return sql, args, []string{parentCTE, childCTE}
|
|
}
|
|
|
|
func (b *traceOperatorCTEBuilder) buildAndCTE(leftCTE, rightCTE string) (string, []any, []string) {
|
|
sb := sqlbuilder.NewSelectBuilder()
|
|
sb.Select(
|
|
"l.trace_id",
|
|
"l.span_id",
|
|
"l.parent_span_id",
|
|
"l.name",
|
|
"l.timestamp",
|
|
"l.durationNano",
|
|
"l.serviceName",
|
|
"l.level",
|
|
)
|
|
sb.From(fmt.Sprintf("%s AS l", leftCTE))
|
|
sb.JoinWithOption(
|
|
sqlbuilder.InnerJoin,
|
|
fmt.Sprintf("%s AS r", rightCTE),
|
|
"l.trace_id = r.trace_id AND l.span_id = r.span_id",
|
|
)
|
|
|
|
sql, args := sb.BuildWithFlavor(sqlbuilder.ClickHouse)
|
|
return sql, args, []string{leftCTE, rightCTE}
|
|
}
|
|
|
|
func (b *traceOperatorCTEBuilder) buildOrCTE(leftCTE, rightCTE string) (string, []string) {
|
|
sql := fmt.Sprintf(`
|
|
SELECT * FROM %s
|
|
UNION DISTINCT
|
|
SELECT * FROM %s
|
|
`, leftCTE, rightCTE)
|
|
|
|
return sql, []string{leftCTE, rightCTE}
|
|
}
|
|
|
|
func (b *traceOperatorCTEBuilder) buildNotCTE(leftCTE, rightCTE string) (string, []any, []string) {
|
|
sb := sqlbuilder.NewSelectBuilder()
|
|
sb.Select(
|
|
"l.trace_id",
|
|
"l.span_id",
|
|
"l.parent_span_id",
|
|
"l.name",
|
|
"l.timestamp",
|
|
"l.durationNano",
|
|
"l.serviceName",
|
|
"l.level",
|
|
)
|
|
sb.From(fmt.Sprintf("%s AS l", leftCTE))
|
|
sb.Where(fmt.Sprintf(
|
|
"NOT EXISTS (SELECT 1 FROM %s AS r WHERE r.trace_id = l.trace_id AND r.span_id = l.span_id)",
|
|
rightCTE,
|
|
))
|
|
|
|
sql, args := sb.BuildWithFlavor(sqlbuilder.ClickHouse)
|
|
return sql, args, []string{leftCTE, rightCTE}
|
|
}
|
|
|
|
func (b *traceOperatorCTEBuilder) buildFinalQuery(selectFromCTE string, requestType qbtypes.RequestType) (*qbtypes.Statement, error) {
|
|
switch requestType {
|
|
case qbtypes.RequestTypeRaw:
|
|
return b.buildListQuery(selectFromCTE)
|
|
case qbtypes.RequestTypeTimeSeries:
|
|
return b.buildTimeSeriesQuery(selectFromCTE)
|
|
case qbtypes.RequestTypeScalar:
|
|
return b.buildScalarQuery(selectFromCTE)
|
|
default:
|
|
return nil, fmt.Errorf("unsupported request type: %s", requestType)
|
|
}
|
|
}
|
|
|
|
func (b *traceOperatorCTEBuilder) buildListQuery(selectFromCTE string) (*qbtypes.Statement, error) {
|
|
sb := sqlbuilder.NewSelectBuilder()
|
|
|
|
// Select default columns
|
|
sb.Select(
|
|
"timestamp",
|
|
"trace_id",
|
|
"span_id",
|
|
"name",
|
|
"serviceName",
|
|
"durationNano",
|
|
"parent_span_id",
|
|
)
|
|
|
|
for _, field := range b.operator.SelectFields {
|
|
colExpr, err := b.stmtBuilder.fm.ColumnExpressionFor(b.ctx, &field, nil)
|
|
if err != nil {
|
|
return nil, errors.NewInvalidInputf(
|
|
errors.CodeInvalidInput,
|
|
"failed to map select field '%s' in list query: %v",
|
|
field.Name,
|
|
err,
|
|
)
|
|
}
|
|
sb.SelectMore(sqlbuilder.Escape(colExpr))
|
|
}
|
|
|
|
sb.From(selectFromCTE)
|
|
|
|
// For span results, only timestamp ordering makes sense
|
|
sb.OrderBy("timestamp DESC")
|
|
|
|
// Add limit
|
|
if b.operator.Limit > 0 {
|
|
sb.Limit(b.operator.Limit)
|
|
} else {
|
|
sb.Limit(100)
|
|
}
|
|
|
|
sql, args := sb.BuildWithFlavor(sqlbuilder.ClickHouse)
|
|
return &qbtypes.Statement{
|
|
Query: sql,
|
|
Args: args,
|
|
}, nil
|
|
}
|
|
|
|
func (b *traceOperatorCTEBuilder) getKeySelectors() []*telemetrytypes.FieldKeySelector {
|
|
var keySelectors []*telemetrytypes.FieldKeySelector
|
|
|
|
// Add selectors for aggregation expressions
|
|
for _, agg := range b.operator.Aggregations {
|
|
selectors := querybuilder.QueryStringToKeysSelectors(agg.Expression)
|
|
keySelectors = append(keySelectors, selectors...)
|
|
}
|
|
|
|
// Add selectors for filter expression
|
|
if b.operator.Filter != nil && b.operator.Filter.Expression != "" {
|
|
selectors := querybuilder.QueryStringToKeysSelectors(b.operator.Filter.Expression)
|
|
keySelectors = append(keySelectors, selectors...)
|
|
}
|
|
|
|
// Add selectors for group by fields
|
|
for _, gb := range b.operator.GroupBy {
|
|
selectors := querybuilder.QueryStringToKeysSelectors(gb.TelemetryFieldKey.Name)
|
|
keySelectors = append(keySelectors, selectors...)
|
|
}
|
|
|
|
// Add selectors for order by fields
|
|
for _, order := range b.operator.Order {
|
|
keySelectors = append(keySelectors, &telemetrytypes.FieldKeySelector{
|
|
Name: order.Key.Name,
|
|
Signal: telemetrytypes.SignalTraces,
|
|
FieldContext: order.Key.FieldContext,
|
|
FieldDataType: order.Key.FieldDataType,
|
|
})
|
|
}
|
|
|
|
// Set signal type for all selectors
|
|
for i := range keySelectors {
|
|
keySelectors[i].Signal = telemetrytypes.SignalTraces
|
|
}
|
|
|
|
return keySelectors
|
|
}
|
|
|
|
func (b *traceOperatorCTEBuilder) buildTimeSeriesQuery(selectFromCTE string) (*qbtypes.Statement, error) {
|
|
sb := sqlbuilder.NewSelectBuilder()
|
|
|
|
stepIntervalSeconds := int64(b.operator.StepInterval.Seconds())
|
|
if stepIntervalSeconds <= 0 {
|
|
timeRangeSeconds := (b.end - b.start) / querybuilder.NsToSeconds
|
|
if timeRangeSeconds > 3600 {
|
|
stepIntervalSeconds = 300
|
|
} else if timeRangeSeconds > 1800 {
|
|
stepIntervalSeconds = 120
|
|
} else {
|
|
stepIntervalSeconds = 60
|
|
}
|
|
|
|
b.stmtBuilder.logger.WarnContext(b.ctx,
|
|
"trace operator stepInterval not set, using default",
|
|
"defaultSeconds", stepIntervalSeconds)
|
|
}
|
|
|
|
sb.Select(fmt.Sprintf(
|
|
"toStartOfInterval(timestamp, INTERVAL %d SECOND) AS ts",
|
|
stepIntervalSeconds,
|
|
))
|
|
|
|
// Get keys for field mapping
|
|
keySelectors := b.getKeySelectors()
|
|
keys, _, err := b.stmtBuilder.metadataStore.GetKeysMulti(b.ctx, keySelectors)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
var allGroupByArgs []any
|
|
|
|
// Add group by fields using proper field mapper
|
|
for _, gb := range b.operator.GroupBy {
|
|
expr, args, err := querybuilder.CollisionHandledFinalExpr(
|
|
b.ctx,
|
|
&gb.TelemetryFieldKey,
|
|
b.stmtBuilder.fm,
|
|
b.stmtBuilder.cb,
|
|
keys,
|
|
telemetrytypes.FieldDataTypeString,
|
|
)
|
|
if err != nil {
|
|
return nil, errors.NewInvalidInputf(
|
|
errors.CodeInvalidInput,
|
|
"failed to map group by field '%s': %v",
|
|
gb.TelemetryFieldKey.Name,
|
|
err,
|
|
)
|
|
}
|
|
colExpr := fmt.Sprintf("toString(%s) AS `%s`", expr, gb.TelemetryFieldKey.Name)
|
|
allGroupByArgs = append(allGroupByArgs, args...)
|
|
sb.SelectMore(colExpr)
|
|
}
|
|
|
|
// Add aggregations using proper aggregation expression rewriter
|
|
var allAggChArgs []any
|
|
for i, agg := range b.operator.Aggregations {
|
|
rewritten, chArgs, err := b.stmtBuilder.aggExprRewriter.Rewrite(
|
|
b.ctx,
|
|
agg.Expression,
|
|
uint64(stepIntervalSeconds), // Use validated step interval
|
|
keys,
|
|
)
|
|
if err != nil {
|
|
return nil, errors.NewInvalidInputf(
|
|
errors.CodeInvalidInput,
|
|
"failed to rewrite aggregation expression '%s': %v",
|
|
agg.Expression,
|
|
err,
|
|
)
|
|
}
|
|
allAggChArgs = append(allAggChArgs, chArgs...)
|
|
|
|
// Use alias if provided, otherwise use default naming
|
|
alias := fmt.Sprintf("__result_%d", i)
|
|
if agg.Alias != "" {
|
|
alias = agg.Alias
|
|
}
|
|
|
|
sb.SelectMore(fmt.Sprintf("%s AS %s", rewritten, alias))
|
|
}
|
|
|
|
sb.From(selectFromCTE)
|
|
|
|
// Group by time and all group by fields
|
|
sb.GroupBy("ts")
|
|
if len(b.operator.GroupBy) > 0 {
|
|
groupByKeys := make([]string, len(b.operator.GroupBy))
|
|
for i, gb := range b.operator.GroupBy {
|
|
groupByKeys[i] = fmt.Sprintf("`%s`", gb.TelemetryFieldKey.Name)
|
|
}
|
|
sb.GroupBy(groupByKeys...)
|
|
}
|
|
|
|
// Combine all arguments
|
|
combinedArgs := append(allGroupByArgs, allAggChArgs...)
|
|
|
|
sql, args := sb.BuildWithFlavor(sqlbuilder.ClickHouse, combinedArgs...)
|
|
return &qbtypes.Statement{
|
|
Query: sql,
|
|
Args: args,
|
|
}, nil
|
|
}
|
|
|
|
func (b *traceOperatorCTEBuilder) buildScalarQuery(selectFromCTE string) (*qbtypes.Statement, error) {
|
|
sb := sqlbuilder.NewSelectBuilder()
|
|
|
|
// Get keys for field mapping
|
|
keySelectors := b.getKeySelectors()
|
|
keys, _, err := b.stmtBuilder.metadataStore.GetKeysMulti(b.ctx, keySelectors)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
var allGroupByArgs []any
|
|
|
|
// Add group by fields using proper field mapper
|
|
for _, gb := range b.operator.GroupBy {
|
|
expr, args, err := querybuilder.CollisionHandledFinalExpr(
|
|
b.ctx,
|
|
&gb.TelemetryFieldKey,
|
|
b.stmtBuilder.fm,
|
|
b.stmtBuilder.cb,
|
|
keys,
|
|
telemetrytypes.FieldDataTypeString,
|
|
)
|
|
if err != nil {
|
|
return nil, errors.NewInvalidInputf(
|
|
errors.CodeInvalidInput,
|
|
"failed to map group by field '%s': %v",
|
|
gb.TelemetryFieldKey.Name,
|
|
err,
|
|
)
|
|
}
|
|
colExpr := fmt.Sprintf("toString(%s) AS `%s`", expr, gb.TelemetryFieldKey.Name)
|
|
allGroupByArgs = append(allGroupByArgs, args...)
|
|
sb.SelectMore(colExpr)
|
|
}
|
|
|
|
rateInterval := (b.end - b.start) / querybuilder.NsToSeconds
|
|
|
|
var allAggChArgs []any
|
|
for i, agg := range b.operator.Aggregations {
|
|
rewritten, chArgs, err := b.stmtBuilder.aggExprRewriter.Rewrite(
|
|
b.ctx,
|
|
agg.Expression,
|
|
rateInterval,
|
|
keys,
|
|
)
|
|
if err != nil {
|
|
return nil, errors.NewInvalidInputf(
|
|
errors.CodeInvalidInput,
|
|
"failed to rewrite aggregation expression '%s': %v",
|
|
agg.Expression,
|
|
err,
|
|
)
|
|
}
|
|
allAggChArgs = append(allAggChArgs, chArgs...)
|
|
|
|
// Use alias if provided, otherwise use default naming
|
|
alias := fmt.Sprintf("__result_%d", i)
|
|
if agg.Alias != "" {
|
|
alias = agg.Alias
|
|
}
|
|
|
|
sb.SelectMore(fmt.Sprintf("%s AS %s", rewritten, alias))
|
|
}
|
|
|
|
traceSubquery := fmt.Sprintf("SELECT DISTINCT trace_id FROM %s", selectFromCTE)
|
|
|
|
sb.Select(
|
|
"any(root.timestamp) as timestamp", // Add timestamp for consistent response structure
|
|
"any(root.serviceName) as `subQuery.serviceName`",
|
|
"any(root.name) as `subQuery.name`",
|
|
"count(bs.span_id) as span_count",
|
|
"any(root.durationNano) as `subQuery.durationNano`",
|
|
"result.trace_id as `subQuery.traceID`",
|
|
)
|
|
|
|
sb.From(fmt.Sprintf("(%s) result", traceSubquery))
|
|
sb.JoinWithOption(sqlbuilder.InnerJoin, "base_spans bs", "result.trace_id = bs.trace_id")
|
|
sb.JoinWithOption(sqlbuilder.InnerJoin, "base_spans root",
|
|
"result.trace_id = root.trace_id AND root.parent_span_id = ''")
|
|
|
|
sb.GroupBy("result.trace_id")
|
|
if len(b.operator.GroupBy) > 0 {
|
|
groupByKeys := make([]string, len(b.operator.GroupBy))
|
|
for i, gb := range b.operator.GroupBy {
|
|
groupByKeys[i] = fmt.Sprintf("`%s`", gb.TelemetryFieldKey.Name)
|
|
}
|
|
sb.GroupBy(groupByKeys...)
|
|
}
|
|
|
|
// Handle ordering
|
|
orderApplied := false
|
|
for _, orderBy := range b.operator.Order {
|
|
switch orderBy.Key.Name {
|
|
case qbtypes.OrderByTraceDuration.StringValue():
|
|
sb.OrderBy(fmt.Sprintf("`subQuery.durationNano` %s", orderBy.Direction.StringValue()))
|
|
orderApplied = true
|
|
case qbtypes.OrderBySpanCount.StringValue():
|
|
sb.OrderBy(fmt.Sprintf("span_count %s", orderBy.Direction.StringValue()))
|
|
orderApplied = true
|
|
case "timestamp":
|
|
// For timestamp ordering in scalar queries, use timestamp field
|
|
sb.OrderBy(fmt.Sprintf("timestamp %s", orderBy.Direction.StringValue()))
|
|
orderApplied = true
|
|
default:
|
|
// For aggregation results or other fields
|
|
aggIndex := -1
|
|
for i, agg := range b.operator.Aggregations {
|
|
if orderBy.Key.Name == agg.Alias || orderBy.Key.Name == fmt.Sprintf("__result_%d", i) {
|
|
aggIndex = i
|
|
break
|
|
}
|
|
}
|
|
if aggIndex >= 0 {
|
|
alias := fmt.Sprintf("__result_%d", aggIndex)
|
|
if b.operator.Aggregations[aggIndex].Alias != "" {
|
|
alias = b.operator.Aggregations[aggIndex].Alias
|
|
}
|
|
sb.OrderBy(fmt.Sprintf("%s %s", alias, orderBy.Direction.StringValue()))
|
|
orderApplied = true
|
|
} else {
|
|
b.stmtBuilder.logger.WarnContext(b.ctx,
|
|
"ignoring order by field that's not available in scalar trace context",
|
|
"field", orderBy.Key.Name)
|
|
}
|
|
}
|
|
}
|
|
|
|
// Default order by trace duration DESC if no order specified
|
|
if !orderApplied {
|
|
sb.OrderBy("`subQuery.durationNano` DESC")
|
|
}
|
|
|
|
// Add limit if specified
|
|
if b.operator.Limit > 0 {
|
|
sb.Limit(b.operator.Limit)
|
|
}
|
|
|
|
// Combine all arguments
|
|
combinedArgs := append(allGroupByArgs, allAggChArgs...)
|
|
|
|
sql, args := sb.BuildWithFlavor(sqlbuilder.ClickHouse, combinedArgs...)
|
|
return &qbtypes.Statement{
|
|
Query: sql,
|
|
Args: args,
|
|
}, nil
|
|
}
|
|
|
|
func (b *traceOperatorCTEBuilder) addCTE(name, sql string, args []any, dependsOn []string) {
|
|
b.ctes = append(b.ctes, cteNode{
|
|
name: name,
|
|
sql: sql,
|
|
args: args,
|
|
dependsOn: dependsOn,
|
|
})
|
|
b.cteNameToIndex[name] = len(b.ctes) - 1
|
|
}
|