From f527396d7e75e02ec36afb45a52802b9be5cce85 Mon Sep 17 00:00:00 2001 From: Krzysztof Kiewicz Date: Fri, 1 Nov 2024 21:16:05 +0100 Subject: [PATCH] Quickfix to remove nondeterminism for pipeline aggr with multiple parents (#943) All dashboards work after this Again, hacky, but when we implement fully correct `bucket_script`, hacks will disappear. --- .../auto_date_histogram.go | 2 +- .../pipeline_aggregations/bucket_script.go | 10 +- quesma/queryparser/pipeline_aggregations.go | 15 +- quesma/testdata/clients/clover.go | 170 ++++++++++++++++++ 4 files changed, 186 insertions(+), 11 deletions(-) diff --git a/quesma/model/bucket_aggregations/auto_date_histogram.go b/quesma/model/bucket_aggregations/auto_date_histogram.go index d46c8ec33..287d641ee 100644 --- a/quesma/model/bucket_aggregations/auto_date_histogram.go +++ b/quesma/model/bucket_aggregations/auto_date_histogram.go @@ -39,7 +39,7 @@ func (query *AutoDateHistogram) TranslateSqlResponseToJson(rows []model.QueryRes return model.JsonMap{ "buckets": []model.JsonMap{{ "key": query.key, - "key_as_string": time.UnixMilli(query.key).Format("2006-01-02T15:04:05.000-07:00"), + "key_as_string": time.UnixMilli(query.key).UTC().Format("2006-01-02T15:04:05.000"), "doc_count": rows[0].LastColValue(), }}, "interval": "100y", // seems working for bucketsNr=1 case. Will have to be changed for other cases. diff --git a/quesma/model/pipeline_aggregations/bucket_script.go b/quesma/model/pipeline_aggregations/bucket_script.go index d4b5b4f0f..055636271 100644 --- a/quesma/model/pipeline_aggregations/bucket_script.go +++ b/quesma/model/pipeline_aggregations/bucket_script.go @@ -80,11 +80,13 @@ func (query BucketScript) findFilterValue(rows []model.QueryResultRow, filterNam for _, row := range rows { for _, col := range row.Cols { colName := col.ColName - if !strings.HasSuffix(colName, "_col_0") { - continue + switch { // remove possible suffix + case strings.HasSuffix(colName, "_col_0"): + colName = strings.TrimSuffix(colName, "_col_0") + case strings.HasSuffix(colName, "__count"): + colName = strings.TrimSuffix(colName, "__count") } - colName = strings.TrimSuffix(colName, "_col_0") - if strings.HasSuffix(colName, "-"+filterName) { + if strings.HasSuffix(colName, filterName) { return util.ExtractNumeric64(col.Value) } } diff --git a/quesma/queryparser/pipeline_aggregations.go b/quesma/queryparser/pipeline_aggregations.go index f3a007ad5..dc76b6e9d 100644 --- a/quesma/queryparser/pipeline_aggregations.go +++ b/quesma/queryparser/pipeline_aggregations.go @@ -6,6 +6,7 @@ import ( "quesma/logger" "quesma/model" "quesma/model/pipeline_aggregations" + "quesma/util" "strings" ) @@ -225,14 +226,16 @@ func (cw *ClickhouseQueryTranslator) parseBucketsPath(shouldBeQueryMap any, aggr case QueryMap: // TODO: handle arbitrary nr of keys (and arbitrary scripts, because we also handle only one special case) if len(bucketsPath) == 1 || len(bucketsPath) == 2 { - for _, bucketPath := range bucketsPath { - if _, ok = bucketPath.(string); !ok { - logger.WarnWithCtx(cw.Ctx).Msgf("buckets_path is not a map with string values, but %T. Skipping this aggregation", bucketPath) + // We return just 1 value here (for smallest key) (determinism here important, returning any of them is incorrect) + // Seems iffy, but works for all cases so far. + // After fixing the TODO above, it should also get fixed. + for _, key := range util.MapKeysSorted(bucketsPath) { + if path, ok := bucketsPath[key].(string); ok { + return path, true + } else { + logger.WarnWithCtx(cw.Ctx).Msgf("buckets_path is not a map with string values, but %T. Skipping this aggregation", path) return } - // Kinda weird to return just the first value, but seems working on all cases so far. - // After fixing the TODO above, it should also get fixed. - return bucketPath.(string), true } } else { logger.WarnWithCtx(cw.Ctx).Msgf("buckets_path is not a map with one or two keys, but %d. Skipping this aggregation", len(bucketsPath)) diff --git a/quesma/testdata/clients/clover.go b/quesma/testdata/clients/clover.go index 32657d218..365b45dfc 100644 --- a/quesma/testdata/clients/clover.go +++ b/quesma/testdata/clients/clover.go @@ -473,4 +473,174 @@ var CloverTests = []testdata.AggregationTestCase{ fromUnixTimestamp64Milli(1728635627125))`, AdditionalAcceptableDifference: []string{"key_as_string"}, // timezone differences between local and github runs... There's always 2h difference between those, need to investigate. Maybe come back to .UTC() so there's no "+timezone" (e.g. +02:00)? }, + { // [6] + TestName: "bucket_script with multiple buckets_path", + QueryRequestJson: ` + { + "aggs": { + "timeseries": { + "aggs": { + "f2": { + "bucket_script": { + "buckets_path": { + "denominator": "f2-denominator>_count", + "numerator": "f2-numerator>_count" + }, + "script": "params.numerator != null && params.denominator != null && params.denominator != 0 ? params.numerator / params.denominator : 0" + } + }, + "f2-denominator": { + "filter": { + "bool": { + "filter": [], + "must": [], + "must_not": [], + "should": [] + } + } + }, + "f2-numerator": { + "filter": { + "bool": { + "filter": [], + "must": [ + { + "query_string": { + "analyze_wildcard": true, + "query": "!_exists_:a.b_str" + } + } + ], + "must_not": [], + "should": [] + } + } + } + }, + "auto_date_histogram": { + "buckets": 1, + "field": "@timestamp" + }, + "meta": { + "indexPatternString": "ab*", + "intervalString": "9075600000ms", + "normalized": true, + "panelId": "f0", + "seriesId": "f1", + "timeField": "@timestamp" + } + } + }, + "query": { + "bool": { + "filter": [], + "must": [ + { + "range": { + "@timestamp": { + "format": "strict_date_optional_time", + "gte": "2024-07-19T14:38:24.783Z", + "lte": "2024-11-01T15:38:24.783Z" + } + } + }, + { + "bool": { + "filter": [], + "must": [], + "must_not": [], + "should": [] + } + }, + { + "bool": { + "filter": [], + "must": [], + "must_not": [], + "should": [] + } + } + ], + "must_not": [], + "should": [] + } + }, + "runtime_mappings": {}, + "size": 0, + "timeout": "30000ms", + "track_total_hits": true + }`, + ExpectedResponse: ` + { + "completion_status": 200, + "completion_time_in_millis": 1730475504882, + "expiration_time_in_millis": 1730898929116, + "id": "quesma_async_0192e860-b4cb-7be4-a193-43d38686c80d", + "is_partial": false, + "is_running": false, + "response": { + "_shards": { + "failed": 0, + "skipped": 0, + "successful": 1, + "total": 1 + }, + "aggregations": { + "timeseries": { + "buckets": [ + { + "f2": { + "value": 0.178 + }, + "f2-denominator": { + "doc_count": 1000 + }, + "f2-numerator": { + "doc_count": 178 + }, + "doc_count": 1000, + "key": 1721399904783, + "key_as_string": "2024-07-19T14:38:24.783" + } + ], + "interval": "100y", + "meta": { + "indexPatternString": "ab*", + "intervalString": "9075600000ms", + "normalized": true, + "panelId": "f0", + "seriesId": "f1", + "timeField": "@timestamp" + } + } + }, + "hits": { + "hits": [], + "max_score": null, + "total": { + "relation": "eq", + "value": 1000 + } + }, + "timed_out": false, + "took": 0 + }, + "start_time_in_millis": 0 + }`, + ExpectedPancakeResults: []model.QueryResultRow{ + {Cols: []model.QueryResultCol{ + model.NewQueryResultCol("aggr__timeseries__count", int64(1000)), + model.NewQueryResultCol("metric__timeseries__f2-numerator_col_0", int64(178)), + model.NewQueryResultCol("aggr__timeseries__f2-denominator__count", int64(1000)), + }}, + }, + ExpectedPancakeSQL: ` + SELECT count(*) AS "aggr__timeseries__count", + countIf(NOT ("a.b_str" IS NOT NULL)) AS + "metric__timeseries__f2-numerator_col_0", + countIf(true) AS "aggr__timeseries__f2-denominator__count" + FROM __quesma_table_name + WHERE ("@timestamp">=fromUnixTimestamp64Milli(1721399904783) AND "@timestamp"<= + fromUnixTimestamp64Milli(1730475504783))`, + }, }