Skip to content

Commit

Permalink
feat(config): add 'wildcard-min-distance' config option (#296)
Browse files Browse the repository at this point in the history
  • Loading branch information
mchrome authored Dec 16, 2024
1 parent c608a1c commit a088cee
Show file tree
Hide file tree
Showing 8 changed files with 317 additions and 2 deletions.
1 change: 1 addition & 0 deletions config/config.go
Original file line number Diff line number Diff line change
Expand Up @@ -221,6 +221,7 @@ type ClickHouse struct {
TagsAdaptiveQueries int `toml:"tags-adaptive-queries" json:"tags-adaptive-queries" comment:"Tags adaptive queries (based on load average) for increase/decrease concurrent queries"`
TagsLimiter limiter.ServerLimiter `toml:"-" json:"-"`

WildcardMinDistance int `toml:"wildcard-min-distance" json:"wildcard-min-distance" comment:"If a wildcard appears both at the start and the end of a plain query at a distance (in terms of nodes) less than wildcard-min-distance, then it will be discarded. This parameter can be used to discard expensive queries."`
TagsMinInQuery int `toml:"tags-min-in-query" json:"tags-min-in-query" comment:"Minimum tags in seriesByTag query"`
TagsMinInAutocomplete int `toml:"tags-min-in-autocomplete" json:"tags-min-in-autocomplete" comment:"Minimum tags in autocomplete query"`

Expand Down
2 changes: 2 additions & 0 deletions doc/config.md
Original file line number Diff line number Diff line change
Expand Up @@ -311,6 +311,8 @@ Only one tag used as filter for index field Tag1, see graphite_tagged table [str
tags-concurrent-queries = 0
# Tags adaptive queries (based on load average) for increase/decrease concurrent queries
tags-adaptive-queries = 0
# If a wildcard appears both at the start and the end of a plain query at a distance (in terms of nodes) less than wildcard-min-distance, then it will be discarded. This parameter can be used to discard expensive queries.
wildcard-min-distance = 0
# Minimum tags in seriesByTag query
tags-min-in-query = 0
# Minimum tags in autocomplete query
Expand Down
11 changes: 9 additions & 2 deletions finder/index.go
Original file line number Diff line number Diff line change
Expand Up @@ -155,15 +155,22 @@ func (idx *IndexFinder) whereFilter(query string, from int64, until int64) *wher
return w
}

func (idx *IndexFinder) validatePlainQuery(query string) error {
func (idx *IndexFinder) validatePlainQuery(query string, wildcardMinDistance int) error {
if where.HasUnmatchedBrackets(query) {
return errs.NewErrorWithCode("query has unmatched brackets", http.StatusBadRequest)
}

var maxDist = where.MaxWildcardDistance(query)

if maxDist != -1 && maxDist < wildcardMinDistance {
return errs.NewErrorWithCode("query has wildcards way too early at the start and at the end of it", http.StatusBadRequest)
}

return nil
}

func (idx *IndexFinder) Execute(ctx context.Context, config *config.Config, query string, from int64, until int64, stat *FinderStat) (err error) {
err = idx.validatePlainQuery(query)
err = idx.validatePlainQuery(query, config.ClickHouse.WildcardMinDistance)
if err != nil {
return err
}
Expand Down
13 changes: 13 additions & 0 deletions pkg/where/where.go
Original file line number Diff line number Diff line change
Expand Up @@ -77,6 +77,19 @@ func IndexWildcard(target string) int {
return strings.IndexAny(target, "[]{}*?")
}

func MaxWildcardDistance(query string) int {
if !HasWildcard(query) {
return -1
}

w := IndexWildcard(query)
firstWildcardNode := strings.Count(query[:w], ".")
w = IndexLastWildcard(query)
lastWildcardNode := strings.Count(query[w:], ".")

return max(firstWildcardNode, lastWildcardNode)
}

func NonRegexpPrefix(expr string) string {
s := regexp.QuoteMeta(expr)
for i := 0; i < len(expr); i++ {
Expand Down
20 changes: 20 additions & 0 deletions pkg/where/where_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -72,3 +72,23 @@ func TestNonRegexpPrefix(t *testing.T) {
assert.Equal(t, test.prefix, prefix, testName)
}
}

func TestMaxWildcardDistance(t *testing.T) {
table := []struct {
glob string
dist int
}{
{`a.b.c.d.e`, -1},
{`test.*.foo.bar`, 2},
{`test.foo.*.*.bar.count`, 2},
{`test.foo.bar.*.bar.foo.test`, 3},
{`test.foo.bar.foobar.*.middle.*.foobar.bar.foo.test`, 4},
{`*.test.foo.bar.*`, 0},
}

for _, test := range table {
testName := fmt.Sprintf("glob: %#v", test.glob)
dist := MaxWildcardDistance(test.glob)
assert.Equal(t, test.dist, dist, testName)
}
}
45 changes: 45 additions & 0 deletions tests/wildcard_min_distance/carbon-clickhouse.conf.tpl
Original file line number Diff line number Diff line change
@@ -0,0 +1,45 @@
[common]

[data]
path = "/etc/carbon-clickhouse/data"
chunk-interval = "1s"
chunk-auto-interval = ""

[upload.graphite_index]
type = "index"
table = "graphite_index"
url = "{{ .CLICKHOUSE_URL }}/"
timeout = "2m30s"
cache-ttl = "1h"

[upload.graphite_tags]
type = "tagged"
table = "graphite_tags"
threads = 3
url = "{{ .CLICKHOUSE_URL }}/"
timeout = "2m30s"
cache-ttl = "1h"

[upload.graphite_reverse]
type = "points-reverse"
table = "graphite_reverse"
url = "{{ .CLICKHOUSE_URL }}/"
timeout = "2m30s"
zero-timestamp = false

[upload.graphite]
type = "points"
table = "graphite"
url = "{{ .CLICKHOUSE_URL }}/"
timeout = "2m30s"
zero-timestamp = false

[tcp]
listen = ":2003"
enabled = true
drop-future = "0s"
drop-past = "0s"

[logging]
file = "/etc/carbon-clickhouse/carbon-clickhouse.log"
level = "debug"
35 changes: 35 additions & 0 deletions tests/wildcard_min_distance/graphite-clickhouse.conf.tpl
Original file line number Diff line number Diff line change
@@ -0,0 +1,35 @@
[common]
listen = "{{ .GCH_ADDR }}"
max-cpu = 0
max-metrics-in-render-answer = 10000
max-metrics-per-target = 10000
headers-to-log = [ "X-Ctx-Carbonapi-Uuid" ]

[clickhouse]
url = "{{ .CLICKHOUSE_URL }}/?max_rows_to_read=500000000&max_result_bytes=1073741824&readonly=2&log_queries=1"
data-timeout = "30s"

wildcard-min-distance = 1

index-table = "graphite_index"
index-use-daily = true
index-timeout = "1m"
internal-aggregation = true

tagged-table = "graphite_tags"
tagged-autocomplete-days = 1

[[data-table]]
# # clickhouse table name
table = "graphite"
# # points in table are stored with reverse path
reverse = false
rollup-conf = "auto"

[[logging]]
logger = ""
file = "{{ .GCH_DIR }}/graphite-clickhouse.log"
level = "info"
encoding = "json"
encoding-time = "iso8601"
encoding-duration = "seconds"
192 changes: 192 additions & 0 deletions tests/wildcard_min_distance/test.toml
Original file line number Diff line number Diff line change
@@ -0,0 +1,192 @@
[test]
precision = "10s"

[[test.clickhouse]]
version = "21.3"
dir = "tests/clickhouse/rollup"

[[test.clickhouse]]
version = "22.8"
dir = "tests/clickhouse/rollup"

[[test.clickhouse]]
version = "24.2"
dir = "tests/clickhouse/rollup"

[test.carbon_clickhouse]
template = "carbon-clickhouse.conf.tpl"

[[test.graphite_clickhouse]]
template = "graphite-clickhouse.conf.tpl"

[[test.input]]
name = "team_one.prod.test.metric_one"
points = [{value = 1.0, time = "rnow-10"}]

[[test.input]]
name = "team_two.stage.test.metric_one"
points = [{value = 1.0, time = "rnow-10"}]

[[test.input]]
name = "team_one.dev.test.metric_two"
points = [{value = 1.0, time = "rnow-10"}]

[[test.input]]
name = "team_one.dev.nontest.metric_one"
points = [{value = 1.0, time = "rnow-10"}]

[[test.render_checks]]
from = "rnow-10"
until = "rnow+1"
timeout = "1h"
targets = [
"team_one.prod.test.metric_one",
]

[[test.render_checks.result]]
name = "team_one.prod.test.metric_one"
path = "team_one.prod.test.metric_one"
consolidation = "avg"
start = "rnow-10"
stop = "rnow+10"
step = 10
req_start = "rnow-10"
req_stop = "rnow+10"
values = [1.0, nan]


[[test.render_checks]]
from = "rnow-10"
until = "rnow+1"
timeout = "1h"
targets = [
"*.dev.test.metric_two",
]

[[test.render_checks.result]]
name = "team_one.dev.test.metric_two"
path = "*.dev.test.metric_two"
consolidation = "avg"
start = "rnow-10"
stop = "rnow+10"
step = 10
req_start = "rnow-10"
req_stop = "rnow+10"
values = [1.0, nan]

[[test.render_checks]]
from = "rnow-10"
until = "rnow+1"
timeout = "1h"
targets = [
"*.*.test.metric_one",
]

[[test.render_checks.result]]
name = "team_one.prod.test.metric_one"
path = "*.*.test.metric_one"
consolidation = "avg"
start = "rnow-10"
stop = "rnow+10"
step = 10
req_start = "rnow-10"
req_stop = "rnow+10"
values = [1.0, nan]

[[test.render_checks.result]]
name = "team_two.stage.test.metric_one"
path = "*.*.test.metric_one"
consolidation = "avg"
start = "rnow-10"
stop = "rnow+10"
step = 10
req_start = "rnow-10"
req_stop = "rnow+10"
values = [1.0, nan]


[[test.render_checks]]
from = "rnow-10"
until = "rnow+1"
timeout = "1h"
targets = [
"team_two.stage.test.*",
]

[[test.render_checks.result]]
name = "team_two.stage.test.metric_one"
path = "team_two.stage.test.*"
consolidation = "avg"
start = "rnow-10"
stop = "rnow+10"
step = 10
req_start = "rnow-10"
req_stop = "rnow+10"
values = [1.0, nan]

[[test.render_checks]]
from = "rnow-10"
until = "rnow+1"
timeout = "1h"
targets = [
"team_one.*.test.*",
]

[[test.render_checks.result]]
name = "team_one.prod.test.metric_one"
path = "team_one.*.test.*"
consolidation = "avg"
start = "rnow-10"
stop = "rnow+10"
step = 10
req_start = "rnow-10"
req_stop = "rnow+10"
values = [1.0, nan]

[[test.render_checks.result]]
name = "team_one.dev.test.metric_two"
path = "team_one.*.test.*"
consolidation = "avg"
start = "rnow-10"
stop = "rnow+10"
step = 10
req_start = "rnow-10"
req_stop = "rnow+10"
values = [1.0, nan]

[[test.render_checks]]
from = "rnow-10"
until = "rnow+1"
timeout = "1h"
targets = [
"*.prod.test.*",
]
error_regexp = "^400: query has wildcards way too early at the start and at the end of it"

[[test.render_checks]]
from = "rnow-10"
until = "rnow+1"
timeout = "1h"
targets = [
"*.*.test.*",
]
error_regexp = "^400: query has wildcards way too early at the start and at the end of it"

[[test.render_checks]]
from = "rnow-10"
until = "rnow+1"
timeout = "1h"
targets = [
"*.*.*.*",
]
error_regexp = "^400: query has wildcards way too early at the start and at the end of it"


[[test.render_checks]]
from = "rnow-10"
until = "rnow+1"
timeout = "1h"
targets = [
"*.*",
]
error_regexp = "^400: query has wildcards way too early at the start and at the end of it"

0 comments on commit a088cee

Please sign in to comment.