2018-05-14 12:36:24 +00:00
|
|
|
// Copyright 2018 Prometheus Team
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
|
2019-09-16 08:56:29 +00:00
|
|
|
package labels
|
2017-03-16 10:16:10 +00:00
|
|
|
|
|
|
|
import (
|
|
|
|
"regexp"
|
|
|
|
"strings"
|
2020-12-23 20:48:56 +00:00
|
|
|
"unicode/utf8"
|
2020-06-02 14:13:31 +00:00
|
|
|
|
|
|
|
"github.com/pkg/errors"
|
2017-03-16 10:16:10 +00:00
|
|
|
)
|
|
|
|
|
|
|
|
var (
|
2021-06-23 09:05:49 +00:00
|
|
|
// '=~' has to come before '=' because otherwise only the '='
|
|
|
|
// will be consumed, and the '~' will be part of the 3rd token.
|
|
|
|
re = regexp.MustCompile(`^\s*([a-zA-Z_:][a-zA-Z0-9_:]*)\s*(=~|=|!=|!~)\s*((?s).*?)\s*$`)
|
2019-09-16 08:56:29 +00:00
|
|
|
typeMap = map[string]MatchType{
|
|
|
|
"=": MatchEqual,
|
|
|
|
"!=": MatchNotEqual,
|
|
|
|
"=~": MatchRegexp,
|
|
|
|
"!~": MatchNotRegexp,
|
2017-03-16 10:16:10 +00:00
|
|
|
}
|
|
|
|
)
|
|
|
|
|
2020-12-23 19:47:35 +00:00
|
|
|
// ParseMatchers parses a comma-separated list of Matchers. A leading '{' and/or
|
|
|
|
// a trailing '}' is optional and will be trimmed before further
|
|
|
|
// parsing. Individual Matchers are separated by commas outside of quoted parts
|
2021-01-13 17:49:06 +00:00
|
|
|
// of the input string. Those commas may be surrounded by whitespace. Parts of the
|
2020-12-23 19:47:35 +00:00
|
|
|
// string inside unescaped double quotes ('"…"') are considered quoted (and
|
|
|
|
// commas don't act as separators there). If double quotes are escaped with a
|
|
|
|
// single backslash ('\"'), they are ignored for the purpose of identifying
|
|
|
|
// quoted parts of the input string. If the input string, after trimming the
|
|
|
|
// optional trailing '}', ends with a comma, followed by optional whitespace,
|
|
|
|
// this comma and whitespace will be trimmed.
|
|
|
|
//
|
|
|
|
// Examples for valid input strings:
|
|
|
|
// {foo = "bar", dings != "bums", }
|
|
|
|
// foo=bar,dings!=bums
|
2021-01-13 17:49:06 +00:00
|
|
|
// foo=bar, dings!=bums
|
2020-12-23 19:47:35 +00:00
|
|
|
// {quote="She said: \"Hi, ladies! That's gender-neutral…\""}
|
|
|
|
// statuscode=~"5.."
|
|
|
|
//
|
2021-01-13 17:49:06 +00:00
|
|
|
// See ParseMatcher for details on how an individual Matcher is parsed.
|
2019-09-16 08:56:29 +00:00
|
|
|
func ParseMatchers(s string) ([]*Matcher, error) {
|
|
|
|
matchers := []*Matcher{}
|
2019-01-04 14:37:33 +00:00
|
|
|
s = strings.TrimPrefix(s, "{")
|
|
|
|
s = strings.TrimSuffix(s, "}")
|
2017-03-16 10:16:10 +00:00
|
|
|
|
2020-12-23 21:37:12 +00:00
|
|
|
var (
|
|
|
|
insideQuotes bool
|
|
|
|
escaped bool
|
|
|
|
token strings.Builder
|
|
|
|
tokens []string
|
|
|
|
)
|
2018-05-28 09:36:47 +00:00
|
|
|
for _, r := range s {
|
2020-12-23 21:37:12 +00:00
|
|
|
switch r {
|
|
|
|
case ',':
|
|
|
|
if !insideQuotes {
|
|
|
|
tokens = append(tokens, token.String())
|
|
|
|
token.Reset()
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
case '"':
|
|
|
|
if !escaped {
|
|
|
|
insideQuotes = !insideQuotes
|
|
|
|
} else {
|
|
|
|
escaped = false
|
|
|
|
}
|
|
|
|
case '\\':
|
|
|
|
escaped = !escaped
|
|
|
|
default:
|
|
|
|
escaped = false
|
2018-05-28 09:36:47 +00:00
|
|
|
}
|
2020-12-23 21:37:12 +00:00
|
|
|
token.WriteRune(r)
|
2018-05-28 09:36:47 +00:00
|
|
|
}
|
2020-12-23 21:37:12 +00:00
|
|
|
if s := strings.TrimSpace(token.String()); s != "" {
|
|
|
|
tokens = append(tokens, s)
|
2018-05-28 09:36:47 +00:00
|
|
|
}
|
|
|
|
for _, token := range tokens {
|
2019-09-16 08:56:29 +00:00
|
|
|
m, err := ParseMatcher(token)
|
2017-03-16 10:16:10 +00:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
matchers = append(matchers, m)
|
|
|
|
}
|
2018-05-28 09:36:47 +00:00
|
|
|
|
2017-03-16 10:16:10 +00:00
|
|
|
return matchers, nil
|
|
|
|
}
|
|
|
|
|
2020-12-23 19:47:35 +00:00
|
|
|
// ParseMatcher parses a matcher with a syntax inspired by PromQL and
|
|
|
|
// OpenMetrics. This syntax is convenient to describe filters and selectors in
|
|
|
|
// UIs and config files. To support the interactive nature of the use cases, the
|
|
|
|
// parser is in various aspects fairly tolerant.
|
|
|
|
//
|
|
|
|
// The syntax of a matcher consists of three tokens: (1) A valid Prometheus
|
|
|
|
// label name. (2) One of '=', '!=', '=~', or '!~', with the same meaning as
|
|
|
|
// known from PromQL selectors. (3) A UTF-8 string, which may be enclosed in
|
|
|
|
// double quotes. Before or after each token, there may be any amount of
|
|
|
|
// whitespace, which will be discarded. The 3rd token may be the empty
|
|
|
|
// string. Within the 3rd token, OpenMetrics escaping rules apply: '\"' for a
|
|
|
|
// double-quote, '\n' for a line feed, '\\' for a literal backslash. Unescaped
|
|
|
|
// '"' must not occur inside the 3rd token (only as the 1st or last
|
|
|
|
// character). However, literal line feed characters are tolerated, as are
|
|
|
|
// single '\' characters not followed by '\', 'n', or '"'. They act as a literal
|
|
|
|
// backslash in that case.
|
2021-06-23 09:05:49 +00:00
|
|
|
func ParseMatcher(s string) (_ *Matcher, err error) {
|
2017-04-20 09:04:17 +00:00
|
|
|
ms := re.FindStringSubmatch(s)
|
2020-12-23 20:48:56 +00:00
|
|
|
if len(ms) == 0 {
|
2020-06-02 14:13:31 +00:00
|
|
|
return nil, errors.Errorf("bad matcher format: %s", s)
|
2017-04-20 09:04:17 +00:00
|
|
|
}
|
|
|
|
|
2020-12-23 20:48:56 +00:00
|
|
|
var (
|
2022-09-30 10:51:17 +00:00
|
|
|
rawValue = ms[3]
|
2021-06-23 09:05:49 +00:00
|
|
|
value strings.Builder
|
|
|
|
escaped bool
|
|
|
|
expectTrailingQuote bool
|
2020-12-23 20:48:56 +00:00
|
|
|
)
|
2019-09-16 08:56:29 +00:00
|
|
|
|
2022-09-30 10:51:17 +00:00
|
|
|
if strings.HasPrefix(rawValue, "\"") {
|
2021-06-23 09:05:49 +00:00
|
|
|
rawValue = strings.TrimPrefix(rawValue, "\"")
|
|
|
|
expectTrailingQuote = true
|
|
|
|
}
|
|
|
|
|
2020-12-23 20:48:56 +00:00
|
|
|
if !utf8.ValidString(rawValue) {
|
2021-06-23 09:05:49 +00:00
|
|
|
return nil, errors.Errorf("matcher value not valid UTF-8: %s", ms[3])
|
2019-09-16 08:56:29 +00:00
|
|
|
}
|
2017-04-20 09:04:17 +00:00
|
|
|
|
2020-12-23 20:48:56 +00:00
|
|
|
// Unescape the rawValue:
|
|
|
|
for i, r := range rawValue {
|
|
|
|
if escaped {
|
|
|
|
escaped = false
|
|
|
|
switch r {
|
|
|
|
case 'n':
|
|
|
|
value.WriteByte('\n')
|
|
|
|
case '"', '\\':
|
|
|
|
value.WriteRune(r)
|
|
|
|
default:
|
|
|
|
// This was a spurious escape, so treat the '\' as literal.
|
|
|
|
value.WriteByte('\\')
|
|
|
|
value.WriteRune(r)
|
|
|
|
}
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
switch r {
|
|
|
|
case '\\':
|
|
|
|
if i < len(rawValue)-1 {
|
|
|
|
escaped = true
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
// '\' encountered as last byte. Treat it as literal.
|
|
|
|
value.WriteByte('\\')
|
|
|
|
case '"':
|
2021-06-23 09:05:49 +00:00
|
|
|
if !expectTrailingQuote || i < len(rawValue)-1 {
|
|
|
|
return nil, errors.Errorf("matcher value contains unescaped double quote: %s", ms[3])
|
2020-12-23 20:48:56 +00:00
|
|
|
}
|
2021-06-23 09:05:49 +00:00
|
|
|
expectTrailingQuote = false
|
2020-12-23 20:48:56 +00:00
|
|
|
default:
|
|
|
|
value.WriteRune(r)
|
|
|
|
}
|
2017-04-20 09:04:17 +00:00
|
|
|
}
|
|
|
|
|
2021-06-23 09:05:49 +00:00
|
|
|
if expectTrailingQuote {
|
|
|
|
return nil, errors.Errorf("matcher value contains unescaped double quote: %s", ms[3])
|
|
|
|
}
|
|
|
|
|
2020-12-23 20:48:56 +00:00
|
|
|
return NewMatcher(typeMap[ms[2]], ms[1], value.String())
|
2017-04-20 09:04:17 +00:00
|
|
|
}
|