forked from mirrors/statsd_exporter
implement backtrack
Signed-off-by: Wangchong Zhou <fffonion@gmail.com>
This commit is contained in:
parent
dad04e9c8b
commit
c2742aa299
2 changed files with 136 additions and 73 deletions
|
@ -48,9 +48,7 @@ type mapperConfigDefaults struct {
|
||||||
}
|
}
|
||||||
|
|
||||||
type mappingState struct {
|
type mappingState struct {
|
||||||
transitionsMap map[string]*mappingState
|
transitions map[string]*mappingState
|
||||||
transitionsArray []*mappingState
|
|
||||||
// use to compare length upfront to avoid unnecessary backtrack
|
|
||||||
minRemainingLength int
|
minRemainingLength int
|
||||||
maxRemainingLength int
|
maxRemainingLength int
|
||||||
// result is nil unless there's a metric ends with this state
|
// result is nil unless there's a metric ends with this state
|
||||||
|
@ -76,9 +74,13 @@ type templateFormatter struct {
|
||||||
fmtString string
|
fmtString string
|
||||||
}
|
}
|
||||||
|
|
||||||
type fsmBacktrackRecord struct {
|
type fsmBacktrackStackCursor struct {
|
||||||
fieldIndex int
|
fieldIndex int
|
||||||
|
captureIdx int
|
||||||
|
currentCapture string
|
||||||
state *mappingState
|
state *mappingState
|
||||||
|
prev *fsmBacktrackStackCursor
|
||||||
|
next *fsmBacktrackStackCursor
|
||||||
}
|
}
|
||||||
|
|
||||||
type matchMetricType string
|
type matchMetricType string
|
||||||
|
@ -188,11 +190,11 @@ func (m *MetricMapper) InitFromYAMLString(fileContents string) error {
|
||||||
maxPossibleTransitions := len(n.Mappings)
|
maxPossibleTransitions := len(n.Mappings)
|
||||||
|
|
||||||
n.FSM = &mappingState{}
|
n.FSM = &mappingState{}
|
||||||
n.FSM.transitionsMap = make(map[string]*mappingState, 3)
|
n.FSM.transitions = make(map[string]*mappingState, 3)
|
||||||
for _, field := range []MetricType{MetricTypeCounter, MetricTypeTimer, MetricTypeGauge, ""} {
|
for _, field := range []MetricType{MetricTypeCounter, MetricTypeTimer, MetricTypeGauge, ""} {
|
||||||
state := &mappingState{}
|
state := &mappingState{}
|
||||||
(*state).transitionsMap = make(map[string]*mappingState, maxPossibleTransitions)
|
(*state).transitions = make(map[string]*mappingState, maxPossibleTransitions)
|
||||||
n.FSM.transitionsMap[string(field)] = state
|
n.FSM.transitions[string(field)] = state
|
||||||
}
|
}
|
||||||
|
|
||||||
for i := range n.Mappings {
|
for i := range n.Mappings {
|
||||||
|
@ -234,25 +236,25 @@ func (m *MetricMapper) InitFromYAMLString(fileContents string) error {
|
||||||
roots := []*mappingState{}
|
roots := []*mappingState{}
|
||||||
if currentMapping.MatchMetricType == "" {
|
if currentMapping.MatchMetricType == "" {
|
||||||
for _, metricType := range []MetricType{MetricTypeCounter, MetricTypeTimer, MetricTypeGauge, ""} {
|
for _, metricType := range []MetricType{MetricTypeCounter, MetricTypeTimer, MetricTypeGauge, ""} {
|
||||||
roots = append(roots, n.FSM.transitionsMap[string(metricType)])
|
roots = append(roots, n.FSM.transitions[string(metricType)])
|
||||||
}
|
}
|
||||||
} else {
|
} else {
|
||||||
roots = append(roots, n.FSM.transitionsMap[string(currentMapping.MatchMetricType)])
|
roots = append(roots, n.FSM.transitions[string(currentMapping.MatchMetricType)])
|
||||||
}
|
}
|
||||||
var captureCount int
|
var captureCount int
|
||||||
for _, root := range roots {
|
for _, root := range roots {
|
||||||
captureCount = 0
|
captureCount = 0
|
||||||
for i, field := range matchFields {
|
for i, field := range matchFields {
|
||||||
state, prs := root.transitionsMap[field]
|
state, prs := root.transitions[field]
|
||||||
if !prs {
|
if !prs {
|
||||||
state = &mappingState{}
|
state = &mappingState{}
|
||||||
(*state).transitionsMap = make(map[string]*mappingState, maxPossibleTransitions)
|
(*state).transitions = make(map[string]*mappingState, maxPossibleTransitions)
|
||||||
(*state).maxRemainingLength = len(matchFields) - i - 1
|
(*state).maxRemainingLength = len(matchFields) - i - 1
|
||||||
(*state).minRemainingLength = len(matchFields) - i - 1
|
(*state).minRemainingLength = len(matchFields) - i - 1
|
||||||
root.transitionsMap[field] = state
|
root.transitions[field] = state
|
||||||
// if this is last field, set result to currentMapping instance
|
// if this is last field, set result to currentMapping instance
|
||||||
if i == len(matchFields)-1 {
|
if i == len(matchFields)-1 {
|
||||||
root.transitionsMap[field].result = currentMapping
|
root.transitions[field].result = currentMapping
|
||||||
}
|
}
|
||||||
} else {
|
} else {
|
||||||
(*state).maxRemainingLength = max(len(matchFields)-i-1, (*state).maxRemainingLength)
|
(*state).maxRemainingLength = max(len(matchFields)-i-1, (*state).maxRemainingLength)
|
||||||
|
@ -322,7 +324,7 @@ func (m *MetricMapper) InitFromYAMLString(fileContents string) error {
|
||||||
|
|
||||||
m.Defaults = n.Defaults
|
m.Defaults = n.Defaults
|
||||||
m.Mappings = n.Mappings
|
m.Mappings = n.Mappings
|
||||||
if len(n.FSM.transitionsMap) > 0 || len(n.FSM.transitionsArray) > 0 {
|
if len(n.FSM.transitions) > 0 {
|
||||||
m.FSM = n.FSM
|
m.FSM = n.FSM
|
||||||
m.doRegex = n.doRegex
|
m.doRegex = n.doRegex
|
||||||
if m.dumpFSMPath != "" {
|
if m.dumpFSMPath != "" {
|
||||||
|
@ -335,7 +337,7 @@ func (m *MetricMapper) InitFromYAMLString(fileContents string) error {
|
||||||
backtrackingRules := findBacktrackRules(&n)
|
backtrackingRules := findBacktrackRules(&n)
|
||||||
if len(backtrackingRules) > 0 {
|
if len(backtrackingRules) > 0 {
|
||||||
for _, rule := range backtrackingRules {
|
for _, rule := range backtrackingRules {
|
||||||
log.Infof("backtracking required for match \"%s\", matching performance may be degraded\n", rule)
|
log.Warnf("backtracking required because of match \"%s\", matching performance may be degraded\n", rule)
|
||||||
}
|
}
|
||||||
m.FSMNeedsBacktracking = true
|
m.FSMNeedsBacktracking = true
|
||||||
}
|
}
|
||||||
|
@ -366,7 +368,7 @@ func findBacktrackRules(n *MetricMapper) []string {
|
||||||
if mapping.MatchType != MatchTypeGlob {
|
if mapping.MatchType != MatchTypeGlob {
|
||||||
continue
|
continue
|
||||||
}
|
}
|
||||||
l := len(mapping.Match)
|
l := len(strings.Split(mapping.Match, "."))
|
||||||
ruleByLength[l] = append(ruleByLength[l], mapping.Match)
|
ruleByLength[l] = append(ruleByLength[l], mapping.Match)
|
||||||
|
|
||||||
metricRe := strings.Replace(mapping.Match, ".", "\\.", -1)
|
metricRe := strings.Replace(mapping.Match, ".", "\\.", -1)
|
||||||
|
@ -375,6 +377,7 @@ func findBacktrackRules(n *MetricMapper) []string {
|
||||||
if err != nil {
|
if err != nil {
|
||||||
log.Warnf("invalid match %s. cannot compile regex in mapping: %v", mapping.Match, err)
|
log.Warnf("invalid match %s. cannot compile regex in mapping: %v", mapping.Match, err)
|
||||||
}
|
}
|
||||||
|
// put into array no matter there's error or not, we will skip later if regex is nil
|
||||||
ruleREByLength[l] = append(ruleREByLength[l], regex)
|
ruleREByLength[l] = append(ruleREByLength[l], regex)
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -393,9 +396,8 @@ func findBacktrackRules(n *MetricMapper) []string {
|
||||||
}
|
}
|
||||||
for _, r2 := range rules {
|
for _, r2 := range rules {
|
||||||
if r2 != r1 && len(re1.FindStringSubmatchIndex(r2)) > 0 {
|
if r2 != r1 && len(re1.FindStringSubmatchIndex(r2)) > 0 {
|
||||||
fmt.Println("subset", r1, "of", r2)
|
log.Warnf("rule \"%s\" is a super set of rule \"%s\", the later will never be matched\n", r1, r2)
|
||||||
hasSubset = true
|
hasSubset = true
|
||||||
break
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
if !hasSubset {
|
if !hasSubset {
|
||||||
|
@ -419,13 +421,13 @@ func dumpFSM(fileName string, root *mappingState) {
|
||||||
w.WriteString("node [ label=\"\",style=filled,fillcolor=white,shape=circle ]\n") // remove label of node
|
w.WriteString("node [ label=\"\",style=filled,fillcolor=white,shape=circle ]\n") // remove label of node
|
||||||
|
|
||||||
for idx < len(states) {
|
for idx < len(states) {
|
||||||
for field, transition := range states[idx].transitionsMap {
|
for field, transition := range states[idx].transitions {
|
||||||
states[len(states)] = transition
|
states[len(states)] = transition
|
||||||
w.WriteString(fmt.Sprintf("%d -> %d [label = \"%s\"];\n", idx, len(states)-1, field))
|
w.WriteString(fmt.Sprintf("%d -> %d [label = \"%s\"];\n", idx, len(states)-1, field))
|
||||||
if idx == 0 {
|
if idx == 0 {
|
||||||
// color for metric types
|
// color for metric types
|
||||||
w.WriteString(fmt.Sprintf("%d [color=\"#D6B656\",fillcolor=\"#FFF2CC\"];\n", len(states)-1))
|
w.WriteString(fmt.Sprintf("%d [color=\"#D6B656\",fillcolor=\"#FFF2CC\"];\n", len(states)-1))
|
||||||
} else if transition.transitionsMap == nil || len(transition.transitionsMap) == 0 {
|
} else if transition.transitions == nil || len(transition.transitions) == 0 {
|
||||||
// color for end state
|
// color for end state
|
||||||
w.WriteString(fmt.Sprintf("%d [color=\"#82B366\",fillcolor=\"#D5E8D4\"];\n", len(states)-1))
|
w.WriteString(fmt.Sprintf("%d [color=\"#82B366\",fillcolor=\"#D5E8D4\"];\n", len(states)-1))
|
||||||
}
|
}
|
||||||
|
@ -450,26 +452,48 @@ func (m *MetricMapper) InitFromFile(fileName string) error {
|
||||||
func (m *MetricMapper) GetMapping(statsdMetric string, statsdMetricType MetricType) (*MetricMapping, prometheus.Labels, bool) {
|
func (m *MetricMapper) GetMapping(statsdMetric string, statsdMetricType MetricType) (*MetricMapping, prometheus.Labels, bool) {
|
||||||
// glob matching
|
// glob matching
|
||||||
if root := m.FSM; root != nil {
|
if root := m.FSM; root != nil {
|
||||||
root = root.transitionsMap[string(statsdMetricType)]
|
root = root.transitions[string(statsdMetricType)]
|
||||||
matchFields := strings.Split(statsdMetric, ".")
|
matchFields := strings.Split(statsdMetric, ".")
|
||||||
captures := make(map[int]string, len(matchFields))
|
captures := make(map[int]string, len(matchFields))
|
||||||
captureIdx := 0
|
captureIdx := 0
|
||||||
|
var backtrackCursor *fsmBacktrackStackCursor
|
||||||
|
backtrackCursor = nil
|
||||||
filedsCount := len(matchFields)
|
filedsCount := len(matchFields)
|
||||||
for i, field := range matchFields {
|
i := 0
|
||||||
if root.transitionsMap == nil {
|
for {
|
||||||
|
for i < filedsCount {
|
||||||
|
if root.transitions == nil {
|
||||||
break
|
break
|
||||||
}
|
}
|
||||||
state, prs := root.transitionsMap[field]
|
field := matchFields[i]
|
||||||
|
state, prs := root.transitions[field]
|
||||||
fieldsLeft := filedsCount - i - 1
|
fieldsLeft := filedsCount - i - 1
|
||||||
|
// also compare length upfront to avoid unnecessary loop or backtrack
|
||||||
if !prs || fieldsLeft > state.maxRemainingLength || fieldsLeft < state.minRemainingLength {
|
if !prs || fieldsLeft > state.maxRemainingLength || fieldsLeft < state.minRemainingLength {
|
||||||
state, prs = root.transitionsMap["*"]
|
state, prs = root.transitions["*"]
|
||||||
if !prs || fieldsLeft > state.maxRemainingLength || fieldsLeft < state.minRemainingLength {
|
if !prs || fieldsLeft > state.maxRemainingLength || fieldsLeft < state.minRemainingLength {
|
||||||
break
|
break
|
||||||
}
|
} else {
|
||||||
captures[captureIdx] = field
|
captures[captureIdx] = field
|
||||||
captureIdx++
|
captureIdx++
|
||||||
}
|
}
|
||||||
if state.result != nil && i == filedsCount-1 {
|
} else if m.FSMNeedsBacktracking {
|
||||||
|
otherState, prs := root.transitions["*"]
|
||||||
|
if !prs || fieldsLeft > otherState.maxRemainingLength || fieldsLeft < otherState.minRemainingLength {
|
||||||
|
} else {
|
||||||
|
newCursor := fsmBacktrackStackCursor{prev: backtrackCursor, state: otherState,
|
||||||
|
fieldIndex: i + 1,
|
||||||
|
captureIdx: captureIdx + 1, currentCapture: field,
|
||||||
|
}
|
||||||
|
if backtrackCursor != nil {
|
||||||
|
backtrackCursor.next = &newCursor
|
||||||
|
}
|
||||||
|
backtrackCursor = &newCursor
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
||||||
|
// found!
|
||||||
|
if state != nil && state.result != nil && i == filedsCount-1 {
|
||||||
mapping := *state.result
|
mapping := *state.result
|
||||||
state.result.Name = formatTemplate(mapping.NameFormatter, captures)
|
state.result.Name = formatTemplate(mapping.NameFormatter, captures)
|
||||||
|
|
||||||
|
@ -480,11 +504,25 @@ func (m *MetricMapper) GetMapping(statsdMetric string, statsdMetricType MetricTy
|
||||||
return state.result, labels, true
|
return state.result, labels, true
|
||||||
}
|
}
|
||||||
root = state
|
root = state
|
||||||
|
i++
|
||||||
}
|
}
|
||||||
|
// if we are not doing backtracking or all path has been travesaled
|
||||||
|
if backtrackCursor == nil {
|
||||||
// if there's no regex match type, return immediately
|
// if there's no regex match type, return immediately
|
||||||
if !m.doRegex {
|
if !m.doRegex {
|
||||||
return nil, nil, false
|
return nil, nil, false
|
||||||
|
} else {
|
||||||
|
break
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
// pop one from stack
|
||||||
|
root = backtrackCursor.state
|
||||||
|
i = backtrackCursor.fieldIndex
|
||||||
|
captureIdx = backtrackCursor.captureIdx
|
||||||
|
// put the * capture back
|
||||||
|
captures[captureIdx-1] = backtrackCursor.currentCapture
|
||||||
|
backtrackCursor = backtrackCursor.prev
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -139,6 +139,56 @@ mappings:
|
||||||
},
|
},
|
||||||
},
|
},
|
||||||
},
|
},
|
||||||
|
//Config with backtracking
|
||||||
|
{
|
||||||
|
config: `
|
||||||
|
mappings:
|
||||||
|
- match: test.*.bbb
|
||||||
|
name: "testb"
|
||||||
|
labels:
|
||||||
|
label: "${1}_foo"
|
||||||
|
- match: test.justatest.aaa
|
||||||
|
name: "testa"
|
||||||
|
labels:
|
||||||
|
label: "${1}_foo"
|
||||||
|
`,
|
||||||
|
mappings: mappings{
|
||||||
|
"test.good.bbb": {
|
||||||
|
name: "testb",
|
||||||
|
labels: map[string]string{
|
||||||
|
"label": "good_foo",
|
||||||
|
},
|
||||||
|
},
|
||||||
|
"test.justatest.bbb": {
|
||||||
|
name: "testb",
|
||||||
|
labels: map[string]string{
|
||||||
|
"label": "justatest_foo",
|
||||||
|
},
|
||||||
|
},
|
||||||
|
},
|
||||||
|
},
|
||||||
|
//Config with super sets
|
||||||
|
{
|
||||||
|
config: `
|
||||||
|
mappings:
|
||||||
|
- match: test.*.bbb
|
||||||
|
name: "testb"
|
||||||
|
labels:
|
||||||
|
label: "${1}_foo"
|
||||||
|
- match: test.*.*
|
||||||
|
name: "testa"
|
||||||
|
labels:
|
||||||
|
label: "${1}_foo"
|
||||||
|
`,
|
||||||
|
mappings: mappings{
|
||||||
|
"test.good.bbb": {
|
||||||
|
name: "testb",
|
||||||
|
labels: map[string]string{
|
||||||
|
"label": "good_foo",
|
||||||
|
},
|
||||||
|
},
|
||||||
|
},
|
||||||
|
},
|
||||||
// Config with bad regex reference.
|
// Config with bad regex reference.
|
||||||
{
|
{
|
||||||
config: `---
|
config: `---
|
||||||
|
@ -471,31 +521,6 @@ mappings:
|
||||||
},
|
},
|
||||||
},
|
},
|
||||||
},
|
},
|
||||||
//Config with backtracking
|
|
||||||
{
|
|
||||||
config: `mappings:
|
|
||||||
- match: foo.*.ccc
|
|
||||||
name: "fooc"
|
|
||||||
labels: {}
|
|
||||||
- match: foo.bbb.aaa
|
|
||||||
name: "foob"
|
|
||||||
labels: {}
|
|
||||||
`,
|
|
||||||
mappings: mappings{
|
|
||||||
"foo.bbb.ccc": {
|
|
||||||
name: "fooc",
|
|
||||||
labels: map[string]string{},
|
|
||||||
},
|
|
||||||
"foo.ddd.ccc": {
|
|
||||||
name: "fooc",
|
|
||||||
labels: map[string]string{},
|
|
||||||
},
|
|
||||||
"foo.bbb.aaa": {
|
|
||||||
name: "foob",
|
|
||||||
labels: map[string]string{},
|
|
||||||
},
|
|
||||||
},
|
|
||||||
},
|
|
||||||
}
|
}
|
||||||
|
|
||||||
mapper := MetricMapper{}
|
mapper := MetricMapper{}
|
||||||
|
|
Loading…
Reference in a new issue