summaryrefslogtreecommitdiffstats
path: root/src/go/collectors/go.d.plugin/pkg/logs/regexp.go
blob: e0dee1d022db5ef67b6301861bc1b0a89f6fba46 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
// SPDX-License-Identifier: GPL-3.0-or-later

package logs

import (
	"bufio"
	"errors"
	"fmt"
	"io"
	"regexp"
)

// RegExpConfig is the configuration of a RegExpParser.
type RegExpConfig struct {
	// Pattern is the regular expression source; it is read from the
	// "pattern" key in both YAML and JSON.
	Pattern string `yaml:"pattern" json:"pattern"`
}

// RegExpParser parses log lines by matching them against a compiled
// regular expression.
type RegExpParser struct {
	// r is the buffered reader lines are read from.
	r *bufio.Reader
	// pattern is the compiled expression applied to every line.
	pattern *regexp.Regexp
}

// NewRegExpParser creates a RegExpParser that reads from in and matches each
// line against config.Pattern.
//
// It returns an error when the pattern is empty, when it fails to compile, or
// when it contains no named capture groups. Parse assigns only the values of
// named groups, so a pattern made solely of unnamed groups could never
// populate a field.
func NewRegExpParser(config RegExpConfig, in io.Reader) (*RegExpParser, error) {
	if config.Pattern == "" {
		return nil, errors.New("empty pattern")
	}

	pattern, err := regexp.Compile(config.Pattern)
	if err != nil {
		return nil, fmt.Errorf("compile: %w", err)
	}

	// NumSubexp also counts unnamed groups, so look at the names themselves.
	// The entry for the whole match (index 0) is always the empty string.
	named := false
	for _, name := range pattern.SubexpNames() {
		if name != "" {
			named = true
			break
		}
	}
	if !named {
		return nil, errors.New("pattern has no named subgroups")
	}

	p := &RegExpParser{
		r:       bufio.NewReader(in),
		pattern: pattern,
	}
	return p, nil
}

// ReadLine reads the next '\n'-terminated chunk from the underlying reader,
// drops the trailing newline if there is one, and parses the result into line.
//
// A read error is returned only when no data was read. Data that arrives
// together with an error is still handed to Parse.
func (p *RegExpParser) ReadLine(line LogLine) error {
	data, readErr := p.r.ReadSlice('\n')
	size := len(data)
	if size == 0 && readErr != nil {
		return readErr
	}

	// Strip the delimiter so the pattern sees only the line content.
	if last := size - 1; last >= 0 && data[last] == '\n' {
		data = data[:last]
	}
	return p.Parse(data, line)
}

// Parse matches row against the parser's pattern and assigns the value of
// every named capture group to line.
//
// It returns a *ParseError when row does not match the pattern or when
// line.Assign rejects a value. Unnamed groups and groups with a nil submatch
// are skipped.
func (p *RegExpParser) Parse(row []byte, line LogLine) error {
	groups := p.pattern.FindSubmatch(row)
	if len(groups) == 0 {
		return &ParseError{msg: "regexp parse: unmatched line"}
	}

	names := p.pattern.SubexpNames()
	for idx, field := range names {
		if field == "" {
			// Whole-match entry or an unnamed group: nothing to assign to.
			continue
		}
		value := groups[idx]
		if value == nil {
			continue
		}
		if err := line.Assign(field, string(value)); err != nil {
			return &ParseError{msg: fmt.Sprintf("regexp parse: %v", err), err: err}
		}
	}
	return nil
}

// Info returns a short description of the parser: the "regexp: " prefix
// followed by the pattern formatted with %s.
func (p RegExpParser) Info() string {
	const format = "regexp: %s"
	return fmt.Sprintf(format, p.pattern)
}