2024-06-03 22:59:25 +00:00
|
|
|
package logstorage
|
|
|
|
|
|
|
|
import (
|
|
|
|
"strconv"
|
|
|
|
"strings"
|
|
|
|
"sync"
|
|
|
|
"time"
|
|
|
|
|
|
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/bytesutil"
|
|
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/lib/fasttime"
|
|
|
|
)
|
|
|
|
|
|
|
|
func getSyslogParser(currentYear int) *syslogParser {
|
|
|
|
v := syslogParserPool.Get()
|
|
|
|
if v == nil {
|
|
|
|
v = &syslogParser{}
|
|
|
|
}
|
|
|
|
p := v.(*syslogParser)
|
|
|
|
p.currentYear = currentYear
|
|
|
|
return p
|
|
|
|
}
|
|
|
|
|
|
|
|
func putSyslogParser(p *syslogParser) {
|
|
|
|
p.reset()
|
|
|
|
syslogParserPool.Put(p)
|
|
|
|
}
|
|
|
|
|
|
|
|
var syslogParserPool sync.Pool
|
|
|
|
|
|
|
|
type syslogParser struct {
|
|
|
|
currentYear int
|
|
|
|
|
|
|
|
buf []byte
|
|
|
|
fields []Field
|
|
|
|
}
|
|
|
|
|
|
|
|
func (p *syslogParser) reset() {
|
|
|
|
p.currentYear = 0
|
|
|
|
p.resetFields()
|
|
|
|
}
|
|
|
|
|
|
|
|
func (p *syslogParser) resetFields() {
|
|
|
|
p.buf = p.buf[:0]
|
|
|
|
|
|
|
|
clear(p.fields)
|
|
|
|
p.fields = p.fields[:0]
|
|
|
|
}
|
|
|
|
|
|
|
|
func (p *syslogParser) addField(name, value string) {
|
|
|
|
p.fields = append(p.fields, Field{
|
|
|
|
Name: name,
|
|
|
|
Value: value,
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
func (p *syslogParser) parse(s string) {
|
|
|
|
p.resetFields()
|
|
|
|
|
|
|
|
if len(s) == 0 {
|
|
|
|
// Cannot parse syslog message
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
if s[0] != '<' {
|
|
|
|
p.parseNoHeader(s)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// parse priority
|
|
|
|
s = s[1:]
|
|
|
|
n := strings.IndexByte(s, '>')
|
|
|
|
if n < 0 {
|
|
|
|
// Cannot parse priority
|
|
|
|
return
|
|
|
|
}
|
|
|
|
priorityStr := s[:n]
|
|
|
|
s = s[n+1:]
|
|
|
|
|
|
|
|
p.addField("priority", priorityStr)
|
|
|
|
priority, ok := tryParseUint64(priorityStr)
|
|
|
|
if !ok {
|
|
|
|
// Cannot parse priority
|
|
|
|
return
|
|
|
|
}
|
|
|
|
facility := priority / 8
|
|
|
|
severity := priority % 8
|
|
|
|
|
|
|
|
bufLen := len(p.buf)
|
|
|
|
p.buf = marshalUint64String(p.buf, facility)
|
|
|
|
p.addField("facility", bytesutil.ToUnsafeString(p.buf[bufLen:]))
|
|
|
|
|
|
|
|
bufLen = len(p.buf)
|
|
|
|
p.buf = marshalUint64String(p.buf, severity)
|
|
|
|
p.addField("severity", bytesutil.ToUnsafeString(p.buf[bufLen:]))
|
|
|
|
|
|
|
|
p.parseNoHeader(s)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (p *syslogParser) parseNoHeader(s string) {
|
|
|
|
if len(s) == 0 {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
if strings.HasPrefix(s, "1 ") {
|
|
|
|
p.parseRFC5424(s[2:])
|
|
|
|
} else {
|
|
|
|
p.parseRFC3164(s)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (p *syslogParser) parseRFC5424(s string) {
|
|
|
|
// See https://datatracker.ietf.org/doc/html/rfc5424
|
|
|
|
|
2024-06-05 01:18:12 +00:00
|
|
|
p.addField("format", "rfc5424")
|
|
|
|
|
2024-06-03 22:59:25 +00:00
|
|
|
if len(s) == 0 {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// Parse timestamp
|
|
|
|
n := strings.IndexByte(s, ' ')
|
|
|
|
if n < 0 {
|
|
|
|
p.addField("timestamp", s)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
p.addField("timestamp", s[:n])
|
|
|
|
s = s[n+1:]
|
|
|
|
|
|
|
|
// Parse hostname
|
|
|
|
n = strings.IndexByte(s, ' ')
|
|
|
|
if n < 0 {
|
|
|
|
p.addField("hostname", s)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
p.addField("hostname", s[:n])
|
|
|
|
s = s[n+1:]
|
|
|
|
|
|
|
|
// Parse app-name
|
|
|
|
n = strings.IndexByte(s, ' ')
|
|
|
|
if n < 0 {
|
|
|
|
p.addField("app_name", s)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
p.addField("app_name", s[:n])
|
|
|
|
s = s[n+1:]
|
|
|
|
|
|
|
|
// Parse procid
|
|
|
|
n = strings.IndexByte(s, ' ')
|
|
|
|
if n < 0 {
|
|
|
|
p.addField("proc_id", s)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
p.addField("proc_id", s[:n])
|
|
|
|
s = s[n+1:]
|
|
|
|
|
|
|
|
// Parse msgID
|
|
|
|
n = strings.IndexByte(s, ' ')
|
|
|
|
if n < 0 {
|
|
|
|
p.addField("msg_id", s)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
p.addField("msg_id", s[:n])
|
|
|
|
s = s[n+1:]
|
|
|
|
|
|
|
|
// Parse structured data
|
|
|
|
tail, ok := p.parseRFC5424SD(s)
|
|
|
|
if !ok {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
s = tail
|
|
|
|
|
|
|
|
// Parse message
|
|
|
|
p.addField("message", s)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (p *syslogParser) parseRFC5424SD(s string) (string, bool) {
|
|
|
|
if strings.HasPrefix(s, "- ") {
|
|
|
|
return s[2:], true
|
|
|
|
}
|
|
|
|
|
|
|
|
for {
|
|
|
|
tail, ok := p.parseRFC5424SDLine(s)
|
|
|
|
if !ok {
|
|
|
|
return tail, false
|
|
|
|
}
|
|
|
|
s = tail
|
|
|
|
if strings.HasPrefix(s, " ") {
|
|
|
|
s = s[1:]
|
|
|
|
return s, true
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (p *syslogParser) parseRFC5424SDLine(s string) (string, bool) {
|
|
|
|
if len(s) == 0 || s[0] != '[' {
|
|
|
|
return s, false
|
|
|
|
}
|
|
|
|
s = s[1:]
|
|
|
|
|
|
|
|
n := strings.IndexAny(s, " ]")
|
|
|
|
if n < 0 {
|
|
|
|
return s, false
|
|
|
|
}
|
|
|
|
sdID := s[:n]
|
|
|
|
s = s[n:]
|
|
|
|
|
|
|
|
// Parse structured data
|
|
|
|
i := 0
|
|
|
|
for i < len(s) && s[i] != ']' {
|
|
|
|
// skip whitespace
|
|
|
|
if s[i] != ' ' {
|
|
|
|
return s, false
|
|
|
|
}
|
|
|
|
i++
|
|
|
|
|
|
|
|
// Parse name
|
|
|
|
n := strings.IndexByte(s[i:], '=')
|
|
|
|
if n < 0 {
|
|
|
|
return s, false
|
|
|
|
}
|
|
|
|
i += n + 1
|
|
|
|
|
|
|
|
// Parse value
|
|
|
|
qp, err := strconv.QuotedPrefix(s[i:])
|
|
|
|
if err != nil {
|
|
|
|
return s, false
|
|
|
|
}
|
|
|
|
i += len(qp)
|
|
|
|
}
|
|
|
|
if i == len(s) {
|
|
|
|
return s, false
|
|
|
|
}
|
|
|
|
|
|
|
|
sdValue := strings.TrimSpace(s[:i])
|
|
|
|
p.addField(sdID, sdValue)
|
|
|
|
s = s[i+1:]
|
|
|
|
return s, true
|
|
|
|
}
|
|
|
|
|
|
|
|
func (p *syslogParser) parseRFC3164(s string) {
|
|
|
|
// See https://datatracker.ietf.org/doc/html/rfc3164
|
|
|
|
|
2024-06-10 16:42:19 +00:00
|
|
|
p.addField("format", "rfc3164")
|
|
|
|
|
2024-06-03 22:59:25 +00:00
|
|
|
// Parse timestamp
|
|
|
|
n := len(time.Stamp)
|
|
|
|
if len(s) < n {
|
2024-06-10 16:42:19 +00:00
|
|
|
p.addField("message", s)
|
2024-06-03 22:59:25 +00:00
|
|
|
return
|
|
|
|
}
|
2024-06-05 01:18:12 +00:00
|
|
|
|
2024-06-03 22:59:25 +00:00
|
|
|
t, err := time.Parse(time.Stamp, s[:n])
|
|
|
|
if err != nil {
|
|
|
|
// TODO: fall back to parsing ISO8601 timestamp?
|
2024-06-10 16:42:19 +00:00
|
|
|
p.addField("message", s)
|
2024-06-03 22:59:25 +00:00
|
|
|
return
|
|
|
|
}
|
|
|
|
s = s[n:]
|
|
|
|
|
|
|
|
t = t.UTC()
|
|
|
|
t = time.Date(p.currentYear, t.Month(), t.Day(), t.Hour(), t.Minute(), t.Second(), t.Nanosecond(), time.UTC)
|
|
|
|
if uint64(t.Unix())-24*3600 > fasttime.UnixTimestamp() {
|
|
|
|
// Adjust time to the previous year
|
|
|
|
t = time.Date(t.Year()-1, t.Month(), t.Day(), t.Hour(), t.Minute(), t.Second(), t.Nanosecond(), time.UTC)
|
|
|
|
}
|
|
|
|
|
|
|
|
bufLen := len(p.buf)
|
|
|
|
p.buf = marshalTimestampISO8601String(p.buf, t.UnixNano())
|
|
|
|
p.addField("timestamp", bytesutil.ToUnsafeString(p.buf[bufLen:]))
|
|
|
|
|
|
|
|
if len(s) == 0 || s[0] != ' ' {
|
|
|
|
// Missing space after the time field
|
2024-06-10 16:42:19 +00:00
|
|
|
if len(s) > 0 {
|
|
|
|
p.addField("message", s)
|
|
|
|
}
|
2024-06-03 22:59:25 +00:00
|
|
|
return
|
|
|
|
}
|
|
|
|
s = s[1:]
|
|
|
|
|
|
|
|
// Parse hostname
|
|
|
|
n = strings.IndexByte(s, ' ')
|
|
|
|
if n < 0 {
|
|
|
|
p.addField("hostname", s)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
p.addField("hostname", s[:n])
|
|
|
|
s = s[n+1:]
|
|
|
|
|
|
|
|
// Parse tag (aka app_name)
|
|
|
|
n = strings.IndexAny(s, "[: ")
|
|
|
|
if n < 0 {
|
|
|
|
p.addField("app_name", s)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
p.addField("app_name", s[:n])
|
|
|
|
s = s[n:]
|
|
|
|
|
|
|
|
// Parse proc_id
|
|
|
|
if len(s) == 0 {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
if s[0] == '[' {
|
|
|
|
s = s[1:]
|
|
|
|
n = strings.IndexByte(s, ']')
|
|
|
|
if n < 0 {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
p.addField("proc_id", s[:n])
|
|
|
|
s = s[n+1:]
|
|
|
|
}
|
|
|
|
|
|
|
|
// Skip optional ': ' in front of message
|
|
|
|
s = strings.TrimPrefix(s, ":")
|
|
|
|
s = strings.TrimPrefix(s, " ")
|
|
|
|
|
|
|
|
if len(s) > 0 {
|
|
|
|
p.addField("message", s)
|
|
|
|
}
|
|
|
|
}
|