app/vminsert/opentsdbhttp: skip invalid rows and continue parsing the remaining rows

Invalid rows are logged and counted in the `vm_rows_invalid_total{type="opentsdb-http"}` metric.
This commit is contained in:
Aliaksandr Valialkin 2019-08-24 13:05:20 +03:00
parent 38b9615c53
commit a283023d16
4 changed files with 31 additions and 33 deletions

View file

@ -4,6 +4,8 @@ import (
"fmt" "fmt"
"github.com/VictoriaMetrics/VictoriaMetrics/lib/bytesutil" "github.com/VictoriaMetrics/VictoriaMetrics/lib/bytesutil"
"github.com/VictoriaMetrics/VictoriaMetrics/lib/logger"
"github.com/VictoriaMetrics/metrics"
"github.com/valyala/fastjson" "github.com/valyala/fastjson"
"github.com/valyala/fastjson/fastfloat" "github.com/valyala/fastjson/fastfloat"
) )
@ -34,10 +36,8 @@ func (rs *Rows) Reset() {
// See http://opentsdb.net/docs/build/html/api_http/put.html // See http://opentsdb.net/docs/build/html/api_http/put.html
// //
// s must be unchanged until rs is in use. // s must be unchanged until rs is in use.
func (rs *Rows) Unmarshal(av *fastjson.Value) error { func (rs *Rows) Unmarshal(av *fastjson.Value) {
var err error rs.Rows, rs.tagsPool = unmarshalRows(rs.Rows[:0], av, rs.tagsPool[:0])
rs.Rows, rs.tagsPool, err = unmarshalRows(rs.Rows[:0], av, rs.tagsPool[:0])
return err
} }
// Row is a single OpenTSDB row. // Row is a single OpenTSDB row.
@ -122,26 +122,24 @@ func getFloat64(v *fastjson.Value) (float64, error) {
} }
} }
func unmarshalRows(dst []Row, av *fastjson.Value, tagsPool []Tag) ([]Row, []Tag, error) { func unmarshalRows(dst []Row, av *fastjson.Value, tagsPool []Tag) ([]Row, []Tag) {
switch av.Type() { switch av.Type() {
case fastjson.TypeObject: case fastjson.TypeObject:
return unmarshalRow(dst, av, tagsPool) return unmarshalRow(dst, av, tagsPool)
case fastjson.TypeArray: case fastjson.TypeArray:
a, _ := av.Array() a, _ := av.Array()
for i, o := range a { for _, o := range a {
var err error dst, tagsPool = unmarshalRow(dst, o, tagsPool)
dst, tagsPool, err = unmarshalRow(dst, o, tagsPool)
if err != nil {
return dst, tagsPool, fmt.Errorf("cannot unmarshal %d object out of %d objects: %s", i, len(a), err)
} }
} return dst, tagsPool
return dst, tagsPool, nil
default: default:
return dst, tagsPool, fmt.Errorf("OpenTSDB body must be either object or array; got %s; body=%s", av.Type(), av) logger.Errorf("OpenTSDB JSON must be either object or array; got %s; body=%s", av.Type(), av)
invalidLines.Inc()
return dst, tagsPool
} }
} }
func unmarshalRow(dst []Row, o *fastjson.Value, tagsPool []Tag) ([]Row, []Tag, error) { func unmarshalRow(dst []Row, o *fastjson.Value, tagsPool []Tag) ([]Row, []Tag) {
if cap(dst) > len(dst) { if cap(dst) > len(dst) {
dst = dst[:len(dst)+1] dst = dst[:len(dst)+1]
} else { } else {
@ -151,11 +149,15 @@ func unmarshalRow(dst []Row, o *fastjson.Value, tagsPool []Tag) ([]Row, []Tag, e
var err error var err error
tagsPool, err = r.unmarshal(o, tagsPool) tagsPool, err = r.unmarshal(o, tagsPool)
if err != nil { if err != nil {
return dst, tagsPool, fmt.Errorf("cannot unmarshal OpenTSDB object %s: %s", o, err) dst = dst[:len(dst)-1]
logger.Errorf("cannot unmarshal OpenTSDB object %s: %s", o, err)
invalidLines.Inc()
} }
return dst, tagsPool, nil return dst, tagsPool
} }
var invalidLines = metrics.NewCounter(`vm_rows_invalid_total{type="opentsdb-http"}`)
func unmarshalTags(dst []Tag, o *fastjson.Object) ([]Tag, error) { func unmarshalTags(dst []Tag, o *fastjson.Object) ([]Tag, error) {
var err error var err error
o.Visit(func(k []byte, v *fastjson.Value) { o.Visit(func(k []byte, v *fastjson.Value) {

View file

@ -17,12 +17,14 @@ func TestRowsUnmarshalFailure(t *testing.T) {
return return
} }
// Verify OpenTSDB body parsing error // Verify OpenTSDB body parsing error
if err := rows.Unmarshal(v); err == nil { rows.Unmarshal(v)
t.Fatalf("expecting non-nil error when parsing %q", s) if len(rows.Rows) != 0 {
t.Fatalf("unexpected number of rows parsed; got %d; want 0", len(rows.Rows))
} }
// Try again // Try again
if err := rows.Unmarshal(v); err == nil { rows.Unmarshal(v)
t.Fatalf("expecting non-nil error when parsing %q", s) if len(rows.Rows) != 0 {
t.Fatalf("unexpected number of rows parsed; got %d; want 0", len(rows.Rows))
} }
} }
@ -73,7 +75,7 @@ func TestRowsUnmarshalFailure(t *testing.T) {
f(`{"metric": "aaa", "timestamp": 1122, "value": 0.45, "tags": {"foo": 1}}`) f(`{"metric": "aaa", "timestamp": 1122, "value": 0.45, "tags": {"foo": 1}}`)
// Invalid multiline // Invalid multiline
f(`[{"metric": "aaa", "timestamp": 1122, "value": "trt", "tags":{"foo":"bar"}}, {"metric": "aaa", "timestamp": 1122, "value": 111}]`) f(`[{"metric": "aaa", "timestamp": 1122, "value": "trt", "tags":{"foo":"bar"}}, {"metric": "aaa", "timestamp": [1122], "value": 111}]`)
} }
func TestRowsUnmarshalSuccess(t *testing.T) { func TestRowsUnmarshalSuccess(t *testing.T) {
@ -87,17 +89,13 @@ func TestRowsUnmarshalSuccess(t *testing.T) {
if err != nil { if err != nil {
t.Fatalf("cannot parse json %s: %s", s, err) t.Fatalf("cannot parse json %s: %s", s, err)
} }
if err := rows.Unmarshal(v); err != nil { rows.Unmarshal(v)
t.Fatalf("cannot unmarshal %s: %s", v, err)
}
if !reflect.DeepEqual(rows.Rows, rowsExpected.Rows) { if !reflect.DeepEqual(rows.Rows, rowsExpected.Rows) {
t.Fatalf("unexpected rows;\ngot\n%+v;\nwant\n%+v", rows.Rows, rowsExpected.Rows) t.Fatalf("unexpected rows;\ngot\n%+v;\nwant\n%+v", rows.Rows, rowsExpected.Rows)
} }
// Try unmarshaling again // Try unmarshaling again
if err := rows.Unmarshal(v); err != nil { rows.Unmarshal(v)
t.Fatalf("cannot unmarshal %s: %s", v, err)
}
if !reflect.DeepEqual(rows.Rows, rowsExpected.Rows) { if !reflect.DeepEqual(rows.Rows, rowsExpected.Rows) {
t.Fatalf("unexpected rows;\ngot\n%+v;\nwant\n%+v", rows.Rows, rowsExpected.Rows) t.Fatalf("unexpected rows;\ngot\n%+v;\nwant\n%+v", rows.Rows, rowsExpected.Rows)
} }

View file

@ -24,8 +24,9 @@ func BenchmarkRowsUnmarshal(b *testing.B) {
if err != nil { if err != nil {
panic(fmt.Errorf("cannot parse %q: %s", s, err)) panic(fmt.Errorf("cannot parse %q: %s", s, err))
} }
if err := rows.Unmarshal(v); err != nil { rows.Unmarshal(v)
panic(fmt.Errorf("cannot unmarshal %q: %s", s, err)) if len(rows.Rows) != 4 {
panic(fmt.Errorf("unexpected number of rows unmarshaled; got %d; want 4", len(rows.Rows)))
} }
} }
}) })

View file

@ -72,10 +72,7 @@ func insertHandlerInternal(at *auth.Token, req *http.Request, maxSize int64) err
opentsdbUnmarshalErrors.Inc() opentsdbUnmarshalErrors.Inc()
return fmt.Errorf("cannot parse HTTP OpenTSDB json: %s", err) return fmt.Errorf("cannot parse HTTP OpenTSDB json: %s", err)
} }
if err := ctx.Rows.Unmarshal(v); err != nil { ctx.Rows.Unmarshal(v)
opentsdbUnmarshalErrors.Inc()
return fmt.Errorf("cannot unmarshal HTTP OpenTSDB json %s, %s", err, v)
}
// Fill in missing timestamps // Fill in missing timestamps
currentTimestamp := time.Now().Unix() currentTimestamp := time.Now().Unix()