2019-05-22 21:16:55 +00:00
package influx
import (
2019-06-14 06:57:13 +00:00
"flag"
2019-05-22 21:16:55 +00:00
"fmt"
"io"
"net/http"
"runtime"
"sync"
"time"
"github.com/VictoriaMetrics/VictoriaMetrics/app/vminsert/common"
"github.com/VictoriaMetrics/VictoriaMetrics/app/vminsert/concurrencylimiter"
"github.com/VictoriaMetrics/VictoriaMetrics/lib/bytesutil"
2020-01-24 14:52:48 +00:00
"github.com/VictoriaMetrics/VictoriaMetrics/lib/protoparser/influx"
2019-05-22 21:16:55 +00:00
"github.com/VictoriaMetrics/VictoriaMetrics/lib/storage"
"github.com/VictoriaMetrics/metrics"
)
2019-06-14 06:57:13 +00:00
// Command-line flags controlling how Influx line protocol rows are mapped
// to metric names.
var (
	// measurementFieldSeparator is inserted between the measurement and the
	// field name when the metric name is built in InsertRows.
	measurementFieldSeparator = flag.String("influxMeasurementFieldSeparator", "_", "Separator for `{measurement}{separator}{field_name}` metric name when inserted via Influx line protocol")

	// skipSingleField makes InsertRows use the bare measurement as the metric
	// name for lines that contain exactly one field.
	skipSingleField = flag.Bool("influxSkipSingleField", false, "Uses `{measurement}` instead of `{measurement}{separator}{field_name}` for metric name if Influx line contains only a single field")
)
2019-07-27 10:20:47 +00:00
// Metrics describing the data points written by InsertRows.
//
// The names use the compact `name{label="value"}` form: whitespace around the
// name or inside the braces is not valid metric-name syntax.
var (
	// rowsInserted is increased by the number of fields written per InsertRows call.
	rowsInserted = metrics.NewCounter(`vm_rows_inserted_total{type="influx"}`)

	// rowsPerInsert is updated with the number of fields written per InsertRows call.
	rowsPerInsert = metrics.NewSummary(`vm_rows_per_insert{type="influx"}`)
)
2019-05-22 21:16:55 +00:00
// InsertHandler processes remote write for influx line protocol.
//
// See https://github.com/influxdata/influxdb/blob/4cbdc197b8117fee648d62e2e5be75c6575352f0/tsdb/README.md
func InsertHandler ( req * http . Request ) error {
return concurrencylimiter . Do ( func ( ) error {
return insertHandlerInternal ( req )
} )
}
func insertHandlerInternal ( req * http . Request ) error {
2019-12-09 14:40:10 +00:00
readCalls . Inc ( )
2019-05-22 21:16:55 +00:00
r := req . Body
if req . Header . Get ( "Content-Encoding" ) == "gzip" {
2019-08-22 09:27:18 +00:00
zr , err := common . GetGzipReader ( r )
2019-05-22 21:16:55 +00:00
if err != nil {
return fmt . Errorf ( "cannot read gzipped influx line protocol data: %s" , err )
}
2019-08-22 09:27:18 +00:00
defer common . PutGzipReader ( zr )
2019-05-22 21:16:55 +00:00
r = zr
}
q := req . URL . Query ( )
tsMultiplier := int64 ( 1e6 )
switch q . Get ( "precision" ) {
case "ns" :
tsMultiplier = 1e6
case "u" :
tsMultiplier = 1e3
case "ms" :
tsMultiplier = 1
case "s" :
tsMultiplier = - 1e3
case "m" :
tsMultiplier = - 1e3 * 60
case "h" :
tsMultiplier = - 1e3 * 3600
}
// Read db tag from https://docs.influxdata.com/influxdb/v1.7/tools/api/#write-http-endpoint
db := q . Get ( "db" )
ctx := getPushCtx ( )
defer putPushCtx ( ctx )
for ctx . Read ( r , tsMultiplier ) {
if err := ctx . InsertRows ( db ) ; err != nil {
return err
}
}
return ctx . Error ( )
}
func ( ctx * pushCtx ) InsertRows ( db string ) error {
rows := ctx . Rows . Rows
rowsLen := 0
for i := range rows {
2019-12-09 18:58:19 +00:00
rowsLen += len ( rows [ i ] . Fields )
2019-05-22 21:16:55 +00:00
}
ic := & ctx . Common
ic . Reset ( rowsLen )
2019-07-27 10:20:47 +00:00
rowsTotal := 0
2019-05-22 21:16:55 +00:00
for i := range rows {
r := & rows [ i ]
ic . Labels = ic . Labels [ : 0 ]
2019-08-24 10:51:51 +00:00
hasDBLabel := false
2019-05-22 21:16:55 +00:00
for j := range r . Tags {
tag := & r . Tags [ j ]
2019-08-24 10:51:51 +00:00
if tag . Key == "db" {
hasDBLabel = true
}
2019-05-22 21:16:55 +00:00
ic . AddLabel ( tag . Key , tag . Value )
}
2019-08-24 10:51:51 +00:00
if len ( db ) > 0 && ! hasDBLabel {
ic . AddLabel ( "db" , db )
}
2019-05-22 21:16:55 +00:00
ctx . metricNameBuf = storage . MarshalMetricNameRaw ( ctx . metricNameBuf [ : 0 ] , ic . Labels )
ctx . metricGroupBuf = append ( ctx . metricGroupBuf [ : 0 ] , r . Measurement ... )
2019-06-14 07:51:57 +00:00
skipFieldKey := len ( r . Fields ) == 1 && * skipSingleField
2019-11-30 19:54:34 +00:00
if len ( ctx . metricGroupBuf ) > 0 && ! skipFieldKey {
2019-06-14 07:51:57 +00:00
ctx . metricGroupBuf = append ( ctx . metricGroupBuf , * measurementFieldSeparator ... )
}
2019-05-22 21:16:55 +00:00
metricGroupPrefixLen := len ( ctx . metricGroupBuf )
for j := range r . Fields {
f := & r . Fields [ j ]
2019-06-14 07:51:57 +00:00
if ! skipFieldKey {
ctx . metricGroupBuf = append ( ctx . metricGroupBuf [ : metricGroupPrefixLen ] , f . Key ... )
}
2019-05-22 21:16:55 +00:00
metricGroup := bytesutil . ToUnsafeString ( ctx . metricGroupBuf )
ic . Labels = ic . Labels [ : 0 ]
ic . AddLabel ( "" , metricGroup )
ic . WriteDataPoint ( ctx . metricNameBuf , ic . Labels [ : 1 ] , r . Timestamp , f . Value )
}
2019-07-27 10:20:47 +00:00
rowsTotal += len ( r . Fields )
2019-05-22 21:16:55 +00:00
}
2019-07-27 10:20:47 +00:00
rowsInserted . Add ( rowsTotal )
rowsPerInsert . Update ( float64 ( rowsTotal ) )
2019-05-22 21:16:55 +00:00
return ic . FlushBufs ( )
}
func ( ctx * pushCtx ) Read ( r io . Reader , tsMultiplier int64 ) bool {
if ctx . err != nil {
return false
}
2019-05-28 14:31:35 +00:00
ctx . reqBuf , ctx . tailBuf , ctx . err = common . ReadLinesBlock ( r , ctx . reqBuf , ctx . tailBuf )
if ctx . err != nil {
if ctx . err != io . EOF {
2019-12-09 14:40:10 +00:00
readErrors . Inc ( )
2019-05-28 14:31:35 +00:00
ctx . err = fmt . Errorf ( "cannot read influx line protocol data: %s" , ctx . err )
}
2019-05-22 21:16:55 +00:00
return false
}
2019-08-24 08:40:21 +00:00
ctx . Rows . Unmarshal ( bytesutil . ToUnsafeString ( ctx . reqBuf ) )
2019-05-22 21:16:55 +00:00
// Adjust timestamps according to tsMultiplier
currentTs := time . Now ( ) . UnixNano ( ) / 1e6
if tsMultiplier >= 1 {
for i := range ctx . Rows . Rows {
row := & ctx . Rows . Rows [ i ]
if row . Timestamp == 0 {
row . Timestamp = currentTs
} else {
row . Timestamp /= tsMultiplier
}
}
} else if tsMultiplier < 0 {
tsMultiplier = - tsMultiplier
2019-08-01 21:24:06 +00:00
currentTs -= currentTs % tsMultiplier
2019-05-22 21:16:55 +00:00
for i := range ctx . Rows . Rows {
row := & ctx . Rows . Rows [ i ]
if row . Timestamp == 0 {
row . Timestamp = currentTs
} else {
row . Timestamp *= tsMultiplier
}
}
}
return true
}
var (
2019-12-09 14:40:10 +00:00
readCalls = metrics . NewCounter ( ` vm_read_calls_total { name="influx"} ` )
readErrors = metrics . NewCounter ( ` vm_read_errors_total { name="influx"} ` )
2019-05-22 21:16:55 +00:00
)
type pushCtx struct {
2020-01-24 14:52:48 +00:00
Rows influx . Rows
2019-05-22 21:16:55 +00:00
Common common . InsertCtx
2019-05-28 14:31:35 +00:00
reqBuf [ ] byte
2019-05-22 21:16:55 +00:00
tailBuf [ ] byte
metricNameBuf [ ] byte
metricGroupBuf [ ] byte
err error
}
// Error returns the error stored by Read.
//
// io.EOF is reported as nil, since it only marks the end of the input.
func (ctx *pushCtx) Error() error {
	if err := ctx.err; err != io.EOF {
		return err
	}
	return nil
}
func ( ctx * pushCtx ) reset ( ) {
ctx . Rows . Reset ( )
ctx . Common . Reset ( 0 )
2019-05-28 14:31:35 +00:00
ctx . reqBuf = ctx . reqBuf [ : 0 ]
2019-05-22 21:16:55 +00:00
ctx . tailBuf = ctx . tailBuf [ : 0 ]
ctx . metricNameBuf = ctx . metricNameBuf [ : 0 ]
ctx . metricGroupBuf = ctx . metricGroupBuf [ : 0 ]
ctx . err = nil
}
// getPushCtx returns a pushCtx for processing a request.
//
// It first tries pushCtxPoolCh without blocking, then pushCtxPool,
// and allocates a new pushCtx only when both are empty.
func getPushCtx() *pushCtx {
	select {
	case ctx := <-pushCtxPoolCh:
		return ctx
	default:
		// The channel is empty; fall back to the sync.Pool below.
	}

	v := pushCtxPool.Get()
	if v == nil {
		return &pushCtx{}
	}
	return v.(*pushCtx)
}
// putPushCtx resets ctx and returns it for reuse.
//
// ctx goes to pushCtxPoolCh if there is room in it; otherwise it is put
// into pushCtxPool. ctx must not be used after the call.
func putPushCtx(ctx *pushCtx) {
	ctx.reset()

	select {
	case pushCtxPoolCh <- ctx:
		return
	default:
		// The channel is full; fall back to the sync.Pool below.
	}
	pushCtxPool.Put(ctx)
}
// Storage for reusable pushCtx objects shared by getPushCtx and putPushCtx.
var (
	// pushCtxPool is used when pushCtxPoolCh is empty (on get) or full (on put).
	pushCtxPool sync.Pool

	// pushCtxPoolCh is tried first; its capacity equals the GOMAXPROCS value
	// at package initialization (a negative argument only queries the setting).
	pushCtxPoolCh = make(chan *pushCtx, runtime.GOMAXPROCS(-1))
)