mirror of
https://github.com/VictoriaMetrics/VictoriaMetrics.git
synced 2025-01-20 15:16:42 +00:00
25e54d2b50
add progress bars to the VM importer The new progress bars supposed to display the processing speed per each VM importer worker. This info should help to identify if there is a bottleneck on the VM side during the import process, without waiting for its finish. The new progress bars can be disabled by passing `vm-disable-progress-bar` flag. Plotting multiple progress bars requires using experimental progress bar pool from github.com/cheggaaa/pb/v3. Switch to progress bar pool required changes in all import modes. The openTSDB mode wasn't changed due to its implementation, which implies individual progress bars per each series. Because of this, using the pool wasn't possible. Signed-off-by: dmitryk-dk <kozlovdmitriyy@gmail.com> Co-authored-by: hagen1778 <roman@victoriametrics.com>
152 lines
3.1 KiB
Go
152 lines
3.1 KiB
Go
package main
|
|
|
|
import (
|
|
"fmt"
|
|
"io"
|
|
"log"
|
|
"sync"
|
|
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/app/vmctl/barpool"
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/app/vmctl/influx"
|
|
"github.com/VictoriaMetrics/VictoriaMetrics/app/vmctl/vm"
|
|
)
|
|
|
|
type influxProcessor struct {
|
|
ic *influx.Client
|
|
im *vm.Importer
|
|
cc int
|
|
separator string
|
|
}
|
|
|
|
func newInfluxProcessor(ic *influx.Client, im *vm.Importer, cc int, separator string) *influxProcessor {
|
|
if cc < 1 {
|
|
cc = 1
|
|
}
|
|
return &influxProcessor{
|
|
ic: ic,
|
|
im: im,
|
|
cc: cc,
|
|
separator: separator,
|
|
}
|
|
}
|
|
|
|
func (ip *influxProcessor) run(silent, verbose bool) error {
|
|
series, err := ip.ic.Explore()
|
|
if err != nil {
|
|
return fmt.Errorf("explore query failed: %s", err)
|
|
}
|
|
if len(series) < 1 {
|
|
return fmt.Errorf("found no timeseries to import")
|
|
}
|
|
|
|
question := fmt.Sprintf("Found %d timeseries to import. Continue?", len(series))
|
|
if !silent && !prompt(question) {
|
|
return nil
|
|
}
|
|
|
|
bar := barpool.AddWithTemplate(fmt.Sprintf(barTpl, "Processing series"), len(series))
|
|
if err := barpool.Start(); err != nil {
|
|
return err
|
|
}
|
|
|
|
seriesCh := make(chan *influx.Series)
|
|
errCh := make(chan error)
|
|
ip.im.ResetStats()
|
|
|
|
var wg sync.WaitGroup
|
|
wg.Add(ip.cc)
|
|
for i := 0; i < ip.cc; i++ {
|
|
go func() {
|
|
defer wg.Done()
|
|
for s := range seriesCh {
|
|
if err := ip.do(s); err != nil {
|
|
errCh <- fmt.Errorf("request failed for %q.%q: %s", s.Measurement, s.Field, err)
|
|
return
|
|
}
|
|
bar.Increment()
|
|
}
|
|
}()
|
|
}
|
|
|
|
// any error breaks the import
|
|
for _, s := range series {
|
|
select {
|
|
case infErr := <-errCh:
|
|
return fmt.Errorf("influx error: %s", infErr)
|
|
case vmErr := <-ip.im.Errors():
|
|
return fmt.Errorf("import process failed: %s", wrapErr(vmErr, verbose))
|
|
case seriesCh <- s:
|
|
}
|
|
}
|
|
|
|
close(seriesCh)
|
|
wg.Wait()
|
|
ip.im.Close()
|
|
// drain import errors channel
|
|
for vmErr := range ip.im.Errors() {
|
|
if vmErr.Err != nil {
|
|
return fmt.Errorf("import process failed: %s", wrapErr(vmErr, verbose))
|
|
}
|
|
}
|
|
barpool.Stop()
|
|
log.Println("Import finished!")
|
|
log.Print(ip.im.Stats())
|
|
return nil
|
|
}
|
|
|
|
const dbLabel = "db"
|
|
|
|
func (ip *influxProcessor) do(s *influx.Series) error {
|
|
cr, err := ip.ic.FetchDataPoints(s)
|
|
if err != nil {
|
|
return fmt.Errorf("failed to fetch datapoints: %s", err)
|
|
}
|
|
defer func() {
|
|
_ = cr.Close()
|
|
}()
|
|
var name string
|
|
if s.Measurement != "" {
|
|
name = fmt.Sprintf("%s%s%s", s.Measurement, ip.separator, s.Field)
|
|
} else {
|
|
name = s.Field
|
|
}
|
|
|
|
labels := make([]vm.LabelPair, len(s.LabelPairs))
|
|
var containsDBLabel bool
|
|
for i, lp := range s.LabelPairs {
|
|
if lp.Name == dbLabel {
|
|
containsDBLabel = true
|
|
break
|
|
}
|
|
labels[i] = vm.LabelPair{
|
|
Name: lp.Name,
|
|
Value: lp.Value,
|
|
}
|
|
}
|
|
if !containsDBLabel {
|
|
labels = append(labels, vm.LabelPair{
|
|
Name: dbLabel,
|
|
Value: ip.ic.Database(),
|
|
})
|
|
}
|
|
|
|
for {
|
|
time, values, err := cr.Next()
|
|
if err != nil {
|
|
if err == io.EOF {
|
|
return nil
|
|
}
|
|
return err
|
|
}
|
|
// skip empty results
|
|
if len(time) < 1 {
|
|
continue
|
|
}
|
|
ip.im.Input() <- &vm.TimeSeries{
|
|
Name: name,
|
|
LabelPairs: labels,
|
|
Timestamps: time,
|
|
Values: values,
|
|
}
|
|
}
|
|
}
|