Skip to content

Commit

Permalink
[exporterhelper] Add default batching for OTLP data type
Browse files Browse the repository at this point in the history
Make the exporter batching capability available to the regular exporter helper without requiring custom requests.
  • Loading branch information
dmitryax committed Mar 11, 2024
1 parent 2413346 commit d47257b
Show file tree
Hide file tree
Showing 5 changed files with 340 additions and 12 deletions.
17 changes: 10 additions & 7 deletions exporter/exporterhelper/batch_sender.go
Original file line number Diff line number Diff line change
Expand Up @@ -45,14 +45,17 @@ type batchSender struct {
}

// newBatchSender returns a new batch consumer component.
func newBatchSender(cfg exporterbatcher.Config, set exporter.CreateSettings) *batchSender {
func newBatchSender(cfg exporterbatcher.Config, set exporter.CreateSettings,
mf exporterbatcher.BatchMergeFunc[Request], msf exporterbatcher.BatchMergeSplitFunc[Request]) *batchSender {
bs := &batchSender{
activeBatch: newEmptyBatch(),
cfg: cfg,
logger: set.Logger,
shutdownCh: make(chan struct{}),
stopped: &atomic.Bool{},
resetTimerCh: make(chan struct{}),
activeBatch: newEmptyBatch(),
cfg: cfg,
logger: set.Logger,
mergeFunc: mf,
mergeSplitFunc: msf,
shutdownCh: make(chan struct{}),
stopped: &atomic.Bool{},
resetTimerCh: make(chan struct{}),
}
return bs
}
Expand Down
29 changes: 25 additions & 4 deletions exporter/exporterhelper/common.go
Original file line number Diff line number Diff line change
Expand Up @@ -148,13 +148,20 @@ func WithCapabilities(capabilities consumer.Capabilities) Option {
}

// BatcherOption applies changes to the batch sender.
type BatcherOption func(*batchSender)
type BatcherOption func(*batchSender) error

// WithRequestBatchFuncs sets the functions for merging and splitting batches for an exporter built for custom request types.
func WithRequestBatchFuncs(mf exporterbatcher.BatchMergeFunc[Request], msf exporterbatcher.BatchMergeSplitFunc[Request]) BatcherOption {
return func(bs *batchSender) {
return func(bs *batchSender) error {
if mf == nil || msf == nil {
return fmt.Errorf("WithRequestBatchFuncs must be provided with non-nil functions")
}

Check warning on line 158 in exporter/exporterhelper/common.go

View check run for this annotation

Codecov / codecov/patch

exporter/exporterhelper/common.go#L157-L158

Added lines #L157 - L158 were not covered by tests
if bs.mergeFunc != nil || bs.mergeSplitFunc != nil {
return fmt.Errorf("WithRequestBatchFuncs can be used only once with request-based exporters")
}

Check warning on line 161 in exporter/exporterhelper/common.go

View check run for this annotation

Codecov / codecov/patch

exporter/exporterhelper/common.go#L160-L161

Added lines #L160 - L161 were not covered by tests
bs.mergeFunc = mf
bs.mergeSplitFunc = msf
return nil
}
}

Expand All @@ -166,7 +173,7 @@ func WithRequestBatchFuncs(mf exporterbatcher.BatchMergeFunc[Request], msf expor
// until https://github.com/open-telemetry/opentelemetry-collector/issues/8122 is resolved.
func WithBatcher(cfg exporterbatcher.Config, opts ...BatcherOption) Option {
return func(o *baseExporter) error {
bs := newBatchSender(cfg, o.set)
bs := newBatchSender(cfg, o.set, o.batchMergeFunc, o.batchMergeSplitfunc)
for _, opt := range opts {
opt(bs)
}
Expand Down Expand Up @@ -196,14 +203,28 @@ func withUnmarshaler(unmarshaler exporterqueue.Unmarshaler[Request]) Option {
}
}

// withBatchFuncs is used to set the functions for merging and splitting batches for OTLP-based exporters.
// It must be provided as the first option when creating a new exporter helper.
func withBatchFuncs(mf exporterbatcher.BatchMergeFunc[Request], msf exporterbatcher.BatchMergeSplitFunc[Request]) Option {
	// The returned option only records the two callbacks on the base exporter; it never fails.
	apply := func(o *baseExporter) error {
		o.batchMergeFunc, o.batchMergeSplitfunc = mf, msf
		return nil
	}
	return apply
}

// baseExporter contains common fields between different exporter types.
type baseExporter struct {
component.StartFunc
component.ShutdownFunc

signal component.DataType

batchMergeFunc exporterbatcher.BatchMergeFunc[Request]
batchMergeSplitfunc exporterbatcher.BatchMergeSplitFunc[Request]

marshaler exporterqueue.Marshaler[Request]
unmarshaler exporterqueue.Unmarshaler[Request]
signal component.DataType

set exporter.CreateSettings
obsrep *ObsReport
Expand Down
7 changes: 6 additions & 1 deletion exporter/exporterhelper/logs.go
Original file line number Diff line number Diff line change
Expand Up @@ -26,6 +26,8 @@ type logsRequest struct {
pusher consumer.ConsumeLogsFunc
}

var _ Request = (*logsRequest)(nil)

func newLogsRequest(ld plog.Logs, pusher consumer.ConsumeLogsFunc) Request {
return &logsRequest{
ld: ld,
Expand Down Expand Up @@ -82,7 +84,10 @@ func NewLogsExporter(
if pusher == nil {
return nil, errNilPushLogsData
}
logsOpts := []Option{withMarshaler(logsRequestMarshaler), withUnmarshaler(newLogsRequestUnmarshalerFunc(pusher))}
logsOpts := []Option{
withMarshaler(logsRequestMarshaler), withUnmarshaler(newLogsRequestUnmarshalerFunc(pusher)),
withBatchFuncs(mergeLogs, mergeSplitLogs),
}
return NewLogsRequestExporter(ctx, set, requestFromLogs(pusher), append(logsOpts, options...)...)
}

Expand Down
135 changes: 135 additions & 0 deletions exporter/exporterhelper/logs_batch.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,135 @@
// Copyright The OpenTelemetry Authors
// SPDX-License-Identifier: Apache-2.0

package exporterhelper

import (
"context"
"errors"

"go.opentelemetry.io/collector/exporter/exporterbatcher"
"go.opentelemetry.io/collector/pdata/plog"
)

// mergeLogs folds the resource logs of r2 into r1 and returns r1.
// Both arguments must be *logsRequest values; anything else yields an error.
func mergeLogs(_ context.Context, r1 Request, r2 Request) (Request, error) {
	dst, dstOK := r1.(*logsRequest)
	src, srcOK := r2.(*logsRequest)
	if !(dstOK && srcOK) {
		return nil, errors.New("invalid input type")
	}

	// Move (not copy) everything held by the second request into the first one.
	srcResourceLogs := src.ld.ResourceLogs()
	srcResourceLogs.MoveAndAppendTo(dst.ld.ResourceLogs())
	return dst, nil
}

// mergeSplitLogs merges r1 and r2 and splits the result into requests that hold at most
// cfg.MaxSizeItems log records each.
//
// Either request may be nil, in which case it is skipped. Non-nil requests must be
// *logsRequest values, otherwise an error is returned. The inputs are consumed: their
// log records are moved into the returned requests.
//
// A non-positive cfg.MaxSizeItems is treated as "no size limit": all records are merged
// into a single request instead of being silently dropped.
func mergeSplitLogs(_ context.Context, cfg exporterbatcher.MaxSizeConfig, r1 Request, r2 Request) ([]Request, error) {
	var (
		res          []Request
		destReq      *logsRequest
		capacityLeft = cfg.MaxSizeItems
	)
	// With no limit there is nothing to split against; extracting with a zero budget
	// would yield nothing and lose the data.
	unlimited := cfg.MaxSizeItems <= 0

	for _, req := range []Request{r1, r2} {
		if req == nil {
			continue
		}
		srcReq, ok := req.(*logsRequest)
		if !ok {
			return nil, errors.New("invalid input type")
		}
		srcCount := srcReq.ld.LogRecordCount()

		// The current destination is already full (e.g. the previous request matched the
		// limit exactly). Flush it before placing more records, otherwise the extraction
		// below would run with a zero budget and the records would be lost.
		if !unlimited && destReq != nil && capacityLeft <= 0 && srcCount > 0 {
			res = append(res, destReq)
			destReq = nil
			capacityLeft = cfg.MaxSizeItems
		}

		// Fast path: the whole source request fits into the current destination.
		if unlimited || srcCount <= capacityLeft {
			if destReq == nil {
				destReq = srcReq
			} else {
				srcReq.ld.ResourceLogs().MoveAndAppendTo(destReq.ld.ResourceLogs())
			}
			capacityLeft = cfg.MaxSizeItems - destReq.ld.LogRecordCount()
			continue
		}

		// Slow path: carve the source request into chunks until it is drained.
		for {
			extractedLogs := extractLogs(srcReq.ld, capacityLeft)
			extractedCount := extractedLogs.LogRecordCount()
			if extractedCount == 0 {
				break
			}
			capacityLeft -= extractedCount
			if destReq == nil {
				destReq = &logsRequest{ld: extractedLogs, pusher: srcReq.pusher}
			} else {
				extractedLogs.ResourceLogs().MoveAndAppendTo(destReq.ld.ResourceLogs())
			}
			// Start a new batch once the capacity is used up. "<=" rather than "==" so
			// that an oversized extraction can never leave the budget stuck below zero.
			if capacityLeft <= 0 {
				res = append(res, destReq)
				destReq = nil
				capacityLeft = cfg.MaxSizeItems
			}
		}
	}

	// Emit the trailing, partially filled batch.
	if destReq != nil {
		res = append(res, destReq)
	}
	return res, nil
}

// extractLogs moves up to count log records out of srcLogs and returns them as a new plog.Logs.
// Resource logs that fit into the remaining budget are moved as a whole; the first one that
// does not fit is split via extractResourceLogs. srcLogs keeps whatever was not extracted.
func extractLogs(srcLogs plog.Logs, count int) plog.Logs {
	destLogs := plog.NewLogs()
	srcLogs.ResourceLogs().RemoveIf(func(srcRL plog.ResourceLogs) bool {
		// Budget exhausted: leave the remaining resource logs untouched.
		if count <= 0 {
			return false
		}
		rlCount := resourceLogsCount(srcRL)
		if rlCount <= count {
			count -= rlCount
			srcRL.MoveTo(destLogs.ResourceLogs().AppendEmpty())
			return true
		}
		extractedRL := extractResourceLogs(srcRL, count)
		extractedCount := resourceLogsCount(extractedRL)
		// Charge the partial extraction against the budget so that subsequent resource
		// logs are not extracted on top of it.
		count -= extractedCount
		if extractedCount > 0 {
			extractedRL.MoveTo(destLogs.ResourceLogs().AppendEmpty())
		}
		// Drop the source entry only if the extraction left no records behind.
		return resourceLogsCount(srcRL) == 0
	})
	return destLogs
}

// extractResourceLogs moves up to count log records out of srcRL and returns them in a new
// plog.ResourceLogs carrying a copy of srcRL's resource and schema URL. Scope logs that fit
// into the remaining budget are moved as a whole; the first one that does not fit is split
// via extractScopeLogs. srcRL keeps whatever was not extracted.
func extractResourceLogs(srcRL plog.ResourceLogs, count int) plog.ResourceLogs {
	destRL := plog.NewResourceLogs()
	srcRL.Resource().CopyTo(destRL.Resource())
	destRL.SetSchemaUrl(srcRL.SchemaUrl())
	srcRL.ScopeLogs().RemoveIf(func(srcSL plog.ScopeLogs) bool {
		// Budget exhausted: leave the remaining scope logs untouched.
		if count <= 0 {
			return false
		}
		slCount := srcSL.LogRecords().Len()
		if slCount <= count {
			count -= slCount
			srcSL.MoveTo(destRL.ScopeLogs().AppendEmpty())
			return true
		}
		extractedSL := extractScopeLogs(srcSL, count)
		extractedCount := extractedSL.LogRecords().Len()
		// Charge the partial extraction against the budget so that subsequent scope
		// logs are not extracted on top of it.
		count -= extractedCount
		if extractedCount > 0 {
			extractedSL.MoveTo(destRL.ScopeLogs().AppendEmpty())
		}
		// Drop the source entry only if the extraction left no records behind.
		return srcSL.LogRecords().Len() == 0
	})
	return destRL
}

// extractScopeLogs moves up to count log records out of srcSL and returns them in a new
// plog.ScopeLogs that carries a copy of srcSL's instrumentation scope and schema URL.
// srcSL keeps the records that were not extracted.
func extractScopeLogs(srcSL plog.ScopeLogs, count int) plog.ScopeLogs {
	destSL := plog.NewScopeLogs()
	destSL.SetSchemaUrl(srcSL.SchemaUrl())
	// Copy the scope as well; otherwise the extracted records would lose the scope
	// identity (name, version, attributes) they were emitted under.
	srcSL.Scope().CopyTo(destSL.Scope())
	srcSL.LogRecords().RemoveIf(func(srcLR plog.LogRecord) bool {
		// Once the budget is used up, keep the remaining records in the source.
		if count <= 0 {
			return false
		}
		srcLR.MoveTo(destSL.LogRecords().AppendEmpty())
		count--
		return true
	})
	return destSL
}

// resourceLogsCount returns the number of log records held by rl, summed over all of its scope logs.
func resourceLogsCount(rl plog.ResourceLogs) int {
	scopes := rl.ScopeLogs()
	total := 0
	for i, n := 0, scopes.Len(); i < n; i++ {
		total += scopes.At(i).LogRecords().Len()
	}
	return total
}
Loading

0 comments on commit d47257b

Please sign in to comment.