Skip to content

Commit

Permalink
[processor/redaction] add support for redacting metrics and logs attr…
Browse files Browse the repository at this point in the history
…ibutes (#34609)

**Description:** This PR extends the redaction processor to also support
the redaction of attributes within logs and metrics.

**Link to tracking Issue:** #34479 

**Testing:** Extended the existing unit tests to also cover the
redaction of logs and metrics

**Documentation:** Adapted the readme to reflect the changes

---------

Signed-off-by: Florian Bacher <[email protected]>
  • Loading branch information
bacherfl authored Aug 30, 2024
1 parent 0ec84e6 commit 184e954
Show file tree
Hide file tree
Showing 9 changed files with 582 additions and 145 deletions.
27 changes: 27 additions & 0 deletions .chloggen/redaction-add-metrics-and-logs.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,27 @@
# Use this changelog template to create an entry for release notes.

# One of 'breaking', 'deprecation', 'new_component', 'enhancement', 'bug_fix'
change_type: enhancement

# The name of the component, or a single word describing the area of concern, (e.g. filelogreceiver)
component: redactionprocessor

# A brief description of the change. Surround your text with quotes ("") if it needs to start with a backtick (`).
note: Add support for logs and metrics

# Mandatory: One or more tracking issues related to the change. You can use the PR number here if no issue exists.
issues: [34479]

# (Optional) One or more lines of additional information to render under the primary note.
# These lines will be padded with 2 spaces and then inserted directly into the document.
# Use pipe (|) for multiline entries.
subtext:

# If your change doesn't affect end users or the exported elements of any package,
# you should instead start your pull request title with [chore] or use the "Skip Changelog" label.
# Optional: The change log or logs in which this entry should be included.
# e.g. '[user]' or '[user, api]'
# Include 'user' if the change is relevant to end users.
# Include 'api' if there is a change to a library API.
# Default: '[user]'
change_logs: []
22 changes: 12 additions & 10 deletions processor/redactionprocessor/README.md
Original file line number Diff line number Diff line change
Expand Up @@ -3,19 +3,21 @@
<!-- status autogenerated section -->
| Status | |
| ------------- |-----------|
| Stability | [beta]: traces |
| Stability | [alpha]: logs, metrics |
| | [beta]: traces |
| Distributions | [contrib] |
| Issues | [![Open issues](https://img.shields.io/github/issues-search/open-telemetry/opentelemetry-collector-contrib?query=is%3Aissue%20is%3Aopen%20label%3Aprocessor%2Fredaction%20&label=open&color=orange&logo=opentelemetry)](https://github.com/open-telemetry/opentelemetry-collector-contrib/issues?q=is%3Aopen+is%3Aissue+label%3Aprocessor%2Fredaction) [![Closed issues](https://img.shields.io/github/issues-search/open-telemetry/opentelemetry-collector-contrib?query=is%3Aissue%20is%3Aclosed%20label%3Aprocessor%2Fredaction%20&label=closed&color=blue&logo=opentelemetry)](https://github.com/open-telemetry/opentelemetry-collector-contrib/issues?q=is%3Aclosed+is%3Aissue+label%3Aprocessor%2Fredaction) |
| [Code Owners](https://github.com/open-telemetry/opentelemetry-collector-contrib/blob/main/CONTRIBUTING.md#becoming-a-code-owner) | [@dmitryax](https://www.github.com/dmitryax), [@mx-psi](https://www.github.com/mx-psi), [@TylerHelmuth](https://www.github.com/TylerHelmuth) |
| Emeritus | [@leonsp-ai](https://www.github.com/leonsp-ai) |

[alpha]: https://github.com/open-telemetry/opentelemetry-collector#alpha
[beta]: https://github.com/open-telemetry/opentelemetry-collector#beta
[contrib]: https://github.com/open-telemetry/opentelemetry-collector-releases/tree/main/distributions/otelcol-contrib
<!-- end autogenerated section -->

This processor deletes span attributes that don't match a list of allowed span
attributes. It also masks span attribute values that match a blocked value
list. Span attributes that aren't on the allowed list are removed before any
This processor deletes span, log, and metric datapoint attributes that don't match a list of allowed
attributes. It also masks attribute values that match a blocked value
list. Attributes that aren't on the allowed list are removed before any
value checks are done.

## Use Cases
Expand Down Expand Up @@ -57,9 +59,9 @@ processors:
# allowed_keys list. The list of blocked_values is applied regardless. If
# you just want to block values, set this to true.
allow_all_keys: false
# allowed_keys is a list of span attribute keys that are kept on the span and
# allowed_keys is a list of span/log/datapoint attribute keys that are kept on the span/log/datapoint and
# processed. The list is designed to fail closed. If allowed_keys is empty,
# no span attributes are allowed and all span attributes are removed. To
# no attributes are allowed and all span attributes are removed. To
# allow all keys, set allow_all_keys to true.
allowed_keys:
- description
Expand All @@ -76,7 +78,7 @@ processors:
- "4[0-9]{12}(?:[0-9]{3})?" ## Visa credit card number
- "(5[1-5][0-9]{14})" ## MasterCard number
# summary controls the verbosity level of the diagnostic attributes that
# the processor adds to the spans when it redacts or masks other
# the processor adds to the spans/logs/datapoints when it redacts or masks other
# attributes. In some contexts a list of redacted attributes leaks
# information, while it is valuable when integrating and testing a new
# configuration. Possible values:
Expand All @@ -93,16 +95,16 @@ Ignored attributes are processed first so they're always allowed and never
blocked. This field should only be used where you know the data is always
safe to send to the telemetry system.
Only span attributes included on the list of allowed keys list are retained.
If `allowed_keys` is empty, then no span attributes are allowed. All span
Only span/log/datapoint attributes included on the list of allowed keys list are retained.
If `allowed_keys` is empty, then no attributes are allowed. All
attributes are removed in that case. To keep all span attributes, you should
explicitly set `allow_all_keys` to true.

`blocked_values` applies to the values of the allowed keys. If the value of an
allowed key matches the regular expression for a blocked value, the matching
part of the value is then masked with a fixed length of asterisks.

For example, if `notes` is on the list of allowed keys, then the `notes` span
For example, if `notes` is on the list of allowed keys, then the `notes`
attribute is retained. However, if there is a value such as a credit card
number in the `notes` field that matched a regular expression on the list of
blocked values, then that value is masked.
46 changes: 46 additions & 0 deletions processor/redactionprocessor/factory.go
Original file line number Diff line number Diff line change
Expand Up @@ -23,6 +23,8 @@ func NewFactory() processor.Factory {
metadata.Type,
createDefaultConfig,
processor.WithTraces(createTracesProcessor, metadata.TracesStability),
processor.WithLogs(createLogsProcessor, metadata.LogsStability),
processor.WithMetrics(createMetricsProcessor, metadata.MetricsStability),
)
}

Expand Down Expand Up @@ -53,3 +55,47 @@ func createTracesProcessor(
redaction.processTraces,
processorhelper.WithCapabilities(consumer.Capabilities{MutatesData: true}))
}

// createLogsProcessor creates an instance of redaction for processing logs
func createLogsProcessor(
ctx context.Context,
set processor.Settings,
cfg component.Config,
next consumer.Logs) (processor.Logs, error) {
oCfg := cfg.(*Config)

red, err := newRedaction(ctx, oCfg, set.Logger)
if err != nil {
return nil, fmt.Errorf("error creating a redaction processor: %w", err)
}

return processorhelper.NewLogsProcessor(
ctx,
set,
cfg,
next,
red.processLogs,
processorhelper.WithCapabilities(consumer.Capabilities{MutatesData: true}))
}

// createMetricsProcessor creates an instance of redaction for processing metrics
func createMetricsProcessor(
ctx context.Context,
set processor.Settings,
cfg component.Config,
next consumer.Metrics) (processor.Metrics, error) {
oCfg := cfg.(*Config)

red, err := newRedaction(ctx, oCfg, set.Logger)
if err != nil {
return nil, fmt.Errorf("error creating a redaction processor: %w", err)
}

return processorhelper.NewMetricsProcessor(
ctx,
set,
cfg,
next,
red.processMetrics,
processorhelper.WithCapabilities(consumer.Capabilities{MutatesData: true}))
}
18 changes: 18 additions & 0 deletions processor/redactionprocessor/factory_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -26,3 +26,21 @@ func TestCreateTestProcessor(t *testing.T) {
assert.NotNil(t, tp)
assert.True(t, tp.Capabilities().MutatesData)
}

func TestCreateTestLogsProcessor(t *testing.T) {
cfg := &Config{}

tp, err := createLogsProcessor(context.Background(), processortest.NewNopSettings(), cfg, consumertest.NewNop())
assert.NoError(t, err)
assert.NotNil(t, tp)
assert.Equal(t, true, tp.Capabilities().MutatesData)
}

func TestCreateTestMetricsProcessor(t *testing.T) {
cfg := &Config{}

tp, err := createMetricsProcessor(context.Background(), processortest.NewNopSettings(), cfg, consumertest.NewNop())
assert.NoError(t, err)
assert.NotNil(t, tp)
assert.Equal(t, true, tp.Capabilities().MutatesData)
}
14 changes: 14 additions & 0 deletions processor/redactionprocessor/generated_component_test.go

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

1 change: 1 addition & 0 deletions processor/redactionprocessor/metadata.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@ status:
class: processor
stability:
beta: [traces]
alpha: [logs,metrics]
distributions: [contrib]
codeowners:
active: [dmitryax, mx-psi, TylerHelmuth]
Expand Down
75 changes: 75 additions & 0 deletions processor/redactionprocessor/processor.go
Original file line number Diff line number Diff line change
Expand Up @@ -11,6 +11,8 @@ import (
"strings"

"go.opentelemetry.io/collector/pdata/pcommon"
"go.opentelemetry.io/collector/pdata/plog"
"go.opentelemetry.io/collector/pdata/pmetric"
"go.opentelemetry.io/collector/pdata/ptrace"
"go.uber.org/zap"
)
Expand Down Expand Up @@ -59,6 +61,22 @@ func (s *redaction) processTraces(ctx context.Context, batch ptrace.Traces) (ptr
return batch, nil
}

func (s *redaction) processLogs(ctx context.Context, logs plog.Logs) (plog.Logs, error) {
for i := 0; i < logs.ResourceLogs().Len(); i++ {
rl := logs.ResourceLogs().At(i)
s.processResourceLog(ctx, rl)
}
return logs, nil
}

func (s *redaction) processMetrics(ctx context.Context, metrics pmetric.Metrics) (pmetric.Metrics, error) {
for i := 0; i < metrics.ResourceMetrics().Len(); i++ {
rm := metrics.ResourceMetrics().At(i)
s.processResourceMetric(ctx, rm)
}
return metrics, nil
}

// processResourceSpan processes the RS and all of its spans and then returns the last
// view metric context. The context can be used for tests
func (s *redaction) processResourceSpan(ctx context.Context, rs ptrace.ResourceSpans) {
Expand All @@ -79,6 +97,63 @@ func (s *redaction) processResourceSpan(ctx context.Context, rs ptrace.ResourceS
}
}

// processResourceLog processes the log resource and all of its logs and then returns the last
// view metric context. The context can be used for tests
func (s *redaction) processResourceLog(ctx context.Context, rl plog.ResourceLogs) {
rsAttrs := rl.Resource().Attributes()

s.processAttrs(ctx, rsAttrs)

for j := 0; j < rl.ScopeLogs().Len(); j++ {
ils := rl.ScopeLogs().At(j)
for k := 0; k < rl.ScopeLogs().Len(); k++ {
log := ils.LogRecords().At(k)
s.processAttrs(ctx, log.Attributes())
}
}
}

func (s *redaction) processResourceMetric(ctx context.Context, rm pmetric.ResourceMetrics) {
rsAttrs := rm.Resource().Attributes()

s.processAttrs(ctx, rsAttrs)

for j := 0; j < rm.ScopeMetrics().Len(); j++ {
ils := rm.ScopeMetrics().At(j)
for k := 0; k < ils.Metrics().Len(); k++ {
metric := ils.Metrics().At(k)
switch metric.Type() {
case pmetric.MetricTypeGauge:
dps := metric.Gauge().DataPoints()
for i := 0; i < dps.Len(); i++ {
s.processAttrs(ctx, dps.At(i).Attributes())
}
case pmetric.MetricTypeSum:
dps := metric.Sum().DataPoints()
for i := 0; i < dps.Len(); i++ {
s.processAttrs(ctx, dps.At(i).Attributes())
}
case pmetric.MetricTypeHistogram:
dps := metric.Histogram().DataPoints()
for i := 0; i < dps.Len(); i++ {
s.processAttrs(ctx, dps.At(i).Attributes())
}
case pmetric.MetricTypeExponentialHistogram:
dps := metric.ExponentialHistogram().DataPoints()
for i := 0; i < dps.Len(); i++ {
s.processAttrs(ctx, dps.At(i).Attributes())
}
case pmetric.MetricTypeSummary:
dps := metric.Summary().DataPoints()
for i := 0; i < dps.Len(); i++ {
s.processAttrs(ctx, dps.At(i).Attributes())
}
case pmetric.MetricTypeEmpty:
}
}
}
}

// processAttrs redacts the attributes of a resource span or a span
func (s *redaction) processAttrs(_ context.Context, attributes pcommon.Map) {
// TODO: Use the context for recording metrics
Expand Down
Loading

0 comments on commit 184e954

Please sign in to comment.