foundationdb/flow/Tracing.h
Ray Jenkins c45abc7c32
Add TRACING_SPAN_ATTRIBUTES_ENABLED Knob, default false. (#7354)
* Add TRACING_SPAN_ATTRIBUTES_ENABLED Knob, default false.

In order to prevent accidental leakage of PII to external tracing collector services,
we've added a knob to prevent additional attributes to be added to spans unless explicitly
enabled by the user.

* Enable span attributes knob for unit tests.
2022-06-13 11:37:09 -05:00

286 lines
11 KiB
C++

/*
* Tracing.h
*
* This source file is part of the FoundationDB open source project
*
* Copyright 2013-2022 Apple Inc. and the FoundationDB project authors
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#pragma once
#include "fdbclient/FDBTypes.h"
#include "fdbrpc/FlowTransport.h"
#include "flow/IRandom.h"
#include <unordered_set>
#include <atomic>
// A named location used to label a Span (every Span stores one in its `location` member).
struct Location {
// Name of the location; the `_loc` literal operator builds it from a string literal.
StringRef name;
};
// User-defined literal that wraps a string literal in a Location, e.g. "someName"_loc.
// The StringRef is constructed from the literal's pointer and length.
inline Location operator"" _loc(const char* str, size_t size) {
    const uint8_t* bytes = reinterpret_cast<const uint8_t*>(str);
    return Location{ StringRef(bytes, size) };
}
// Flags carried by a SpanContext. Only the lowest bit is defined: when set, the span is sampled.
enum class TraceFlags : uint8_t {
    unsampled = 0b00000000,
    sampled = 0b00000001,
};

// Bitwise AND of two TraceFlags values, computed on the enum's underlying integer type.
inline TraceFlags operator&(TraceFlags lhs, TraceFlags rhs) {
    using Bits = std::underlying_type_t<TraceFlags>;
    const Bits left = static_cast<Bits>(lhs);
    const Bits right = static_cast<Bits>(rhs);
    return static_cast<TraceFlags>(left & right);
}
struct SpanContext {
UID traceID;
uint64_t spanID;
TraceFlags m_Flags;
SpanContext() : traceID(UID()), spanID(0), m_Flags(TraceFlags::unsampled) {}
SpanContext(UID traceID, uint64_t spanID, TraceFlags flags) : traceID(traceID), spanID(spanID), m_Flags(flags) {}
SpanContext(UID traceID, uint64_t spanID) : traceID(traceID), spanID(spanID), m_Flags(TraceFlags::unsampled) {}
SpanContext(Arena arena, const SpanContext& span)
: traceID(span.traceID), spanID(span.spanID), m_Flags(span.m_Flags) {}
bool isSampled() const { return (m_Flags & TraceFlags::sampled) == TraceFlags::sampled; }
std::string toString() const { return format("%016llx%016llx%016llx", traceID.first(), traceID.second(), spanID); };
bool isValid() const { return traceID.first() != 0 && traceID.second() != 0 && spanID != 0; }
template <class Ar>
void serialize(Ar& ar) {
serializer(ar, traceID, spanID, m_Flags);
}
};
// Span
//
// Span is a tracing implementation which, for the most part, complies with the W3C Trace Context specification
// https://www.w3.org/TR/trace-context/ and the OpenTelemetry API
// https://github.com/open-telemetry/opentelemetry-specification/blob/main/specification/trace/api.md.
//
// The major differences between Span and the 7.0 Span implementation, which is based off the OpenTracing.io
// specification https://opentracing.io/ are as follows.
// https://github.com/open-telemetry/opentelemetry-specification/blob/main/specification/trace/api.md#span
//
// OpenTelemetry Spans have...
// 1. A SpanContext which consists of 3 attributes.
//
// TraceId - A valid trace identifier is a 16-byte array with at least one non-zero byte.
// SpanId - A valid span identifier is an 8-byte array with at least one non-zero byte.
// TraceFlags - 1 byte, bit field for flags.
//
// TraceState is not implemented. Specifically, we do not provide some of the APIs described in
// https://www.w3.org/TR/trace-context/#mutating-the-tracestate-field, in particular those that delete or update a
// specific, arbitrary key/value pair. This complies with the OTEL specification, where SpanContexts are immutable.
// 2. A begin/end and those values are serialized, unlike the Span implementation which has an end but serializes with a
// begin and calculated duration field.
// 3. A SpanKind
// https://github.com/open-telemetry/opentelemetry-specification/blob/main/specification/trace/api.md#spankind
// 4. A SpanStatus
// https://github.com/open-telemetry/opentelemetry-specification/blob/main/specification/trace/api.md#set-status
// 5. A singular parent SpanContext, which may optionally be null, as opposed to our Span implementation which allows
// for a list of parents.
// 6. "Attributes" rather than "tags"; the implementation is essentially the same, however: a set of string
// key/value pairs, stored here as a SmallVectorRef<KeyValueRef> rather than a map as a convenience.
// https://github.com/open-telemetry/opentelemetry-specification/blob/main/specification/common/common.md#attributes
// 7. An optional list of linked SpanContexts.
// https://github.com/open-telemetry/opentelemetry-specification/blob/main/specification/trace/api.md#specifying-links
// 8. An optional list of timestamped Events.
// https://github.com/open-telemetry/opentelemetry-specification/blob/main/specification/trace/api.md#add-events
// Kind of a span. The names follow the SpanKind values of the OpenTelemetry tracing API.
enum class SpanKind : uint8_t {
    INTERNAL = 0,
    CLIENT = 1,
    SERVER = 2,
    PRODUCER = 3,
    CONSUMER = 4,
};
// Status recorded on a span.
enum class SpanStatus : uint8_t {
    UNSET = 0,
    OK = 1,
    ERR = 2,
};
// A named, timestamped event with optional key/value attributes, as stored in Span::events.
struct SpanEventRef {
    StringRef name;
    double time = 0.0;
    SmallVectorRef<KeyValueRef> attributes;

    // Empty event: default name and attributes, time 0.0.
    SpanEventRef() {}

    // Builds an event directly from the given name, time and attributes (no arena involved).
    SpanEventRef(const StringRef& name,
                 const double& time,
                 const SmallVectorRef<KeyValueRef>& attributes = SmallVectorRef<KeyValueRef>())
      : name(name), time(time), attributes(attributes) {}

    // Builds a copy of `other` whose name and attributes are constructed through `arena`.
    SpanEventRef(Arena& arena, const SpanEventRef& other)
      : name(arena, other.name), time(other.time), attributes(arena, other.attributes) {}
};
// A single tracing span: its own context, its parent's context, a location, begin/end times, links to other
// span contexts, attributes and events. Data referenced by `links`, `attributes` and `events` is allocated in
// `arena`, so those members must always travel together with `arena` when a Span is moved or swapped.
// Spans are move-only.
class Span {
public:
    // Construct a Span with a given context, location, parentContext and optional links.
    //
    // N.B. While this constructor receives a parentContext it does not overwrite the traceId of the Span's context.
    // Therefore it is the responsibility of the caller to ensure the traceID and m_Flags of both the context and
    // parentContext are identical if the caller wishes to establish a parent/child relationship between these spans. We
    // do this to avoid needless comparisons or copies as this constructor is only called once in NativeAPI.actor.cpp
    // and from below by the Span(location, parent, links) constructor. The Span(location, parent, links)
    // constructor is used broadly and performs the copy of the parent's traceID and m_Flags.
    //
    // The span starts as SpanKind::SERVER with SpanStatus::OK, and an "address" attribute holding the local
    // transport address is always attached here (it does not go through addAttribute()).
    Span(const SpanContext& context,
         const Location& location,
         const SpanContext& parentContext,
         const std::initializer_list<SpanContext>& links = {})
      : context(context), location(location), parentContext(parentContext), links(arena, links.begin(), links.end()),
        begin(g_network->now()) {
        this->kind = SpanKind::SERVER;
        this->status = SpanStatus::OK;
        this->attributes.push_back(
            this->arena,
            KeyValueRef("address"_sr, StringRef(this->arena, FlowTransport::transport().getLocalAddressAsString())));
    }

    // Construct Span with a location, parent, and optional links.
    // This constructor copies the parent's traceID creating a parent->child relationship between Spans.
    // Additionally we inherit the m_Flags of the parent, thus enabling or disabling sampling to match the parent.
    Span(const Location& location, const SpanContext& parent, const std::initializer_list<SpanContext>& links = {})
      : Span(SpanContext(parent.traceID, deterministicRandom()->randomUInt64(), parent.m_Flags),
             location,
             parent,
             links) {}

    // Construct Span without parent. Used for creating a root span, or when the parent is not known at construction
    // time.
    Span(const SpanContext& context, const Location& location) : Span(context, location, SpanContext()) {}

    // We've determined for initial tracing release, spans with only a location will not be traced.
    // Generally these are for background processes, some are called infrequently, while others may be high volume.
    // TODO: review and address in subsequent PRs.
    Span(const Location& location) : location(location), begin(g_network->now()) {}

    Span(const Span&) = delete;

    // Move constructor. Takes over the arena and everything allocated in it (links, attributes, events), copies
    // the scalar fields, then resets the source's context, parent context, kind, times and status.
    Span(Span&& o) {
        arena = std::move(o.arena);
        context = o.context;
        location = o.location;
        parentContext = std::move(o.parentContext);
        kind = o.kind;
        begin = o.begin;
        end = o.end;
        links = std::move(o.links);
        // attributes live in the arena taken above; they must move with it or the new span loses them.
        attributes = std::move(o.attributes);
        events = std::move(o.events);
        status = o.status;
        o.context = SpanContext();
        o.parentContext = SpanContext();
        o.kind = SpanKind::INTERNAL;
        o.begin = 0.0;
        o.end = 0.0;
        o.status = SpanStatus::UNSET;
    }

    // Empty span: default contexts and location, kind INTERNAL, status UNSET, begin/end 0.0.
    Span() {}
    ~Span();
    Span& operator=(Span&& o);
    Span& operator=(const Span&) = delete;

    // Exchange the complete state of two spans, member by member.
    void swap(Span& other) {
        std::swap(arena, other.arena);
        std::swap(context, other.context);
        std::swap(location, other.location);
        std::swap(parentContext, other.parentContext);
        std::swap(kind, other.kind);
        std::swap(status, other.status);
        std::swap(begin, other.begin);
        std::swap(end, other.end);
        std::swap(links, other.links);
        // attributes reference memory in the arena, so they have to be exchanged together with it.
        std::swap(attributes, other.attributes);
        std::swap(events, other.events);
    }

    // Append a link to another span context. If the link is sampled and this span is not, this span becomes
    // sampled as well. Returns *this for chaining.
    Span& addLink(const SpanContext& linkContext) {
        links.push_back(arena, linkContext);
        // Check if link is sampled, if so sample this span.
        if (!context.isSampled() && linkContext.isSampled()) {
            context.m_Flags = TraceFlags::sampled;
            // If for some reason this span isn't valid, we need to give it a
            // traceID and spanID. This case is currently hit in CommitProxyServer
            // CommitBatchContext::CommitBatchContext and CommitBatchContext::setupTraceBatch.
            if (!context.isValid()) {
                context.traceID = deterministicRandom()->randomUniqueID();
                context.spanID = deterministicRandom()->randomUInt64();
            }
        }
        return *this;
    }

    // Apply addLink() to every context in the list, in order. Returns *this for chaining.
    Span& addLinks(const std::initializer_list<SpanContext>& linkContexts = {}) {
        for (auto const& sc : linkContexts) {
            addLink(sc);
        }
        return *this;
    }

    // Append a deep copy of `event` (allocated in this span's arena). Returns *this for chaining.
    Span& addEvent(const SpanEventRef& event) {
        events.push_back_deep(arena, event);
        return *this;
    }

    // Convenience overload: builds the SpanEventRef from its parts and appends it.
    Span& addEvent(const StringRef& name,
                   const double& time,
                   const SmallVectorRef<KeyValueRef>& attrs = SmallVectorRef<KeyValueRef>()) {
        return addEvent(SpanEventRef(name, time, attrs));
    }

    // Append a key/value attribute (deep-copied into the arena), but only when the
    // TRACING_SPAN_ATTRIBUTES_ENABLED knob is set; otherwise this is a no-op. Returns *this for chaining.
    Span& addAttribute(const StringRef& key, const StringRef& value) {
        if (FLOW_KNOBS->TRACING_SPAN_ATTRIBUTES_ENABLED) {
            attributes.push_back_deep(arena, KeyValueRef(key, value));
        }
        return *this;
    }

    // Re-parent this span: adopt the parent's traceID and m_Flags and generate a fresh spanID.
    Span& setParent(const SpanContext& parent) {
        parentContext = parent;
        context.traceID = parent.traceID;
        context.spanID = deterministicRandom()->randomUInt64();
        context.m_Flags = parent.m_Flags;
        return *this;
    }

    Arena arena; // backing storage for links, attributes and events
    SpanContext context;
    Location location;
    SpanContext parentContext;
    // Initialized so that Span() and Span(location) never expose an indeterminate value; the defaults match
    // the values a moved-from Span is reset to.
    SpanKind kind = SpanKind::INTERNAL;
    SmallVectorRef<SpanContext> links;
    double begin = 0.0, end = 0.0;
    SmallVectorRef<KeyValueRef> attributes; // not necessarily sorted
    SmallVectorRef<SpanEventRef> events;
    SpanStatus status = SpanStatus::UNSET;
};
// Which tracer implementation is in use. The user picks one via a string passed to fdbserver on boot.
// Clients should not refer to TracerType directly: the mapping of names to enum values may change
// without notice.
enum class TracerType {
    DISABLED = 0,
    NETWORK_LOSSY = 1,
    // Any tracers that come after SIM_END will not be tested in simulation
    SIM_END = 2,
    LOG_FILE = 3,
};
struct ITracer {
virtual ~ITracer();
virtual TracerType type() const = 0;
// passed ownership to the tracer
virtual void trace(Span const& span) = 0;
};
// Opens the tracer identified by `type`. Only declared here; the definition lives outside this header.
// NOTE(review): presumably replaces whichever tracer is currently active — confirm against the definition.
void openTracer(TracerType type);
// A Deque<T> that carries a Span alongside its elements. Move-only: copying is deleted.
template <class T>
struct SpannedDeque : Deque<T> {
    Span span;

    // Creates an empty deque whose span is built from `loc` alone.
    explicit SpannedDeque(Location loc) : span(loc) {}

    // Moves the Deque<T> base and then the span out of `other`.
    SpannedDeque(SpannedDeque&& other) : Deque<T>(std::move(other)), span(std::move(other.span)) {}

    SpannedDeque(SpannedDeque const&) = delete;
    SpannedDeque& operator=(SpannedDeque const&) = delete;

    // Move-assigns the Deque<T> base and then the span; returns *this.
    SpannedDeque& operator=(SpannedDeque&& other) {
        // Only the Deque<T> base is assigned here, so other.span is still intact for the next line.
        *static_cast<Deque<T>*>(this) = std::move(other);
        span = std::move(other.span);
        // The function is declared to return SpannedDeque&; flowing off the end without a return is
        // undefined behaviour.
        return *this;
    }
};