Skip to content
Open
Show file tree
Hide file tree
Changes from 46 commits
Commits
Show all changes
59 commits
Select commit Hold shift + click to select a range
b8fd92e
fix
TAOXUY Mar 6, 2026
4dd73b0
iterate
TAOXUY Mar 6, 2026
4f243b3
stats: fix eviction of stats with active references
TAOXUY Mar 6, 2026
f44561b
format
TAOXUY Mar 8, 2026
32cc03e
fix: restore evictionDisabled and fix test
TAOXUY Mar 8, 2026
b9deaef
fix test
TAOXUY Mar 8, 2026
8ae0f97
fix test
TAOXUY Mar 9, 2026
4e530a7
fix
TAOXUY Mar 9, 2026
d5f87d2
fix
TAOXUY Mar 11, 2026
e5259b5
fix
TAOXUY Mar 11, 2026
7e9176a
fix
TAOXUY Mar 11, 2026
5628f8f
fix
TAOXUY Mar 11, 2026
77dac2d
fix
TAOXUY Mar 12, 2026
8ad7e93
fix
TAOXUY Mar 12, 2026
2995c40
fix
TAOXUY Mar 13, 2026
0ed297f
fix
TAOXUY Mar 16, 2026
464577d
Merge branch 'main' into fixStatDestructor
TAOXUY Mar 16, 2026
cbd6fba
fix
TAOXUY Mar 16, 2026
ee2a3ad
fix
TAOXUY Mar 17, 2026
e6a43a0
Merge branch 'main' into fixStatDestructor
TAOXUY Mar 17, 2026
b28e622
fix
TAOXUY Mar 17, 2026
fe1706c
protect over-subtract
TAOXUY Mar 17, 2026
a836a3a
fix
TAOXUY Mar 18, 2026
f6f870c
fix
TAOXUY Mar 18, 2026
7c910c9
fix
TAOXUY Mar 18, 2026
09e2737
fix
TAOXUY Mar 18, 2026
163fd59
fix
TAOXUY Mar 18, 2026
5b3a9af
fix
TAOXUY Mar 18, 2026
f54bb9f
fix
TAOXUY Mar 18, 2026
b927087
fix
TAOXUY Mar 18, 2026
80ce33d
fix
TAOXUY Mar 18, 2026
154c3b7
Merge branch 'main' into fixStatDestructor
TAOXUY Mar 18, 2026
71c8b8c
fix
TAOXUY Mar 18, 2026
8395f2b
fix
TAOXUY Mar 19, 2026
db26105
fix
TAOXUY Mar 19, 2026
ff3a7e0
fix
TAOXUY Mar 19, 2026
ab3f86e
add key test
TAOXUY Mar 19, 2026
2a8f97d
fix
TAOXUY Mar 19, 2026
1b1e6e0
Update source/extensions/access_loggers/stats/stats.cc
TAOXUY Mar 19, 2026
a9cdc38
fix
TAOXUY Mar 19, 2026
81cca1c
fix
TAOXUY Mar 20, 2026
0c6103d
format
TAOXUY Mar 20, 2026
b8d6c70
fix
TAOXUY Mar 20, 2026
cabad6d
fix
TAOXUY Mar 20, 2026
627aab0
fix
TAOXUY Mar 20, 2026
222c0fa
fix
TAOXUY Mar 20, 2026
f097aad
fix
TAOXUY Mar 21, 2026
713686f
fix
TAOXUY Mar 21, 2026
d15e5ed
fix
TAOXUY Mar 21, 2026
d8af134
fix
TAOXUY Mar 23, 2026
eabbbfd
Merge branch 'main' into fixStatDestructor
TAOXUY Mar 23, 2026
9b6ef12
add test
TAOXUY Mar 24, 2026
808a9c6
test: add memory footprint tests for GaugeKey and AccessLogState and …
TAOXUY Mar 24, 2026
d2d97fa
fix comment
TAOXUY Mar 24, 2026
98ef2b0
Apply suggestions from code review
TAOXUY Mar 25, 2026
8757699
Apply suggestions from code review
TAOXUY Mar 25, 2026
617b60b
add integration test for TCP
TAOXUY Mar 25, 2026
b4bdd87
fix
TAOXUY Mar 25, 2026
e447bea
fix
TAOXUY Mar 25, 2026
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
14 changes: 10 additions & 4 deletions source/common/stats/thread_local_store.cc
Original file line number Diff line number Diff line change
Expand Up @@ -1130,15 +1130,21 @@ void ThreadLocalStoreImpl::evictUnused() {
MetricBag metrics(scope->scope_id_);
CentralCacheEntrySharedPtr& central_cache = scope->centralCacheMutableNoThreadAnalysis();
auto filter_unused = []<typename T>(StatNameHashMap<T>& unused_metrics) {
return [&unused_metrics](std::pair<StatName, T> kv) {
return [&unused_metrics](const std::pair<const StatName, T>& kv) {
const auto& [name, metric] = kv;
// We assume the gauge is used as an `updown` counter here and if the value is 0, it is
// unused.
if constexpr (std::is_same_v<T, GaugeSharedPtr>) {
if (metric->value() != 0) {
return false;
}
}
if (metric->used()) {
metric->markUnused();
return false;
} else {
unused_metrics.try_emplace(name, metric);
return true;
}
unused_metrics.try_emplace(name, metric);
return true;
};
};
absl::erase_if(central_cache->counters_, filter_unused(metrics.counters_));
Expand Down
147 changes: 90 additions & 57 deletions source/extensions/access_loggers/stats/stats.cc
Original file line number Diff line number Diff line change
Expand Up @@ -19,64 +19,72 @@ using Extensions::Matching::Actions::TransformStat::ActionContext;

class AccessLogState : public StreamInfo::FilterState::Object {
public:
AccessLogState(Stats::ScopeSharedPtr scope) : scope_(std::move(scope)) {}
AccessLogState(std::shared_ptr<const StatsAccessLog> parent) : parent_(std::move(parent)) {}

// When the request is destroyed, we need to subtract the value from the gauge.
// We need to look up the gauge again in the scope because it might have been evicted.
// The gauge object itself is kept alive by the shared_ptr in the state, so we can access its
// name and tags to re-lookup/re-create it in the scope.
~AccessLogState() override {
for (const auto& [gauge_ptr, state] : inflight_gauges_) {
// TODO(taoxuy): make this as an accessor of the
// Stat class.
Stats::StatNameTagVector tag_names;
state.gauge_->iterateTagStatNames(
[&tag_names](Stats::StatName name, Stats::StatName value) -> bool {
tag_names.emplace_back(name, value);
return true;
});

// Using state.gauge_->statName() directly would be incorrect because it returns the fully
// qualified name (including tags). Passing this full name to scope_->gaugeFromStatName(...)
// would cause the scope to attempt tag extraction on the full name. Since the tags in
// AccessLogState are often dynamic and not configured in the global tag extractors, this
// extraction would likely fail to identify the tags correctly, resulting in a gauge with a
// different identity (the full name as the stat name and no tags).
auto& gauge = scope_->gaugeFromStatNameWithTags(
state.gauge_->tagExtractedStatName(), tag_names, Stats::Gauge::ImportMode::Accumulate);
gauge.sub(state.value_);
for (const std::pair<const GaugeKey, InflightGauge>& p : inflight_gauges_) {
Stats::Gauge& gauge_stat = parent_->scope().gaugeFromStatNameWithTags(
p.first.stat_name_, p.first.tags(), p.first.import_mode_);
gauge_stat.sub(p.second.value_);
}
}

void addInflightGauge(Stats::Gauge* gauge, uint64_t value) {
inflight_gauges_.try_emplace(gauge, Stats::GaugeSharedPtr(gauge), value);
}
void addInflightGauge(Stats::StatName stat_name, Stats::StatNameTagVectorOptConstRef tags,
Stats::Gauge::ImportMode import_mode, uint64_t value,
std::vector<Stats::StatNameDynamicStorage> tags_storage) {
if (value == 0) {
return;
}

absl::optional<uint64_t> removeInflightGauge(Stats::Gauge* gauge) {
auto it = inflight_gauges_.find(gauge);
GaugeKey key{stat_name, import_mode, tags};

auto it = inflight_gauges_.find(key);
if (it == inflight_gauges_.end()) {
return absl::nullopt;
key.makeOwned();
auto [new_it, inserted] =
inflight_gauges_.emplace(std::move(key), InflightGauge{std::move(tags_storage), 0});
it = new_it;
}
it->second.value_ += value;
parent_->scope().gaugeFromStatNameWithTags(stat_name, tags, import_mode).add(value);
}

void removeInflightGauge(Stats::StatName stat_name, Stats::StatNameTagVectorOptConstRef tags,
Stats::Gauge::ImportMode import_mode, uint64_t value) {
if (value == 0) {
return;
}

GaugeKey key{stat_name, import_mode, tags};

// Create the gauge so it gets registered in the stat store (expected by some tests and stats
// logic)
Stats::Gauge& gauge_stat =
parent_->scope().gaugeFromStatNameWithTags(stat_name, tags, import_mode);

auto it = inflight_gauges_.find(key);
if (it != inflight_gauges_.end()) {
it->second.value_ -= value;
gauge_stat.sub(value);
if (it->second.value_ == 0) {
inflight_gauges_.erase(it);
}
}
uint64_t value = it->second.value_;
inflight_gauges_.erase(it);
return value;
}

static constexpr absl::string_view key() { return "envoy.access_loggers.stats.access_log_state"; }

private:
struct State {
State(Stats::GaugeSharedPtr gauge, uint64_t value) : gauge_(std::move(gauge)), value_(value) {}
// Hold a shared_ptr to the parent to ensure the parent and its members exist for the lifetime of
// AccessLogState.
std::shared_ptr<const StatsAccessLog> parent_;

Stats::GaugeSharedPtr gauge_;
struct InflightGauge {
std::vector<Stats::StatNameDynamicStorage> tags_storage_;
uint64_t value_;
};

Stats::ScopeSharedPtr scope_;

// The map key holds a raw pointer to the gauge. The value holds a ref-counted pointer to ensure
// the gauge is not destroyed if it is evicted from the stats scope.
absl::flat_hash_map<Stats::Gauge*, State> inflight_gauges_;
absl::flat_hash_map<GaugeKey, InflightGauge> inflight_gauges_;
};

Formatter::FormatterProviderPtr
Expand Down Expand Up @@ -138,6 +146,36 @@ class TagActionValidationVisitor

} // namespace

GaugeKey::GaugeKey(Stats::StatName stat_name, Stats::Gauge::ImportMode import_mode,
Stats::StatNameTagVectorOptConstRef borrowed_tags)
: stat_name_(stat_name), import_mode_(import_mode), borrowed_tags_(borrowed_tags) {}

// Converts a borrowing key into an owning one: the referenced tag vector is copied into
// `owned_tags_` and the borrowed reference is cleared. Does nothing when there are no borrowed
// tags or when the key already owns a copy.
void GaugeKey::makeOwned() {
  if (owned_tags_.has_value() || !borrowed_tags_.has_value()) {
    return;
  }
  // Copy first, then drop the reference, so tags() never observes an empty key in between.
  owned_tags_.emplace(borrowed_tags_->get());
  borrowed_tags_.reset();
}

// Returns the tags this key describes, wherever they are stored: a reference to the owned copy
// when one exists, otherwise the borrowed reference (which may itself be empty).
Stats::StatNameTagVectorOptConstRef GaugeKey::tags() const {
  if (!owned_tags_.has_value()) {
    return borrowed_tags_;
  }
  return std::cref(*owned_tags_);
}

// Two keys are equal when they name the same stat with the same import mode and carry the same
// logical tags. Tags are compared through tags(), so an owning key and a borrowing key with equal
// tag contents compare equal.
bool GaugeKey::operator==(const GaugeKey& rhs) const {
  if (import_mode_ != rhs.import_mode_ || stat_name_ != rhs.stat_name_) {
    return false;
  }
  const Stats::StatNameTagVectorOptConstRef mine = tags();
  const Stats::StatNameTagVectorOptConstRef theirs = rhs.tags();
  if (mine.has_value() && theirs.has_value()) {
    return mine->get() == theirs->get();
  }
  // At least one side has no tags: equal only if neither side has them.
  return mine.has_value() == theirs.has_value();
}

StatsAccessLog::StatsAccessLog(const envoy::extensions::access_loggers::stats::v3::Config& config,
Server::Configuration::GenericFactoryContext& context,
AccessLog::FilterPtr&& filter,
Expand Down Expand Up @@ -417,31 +455,26 @@ void StatsAccessLog::emitLogForGauge(const Gauge& gauge, const Formatter::Contex
Stats::Gauge::ImportMode import_mode = op == Gauge::OperationType::SET
? Stats::Gauge::ImportMode::NeverImport
: Stats::Gauge::ImportMode::Accumulate;
auto& gauge_stat = scope_->gaugeFromStatNameWithTags(gauge.stat_.name_, tags, import_mode);

if (op == Gauge::OperationType::PAIRED_ADD || op == Gauge::OperationType::PAIRED_SUBTRACT) {
if (op == Gauge::OperationType::SET) {
Stats::Gauge& gauge_stat =
scope_->gaugeFromStatNameWithTags(gauge.stat_.name_, tags, import_mode);
gauge_stat.set(value);
} else if (op == Gauge::OperationType::PAIRED_ADD ||
op == Gauge::OperationType::PAIRED_SUBTRACT) {
auto& filter_state = const_cast<StreamInfo::FilterState&>(stream_info.filterState());
if (!filter_state.hasData<AccessLogState>(AccessLogState::key())) {
filter_state.setData(AccessLogState::key(), std::make_shared<AccessLogState>(scope_),
StreamInfo::FilterState::StateType::Mutable,
StreamInfo::FilterState::LifeSpan::Request);
filter_state.setData(
AccessLogState::key(), std::make_shared<AccessLogState>(shared_from_this()),
StreamInfo::FilterState::StateType::Mutable, StreamInfo::FilterState::LifeSpan::Request);
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

What if this is a connection-level access log, like a listener access log? I'm not sure what a lifespan of Request does in that case, but it may not do the right thing. I think this should be addressed in a separate PR, but it just came to mind so I wanted to mention it.

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Good catch! I updated the comment to note that this should work for TCP connections, and I have added an integration test for TCP.

}
auto* state = filter_state.getDataMutable<AccessLogState>(AccessLogState::key());

if (op == Gauge::OperationType::PAIRED_ADD) {
state->addInflightGauge(&gauge_stat, value);
gauge_stat.add(value);
state->addInflightGauge(gauge.stat_.name_, tags, import_mode, value, std::move(storage));
} else {
absl::optional<uint64_t> added_value = state->removeInflightGauge(&gauge_stat);
if (added_value.has_value()) {
gauge_stat.sub(added_value.value());
}
state->removeInflightGauge(gauge.stat_.name_, tags, import_mode, value);
}
return;
}

if (op == Gauge::OperationType::SET) {
gauge_stat.set(value);
}
}

Expand Down
48 changes: 47 additions & 1 deletion source/extensions/access_loggers/stats/stats.h
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,7 @@
#include "envoy/stats/tag.h"

#include "source/common/matcher/matcher.h"
#include "source/common/stats/symbol_table.h"
#include "source/extensions/access_loggers/common/access_log_base.h"
#include "source/extensions/matching/actions/transform_stat/transform_stat.h"

Expand All @@ -14,8 +15,52 @@ namespace Extensions {
namespace AccessLoggers {
namespace StatsAccessLog {

class StatsAccessLog : public AccessLoggers::Common::ImplBase {
// GaugeKey serves as a lock-free map key composed of exactly the configuration
// properties that define a fully resolved gauge metric.
//
// It preserves the raw components (base name + tags) allowing us to safely
// re-create the gauge from the scope if it gets evicted while the request is in-flight.
//
// To avoid heap-allocating a new std::vector on every map lookup (which happens
// on every single gauge increment/decrement), this key acts as a lightweight
// zero-allocation "view" using `borrowed_tags_` during map lookups.
// When the key actually needs to be safely persisted into the map, `makeOwned()`
// is explicitly called to allocate and copy the tags into `owned_tags_`.
struct GaugeKey {
Stats::StatName stat_name_;
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

should makeOwned ensure that stat_name has local backup also? stat_name is like string_view.

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I scanned this a bit more and I am not understanding why the backing-store management for stat_name differs from the backing-store management for tags.

I think the stat-name comes from some pre-existing gauge but I am having a hard time keeping this all in my head. Wherever you get the name from should have the tags; there should be no need to copy the tags if you are copying the name.

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Because stat_name_ always comes from the persistent static configuration of the StatsAccessLog (which is kept alive by std::shared_ptr in the AccessLogState filter state), whereas the tags are dynamic and computed per request.

Since the static name outlives the request, it is safe without local storage. The tags, however, are dynamic and need to be persisted if they are pushed to the background/delayed logging map.

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I can see you copying the vector of tag name/value pairs, but I do not see how the backing store of the tag names & values is managed. Copying the vector won't copy the backing store of the tag names & values.

I think that ultimately if you are creating a new gauge, the gauge should own the tag names/values that are held in the GaugeKey.

Actually I think maybe the best way to manage the backing store is to have an OptRef<Gauge> in the GaugeKey.

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

The backing store is in the map value(InflightGauge.tags_storage_).
image

the best way to manage the backing store is to to have an OptRef

I don't follow. Can you explain a little?

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

One example: suppose two such stats access loggers define the same gauge. The time sequence is:

  • one access logger adds 1 to the gauge
  • the other access logger sets the gauge to 0
  • eviction happens
  • the first access logger now subtracts 1

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Sorry, let me ask this a different way.

If you have a loop like

for (int i = 0; i < a billion; ++i) {
  allocate gauge and store in map
  evict gauge
}

what happens to the map?

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Shared the benchmarking offline

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

The benchmark test added for AccessLogState

Stats::Gauge::ImportMode import_mode_;
absl::optional<Stats::StatNameTagVector> owned_tags_;
Stats::StatNameTagVectorOptConstRef borrowed_tags_{absl::nullopt};

GaugeKey(Stats::StatName stat_name, Stats::Gauge::ImportMode import_mode,
Stats::StatNameTagVectorOptConstRef borrowed_tags);

void makeOwned();

Stats::StatNameTagVectorOptConstRef tags() const;

bool operator==(const GaugeKey& rhs) const;

template <typename H> friend H AbslHashValue(H h, const GaugeKey& key) {
// We hash the logical tag content to match operator== behavior, ignoring
// whether the tags are stored in owned_tags_ or borrowed_tags_. This ensures
// that two equal keys produce the same hash regardless of their storage representation.
Stats::StatNameTagVectorOptConstRef tags = key.tags();
if (tags.has_value()) {
h = H::combine(std::move(h), key.stat_name_, key.import_mode_, true);
for (const auto& tag : tags.value().get()) {
h = H::combine(std::move(h), tag.first, tag.second);
}
return h;
}
return H::combine(std::move(h), key.stat_name_, key.import_mode_, false);
}
};

class StatsAccessLog : public AccessLoggers::Common::ImplBase,
public std::enable_shared_from_this<StatsAccessLog> {
public:
Stats::Scope& scope() const { return *scope_; }
StatsAccessLog(const envoy::extensions::access_loggers::stats::v3::Config& config,
Server::Configuration::GenericFactoryContext& context,
AccessLog::FilterPtr&& filter,
Expand Down Expand Up @@ -103,6 +148,7 @@ class StatsAccessLog : public AccessLoggers::Common::ImplBase {
};

} // namespace StatsAccessLog

} // namespace AccessLoggers
} // namespace Extensions
} // namespace Envoy
Loading
Loading