diff --git a/.github/ai-opt-out b/.github/ai-opt-out
new file mode 100644
index 00000000000..f2bf078d222
--- /dev/null
+++ b/.github/ai-opt-out
@@ -0,0 +1 @@
+opt-out: true
diff --git a/.github/workflows/tests.yaml b/.github/workflows/tests.yaml
index 1cef39e1945..7abc185173f 100644
--- a/.github/workflows/tests.yaml
+++ b/.github/workflows/tests.yaml
@@ -39,6 +39,32 @@ jobs:
       mode: release
       enables: --enable-dpdk
       options: --cook dpdk --dpdk-machine corei7-avx
+    # disable dpdk build as we don't use it and it is
+    # long and breaks now and then: it still runs
+    # upstream
+    if: false
+
+  build_with_dual_tls:
+    name: "Test with both TLS backends"
+    uses: ./.github/workflows/test.yaml
+    strategy:
+      fail-fast: false
+    with:
+      compiler: clang++
+      standard: 23
+      mode: debug
+      options: --tls-mode=both
+
+  build_with_openssl_tls:
+    name: "Test with OpenSSL TLS backend only"
+    uses: ./.github/workflows/test.yaml
+    strategy:
+      fail-fast: false
+    with:
+      compiler: clang++
+      standard: 23
+      mode: debug
+      options: --tls-mode=openssl
 
   build_with_cxx_modules:
     name: "Test with C++20 modules enabled"
@@ -51,6 +77,9 @@ jobs:
       mode: debug
       enables: --enable-cxx-modules
       enable-ccache: false
+    # disable modules build as we aren't using modules and it is quite
+    # broken at the moment
+    if: false
 
   fuzz_test:
     name: "Fuzz Tests"
diff --git a/CMakeLists.txt b/CMakeLists.txt
index bacd7a7fb4a..da32c419ab1 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -525,11 +525,13 @@ seastar_generate_protobuf (
   IN_FILE ${CMAKE_CURRENT_SOURCE_DIR}/src/proto/metrics2.proto
   OUT_DIR ${Seastar_GEN_BINARY_DIR}/src/proto)
 
-set_option_if_package_is_found (Seastar_GNUTLS GnuTLS)
-set_option_if_package_is_found (Seastar_OPENSSL OpenSSL)
+option (Seastar_GNUTLS "Enable the GnuTLS-based TLS backend" ON)
+option (Seastar_OPENSSL "Enable the OpenSSL-based TLS backend" OFF)
 
 if (NOT Seastar_GNUTLS AND NOT Seastar_OPENSSL)
-  message (FATAL_ERROR "At least one TLS/crypto backend is required. Install GnuTLS or OpenSSL development packages.")
+  message (FATAL_ERROR "At least one TLS backend must be enabled. "
+    "Pass -DSeastar_GNUTLS=ON and/or -DSeastar_OPENSSL=ON, "
+    "or use configure.py --tls-mode=gnutls|openssl|both.")
 endif ()
 
 add_library (seastar
@@ -722,6 +724,7 @@ add_library (seastar
   src/core/reactor_backend.cc
   src/core/thread_pool.cc
   src/core/app-template.cc
+  src/core/cpu_profiler.cc
   src/core/disk_params.cc
   src/core/dpdk_rte.cc
   src/core/exception_hacks.cc
@@ -755,6 +758,7 @@ add_library (seastar
   src/core/semaphore.cc
   src/core/condition-variable.cc
   src/core/crypto.cc
+  src/core/signal_mutex.cc
   src/http/api_docs.cc
   src/http/common.cc
   src/http/file_handler.cc
@@ -1132,6 +1136,15 @@ if (Seastar_OPENSSL)
     PRIVATE OpenSSL::SSL OpenSSL::Crypto)
 endif ()
 
+if (Seastar_GNUTLS AND Seastar_OPENSSL)
+  # Public marker: both TLS backends are compiled in, so the active backend is
+  # selected at reactor startup. Code that needs to handle the no-reactor case
+  # (e.g. static initializers, unit tests without a reactor) can use this to
+  # distinguish from the single-backend builds where the backend is fixed at
+  # compile time and available unconditionally.
+  target_compile_definitions (seastar PUBLIC SEASTAR_TLS_DUAL_BACKEND)
+endif ()
+
 set_option_if_package_is_found (Seastar_IO_URING LibUring)
 if (Seastar_IO_URING)
   list (APPEND Seastar_PRIVATE_COMPILE_DEFINITIONS SEASTAR_HAVE_URING)
diff --git a/apps/memcached/memcache.cc b/apps/memcached/memcache.cc
index 6933e9e3975..6746e0fc07b 100644
--- a/apps/memcached/memcache.cc
+++ b/apps/memcached/memcache.cc
@@ -893,7 +893,7 @@ class ascii_protocol {
 private:
     static void append(std::vector<temporary_buffer<char>>& bufs, const char* buf, size_t size) {
         if (size) {
-            bufs.emplace_back(const_cast<char*>(buf), size, deleter());
+            bufs.push_back(temporary_buffer<char>::maybe_unsafe_from_deleter(const_cast<char*>(buf), size, deleter()));
         }
     }
 
@@ -917,7 +917,7 @@ class ascii_protocol {
 
         append(bufs, msg_crlf);
         append(bufs, item->value());
-        bufs.emplace_back(const_cast<char*>(msg_crlf), strlen(msg_crlf), make_deleter([item = std::move(item)]{}));
+        bufs.push_back(temporary_buffer<char>::maybe_unsafe_from_deleter(const_cast<char*>(msg_crlf), strlen(msg_crlf), make_deleter([item = std::move(item)]{})));
     }
 
     template <bool WithVersion>
diff --git a/configure.py b/configure.py
index 1cd299e5fa4..ca81cf1781b 100755
--- a/configure.py
+++ b/configure.py
@@ -173,6 +173,9 @@ def resolve_compilers_for_compiler_cache(args, compiler_cache):
 arg_parser.add_argument('--verbose', dest='verbose', action='store_true', help='Make configure output more verbose.')
 arg_parser.add_argument('--scheduling-groups-count', action='store', dest='scheduling_groups_count', default='16',
                         help='Number of available scheduling groups in the reactor')
+arg_parser.add_argument('--tls-mode', action='store', dest='tls_mode',
+                        choices=['gnutls', 'openssl', 'both'], default='gnutls',
+                        help='TLS backend(s) to enable: gnutls (default), openssl, or both')
 
 add_tristate(
     arg_parser,
@@ -289,6 +292,8 @@ def configure_mode(mode):
         '-DBUILD_SHARED_LIBS={}'.format('yes' if mode in ('debug', 'dev') else 'no'),
         '-DSeastar_API_LEVEL={}'.format(args.api_level),
         '-DSeastar_SCHEDULING_GROUPS_COUNT={}'.format(args.scheduling_groups_count),
+        '-DSeastar_GNUTLS={}'.format('ON' if args.tls_mode in ('gnutls', 'both') else 'OFF'),
+        '-DSeastar_OPENSSL={}'.format('ON' if args.tls_mode in ('openssl', 'both') else 'OFF'),
         tr(args.exclude_tests, 'EXCLUDE_TESTS_FROM_ALL'),
         tr(args.exclude_apps, 'EXCLUDE_APPS_FROM_ALL'),
         tr(args.exclude_demos, 'EXCLUDE_DEMOS_FROM_ALL'),
diff --git a/demos/tls_echo_server.hh b/demos/tls_echo_server.hh
index e7185dac95e..4c633b1c520 100644
--- a/demos/tls_echo_server.hh
+++ b/demos/tls_echo_server.hh
@@ -46,70 +46,86 @@ class echoserver {
     seastar::gate _gate;
     bool _stopped = false;
     bool _verbose = false;
+
+    future<stop_iteration> run_once() {
+        if (_stopped) {
+            return make_ready_future<stop_iteration>(stop_iteration::yes);
+        }
+        return with_gate(_gate, [this] {
+            return _socket.accept().then([this](accept_result ar) {
+                ::connected_socket s = std::move(ar.connection);
+                    socket_address a = std::move(ar.remote_address);
+                    if (_verbose) {
+                        std::cout << "Got connection from "<< a << std::endl;
+                    }
+                    auto strms = make_lw_shared<streams>(std::move(s));
+                    return repeat([strms, this]() {
+                        return strms->in.read().then([this, strms](temporary_buffer<char> buf) {
+                            if (buf.empty()) {
+                                if (_verbose) {
+                                    std::cout << "EOM" << std::endl;
+                                }
+                                return make_ready_future<stop_iteration>(stop_iteration::yes);
+                            }
+                            sstring tmp(buf.begin(), buf.end());
+                            if (_verbose) {
+                                std::cout << "Read " << tmp.size() << "B" << std::endl;
+                            }
+                            return strms->out.write(tmp).then([strms]() {
+                                return strms->out.flush();
+                            }).then([] {
+                                return make_ready_future<stop_iteration>(stop_iteration::no);
+                            });
+                        });
+                    }).then([strms]{
+                        return strms->out.close();
+                    }).handle_exception([](auto ep) {
+                        std::cout << "Exception: " << ep << std::endl;
+                    }).finally([this, strms]{
+                        if (_verbose) {
+                            std::cout << "Ending session" << std::endl;
+                        }
+                        return strms->in.close();
+                    });
+            }).handle_exception([this](auto ep) {
+                if (!_stopped) {
+                    std::cerr << "Error: " << ep << std::endl;
+                }
+            }).then([this] {
+                return make_ready_future<stop_iteration>(_stopped ? stop_iteration::yes : stop_iteration::no);
+            });
+        });
+    }
 public:
     echoserver(bool verbose = false)
             : _certs(make_shared<tls::server_credentials>(make_shared<tls::dh_params>()))
             , _verbose(verbose)
     {}
 
-    future<> listen(socket_address addr, sstring crtfile, sstring keyfile, tls::client_auth ca = tls::client_auth::NONE) {
-        _certs->set_client_auth(ca);
-        return _certs->set_x509_key_file(crtfile, keyfile, tls::x509_crt_format::PEM).then([this, addr] {
-            ::listen_options opts;
-            opts.reuse_address = true;
+    future<> listen(socket_address addr, sstring crtfile, sstring keyfile, sstring cafile) {
+        _certs->set_dn_verification_callback([](seastar::tls::session_type, sstring subject, sstring issuer){
+            std::cout << "DN Verification callback, subject: " << subject << " issuer: " << issuer << std::endl;
+        });
+        auto f = make_ready_future();
+        auto cauth = tls::client_auth::NONE;
+        if (cafile != "") {
+            cauth = tls::client_auth::REQUIRE;
+            f = _certs->set_x509_trust_file(cafile, tls::x509_crt_format::PEM);
+        }
+        _certs->set_client_auth(cauth);
+        return f.then([this, addr, crtfile, keyfile] {
+            return _certs->set_x509_key_file(crtfile, keyfile, tls::x509_crt_format::PEM).then([this, addr] {
+                ::listen_options opts;
+                    opts.reuse_address = true;
 
-            _socket = tls::listen(_certs, addr, opts);
+                    _socket = tls::listen(_certs, addr, opts);
 
-            // Listen in background.
-            (void)repeat([this] {
-                if (_stopped) {
-                    return make_ready_future<stop_iteration>(stop_iteration::yes);
-                }
-                return with_gate(_gate, [this] {
-                    return _socket.accept().then([this](accept_result ar) {
-                        ::connected_socket s = std::move(ar.connection);
-                        socket_address a = std::move(ar.remote_address);
-                        if (_verbose) {
-                            std::cout << "Got connection from "<< a << std::endl;
-                        }
-                        auto strms = make_lw_shared<streams>(std::move(s));
-                        return repeat([strms, this]() {
-                            return strms->in.read().then([this, strms](temporary_buffer<char> buf) {
-                                if (buf.empty()) {
-                                    if (_verbose) {
-                                        std::cout << "EOM" << std::endl;
-                                    }
-                                    return make_ready_future<stop_iteration>(stop_iteration::yes);
-                                }
-                                sstring tmp(buf.begin(), buf.end());
-                                if (_verbose) {
-                                    std::cout << "Read " << tmp.size() << "B" << std::endl;
-                                }
-                                return strms->out.write(tmp).then([strms]() {
-                                    return strms->out.flush();
-                                }).then([] {
-                                    return make_ready_future<stop_iteration>(stop_iteration::no);
-                                });
-                            });
-                        }).then([strms]{
-                            return strms->out.close();
-                        }).handle_exception([](auto ep) {
-                        }).finally([this, strms]{
-                            if (_verbose) {
-                                std::cout << "Ending session" << std::endl;
-                            }
-                            return strms->in.close();
-                        });
-                    }).handle_exception([this](auto ep) {
-                        if (!_stopped) {
-                            std::cerr << "Error: " << ep << std::endl;
-                        }
-                    }).then([this] {
-                        return make_ready_future<stop_iteration>(_stopped ? stop_iteration::yes : stop_iteration::no);
+                    // Listen in background.
+                    (void)repeat([this] {
+                        return run_once();
                     });
-                });
+                    return make_ready_future();
             });
-            return make_ready_future();
         });
     }
 
diff --git a/demos/tls_echo_server_demo.cc b/demos/tls_echo_server_demo.cc
index 4c445fea973..9611f5e8b06 100644
--- a/demos/tls_echo_server_demo.cc
+++ b/demos/tls_echo_server_demo.cc
@@ -37,6 +37,7 @@ int main(int ac, char** av) {
     app.add_options()
                     ("port", bpo::value<uint16_t>()->default_value(10000), "Server port")
                     ("address", bpo::value<std::string>()->default_value("127.0.0.1"), "Server address")
+                    ("ca,a", bpo::value<std::string>()->default_value(""), "Server CA chain file")
                     ("cert,c", bpo::value<std::string>()->required(), "Server certificate file")
                     ("key,k", bpo::value<std::string>()->required(), "Certificate key")
                     ("verbose,v", bpo::value<bool>()->default_value(false)->implicit_value(true), "Verbose")
@@ -46,6 +47,7 @@ int main(int ac, char** av) {
             seastar_apps_lib::stop_signal stop_signal;
             auto&& config = app.configuration();
             uint16_t port = config["port"].as<uint16_t>();
+            auto ca = config["ca"].as<std::string>();
             auto crt = config["cert"].as<std::string>();
             auto key = config["key"].as<std::string>();
             auto addr = config["address"].as<std::string>();
@@ -61,7 +63,7 @@ int main(int ac, char** av) {
             auto stop_server = deferred_stop(server);
 
             try {
-                server.invoke_on_all(&echoserver::listen, socket_address(ia), sstring(crt), sstring(key), tls::client_auth::NONE).get();
+                server.invoke_on_all(&echoserver::listen, socket_address(ia), sstring(crt), sstring(key),sstring(ca)).get();
             } catch (...) {
                 std::cerr << "Error: " << std::current_exception() << std::endl;
                 return 1;
diff --git a/demos/tls_simple_client_demo.cc b/demos/tls_simple_client_demo.cc
index d35b451d229..a83ed798f8b 100644
--- a/demos/tls_simple_client_demo.cc
+++ b/demos/tls_simple_client_demo.cc
@@ -39,6 +39,8 @@ int main(int ac, char** av) {
                     ("port", bpo::value<uint16_t>()->default_value(10000), "Remote port")
                     ("address", bpo::value<std::string>()->default_value("127.0.0.1"), "Remote address")
                     ("trust,t", bpo::value<std::string>(), "Trust store")
+                    ("certificate", bpo::value<std::string>(), "Certificate")
+                    ("key,k", bpo::value<std::string>(), "Private Keyfile")
                     ("msg,m", bpo::value<std::string>(), "Message to send")
                     ("bytes,b", bpo::value<size_t>()->default_value(512), "Use random bytes of length as message")
                     ("iterations,i", bpo::value<size_t>()->default_value(1), "Repeat X times")
@@ -68,6 +70,15 @@ int main(int ac, char** av) {
             f = certs->set_x509_trust_file(config["trust"].as<std::string>(), tls::x509_crt_format::PEM);
         }
 
+        if (config.count("certificate") && config.count("key")) {
+            f = f.then([certs,
+                        cert = config["certificate"].as<std::string>(),
+                        key = config["key"].as<std::string>()]{
+                return certs->set_x509_key_file(cert, key, tls::x509_crt_format::PEM);
+            });
+        }
+
+
         seastar::shared_ptr<sstring> msg;
 
         if (config.count("msg")) {
diff --git a/demos/udp_zero_copy_demo.cc b/demos/udp_zero_copy_demo.cc
index 79dae99444f..c59b238138a 100644
--- a/demos/udp_zero_copy_demo.cc
+++ b/demos/udp_zero_copy_demo.cc
@@ -107,7 +107,7 @@ class server {
                     if (_copy) {
                         bufs.emplace_back(temporary_buffer<char>(chunk, _chunk_size));
                     } else {
-                        bufs.emplace_back(temporary_buffer<char>(chunk, _chunk_size, deleter()));
+                        bufs.emplace_back(temporary_buffer<char>::maybe_unsafe_from_deleter(chunk, _chunk_size, deleter()));
                     }
                     chunk += _chunk_size;
                 }
diff --git a/include/seastar/core/deleter.hh b/include/seastar/core/deleter.hh
index 371459e242f..9db9e0c61ee 100644
--- a/include/seastar/core/deleter.hh
+++ b/include/seastar/core/deleter.hh
@@ -21,13 +21,26 @@
 
 #pragma once
 
+#include <atomic>
 #include <cassert>
 #include <cstdint>
 #include <cstdlib>
 #include <new>
 #include <utility>
 
+// The forward declarations of classes below are used for
+// friending by the deleter.
+struct test_deleter_append_does_not_free_shared_object;
+struct test_deleter_append_same_shared_object_twice;
+
 namespace seastar {
+namespace net {
+    class packet;
+}
+namespace internal {
+    struct wrapped_iovecs;
+}
+class pipe_data_sink_impl;
 
 /// \addtogroup memory-module
 /// @{
@@ -82,11 +95,21 @@ public:
         this->~deleter();
         new (this) deleter(i);
     }
+private:
     /// \endcond
     /// Appends another deleter to this deleter.  When this deleter is
     /// destroyed, both encapsulated actions will be carried out.
+    ///
+    /// This operation is not thread-safe and therefore not made public
+    /// except for a few manually verified uses that are marked as friends
+    /// below.
     void append(deleter d);
-private:
+    friend class ::seastar::net::packet;
+    friend struct ::test_deleter_append_does_not_free_shared_object;
+    friend struct ::test_deleter_append_same_shared_object_twice;
+    friend struct ::seastar::internal::wrapped_iovecs;
+    friend class ::seastar::pipe_data_sink_impl;
+
     static bool is_raw_object(impl* i) noexcept {
         auto x = reinterpret_cast<uintptr_t>(i);
         return x & 1;
@@ -109,7 +132,9 @@ private:
 
 /// \cond internal
 struct deleter::impl {
-    unsigned refs = 1;
+    // The memory ordering on operations to this counter is similar to
+    // std::shared_ptr.
+    std::atomic<unsigned int> refs = 1;
     deleter next;
     impl(deleter next) : next(std::move(next)) {}
     virtual ~impl() {}
@@ -122,7 +147,7 @@ deleter::~deleter() {
         std::free(to_raw_object());
         return;
     }
-    if (_impl && --_impl->refs == 0) {
+    if (_impl && _impl->refs.fetch_sub(1, std::memory_order_acq_rel) == 1) {
         delete _impl;
     }
 }
@@ -203,7 +228,7 @@ deleter::share() {
     if (is_raw_object()) {
         _impl = new free_deleter_impl(to_raw_object());
     }
-    ++_impl->refs;
+    _impl->refs.fetch_add(1, std::memory_order_relaxed);
     return deleter(_impl);
 }
 
diff --git a/include/seastar/core/disk_params.hh b/include/seastar/core/disk_params.hh
index 9bbd51e909f..3a8846add75 100644
--- a/include/seastar/core/disk_params.hh
+++ b/include/seastar/core/disk_params.hh
@@ -45,6 +45,7 @@ struct disk_params {
     std::optional<uint32_t> physical_block_size; // Override for disks that lie about their physical block size
     bool duplex = false;
     float rate_factor = 1.0;
+    bool max_cost_function = true;
 };
 
 class disk_config_params {
diff --git a/include/seastar/core/file.hh b/include/seastar/core/file.hh
index 6dc41b67985..19c69ea3250 100644
--- a/include/seastar/core/file.hh
+++ b/include/seastar/core/file.hh
@@ -643,7 +643,7 @@ public:
     future<temporary_buffer<CharType>>
     dma_read_bulk(uint64_t offset, size_t range_size, io_intent* intent = nullptr) noexcept {
         return dma_read_bulk_impl(offset, range_size, intent).then([] (temporary_buffer<uint8_t> t) {
-            return temporary_buffer<CharType>(reinterpret_cast<CharType*>(t.get_write()), t.size(), t.release());
+            return temporary_buffer<CharType>::maybe_unsafe_from_deleter(reinterpret_cast<CharType*>(t.get_write()), t.size(), t.release());
         });
     }
 
diff --git a/include/seastar/core/internal/cpu_profiler.hh b/include/seastar/core/internal/cpu_profiler.hh
new file mode 100644
index 00000000000..7fb369cb1f6
--- /dev/null
+++ b/include/seastar/core/internal/cpu_profiler.hh
@@ -0,0 +1,182 @@
+/*
+ * This file is open source software, licensed to you under the terms
+ * of the Apache License, Version 2.0 (the "License").  See the NOTICE file
+ * distributed with this work for additional information regarding copyright
+ * ownership.  You may not use this file except in compliance with the License.
+ *
+ * You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+/*
+ * Copyright (C) 2023 ScyllaDB
+ */
+
+#pragma once
+
+#include <seastar/util/backtrace.hh>
+#include <seastar/core/circular_buffer_fixed_capacity.hh>
+#include <seastar/core/internal/signal_mutex.hh>
+#include <seastar/core/internal/timers.hh>
+#include <seastar/core/scheduling.hh>
+
+#include <boost/container/static_vector.hpp>
+
+#include <chrono>
+#include <csignal>
+#include <cstdint>
+#include <ctime>
+#include <atomic>
+#include <optional>
+
+namespace seastar {
+
+class reactor;
+
+struct cpu_profiler_trace {
+    using kernel_trace_vec = boost::container::static_vector<uintptr_t, 64>;
+    simple_backtrace user_backtrace;
+    kernel_trace_vec kernel_backtrace;
+    // The scheduling group active at the time the sample was taken. Note that
+    // non-task reactor work (such as polling) ends up in the default
+    // scheduling group (with name "main").
+    scheduling_group sg;
+};
+
+constexpr size_t max_number_of_traces = 128;
+
+namespace internal {
+
+// Temporarily enable/disable the CPU profiler from taking stacktraces on this thread,
+// but don't disable the profiler completely. This can be used to disable the profiler
+// for cases when taking a backtrace isn't valid (e.g. JIT generated code).
+void profiler_drop_stacktraces(bool) noexcept;
+
+// A small RAII object to disable profiling temporarily
+//
+// This is not reentrant.
+class scoped_disable_profile_temporarily {
+public:
+    scoped_disable_profile_temporarily() noexcept {
+        profiler_drop_stacktraces(true);
+    }
+    ~scoped_disable_profile_temporarily() noexcept {
+        profiler_drop_stacktraces(false);
+    }
+};
+
+struct cpu_profiler_config {
+    bool enabled;
+    std::chrono::nanoseconds period;
+};
+
+struct cpu_profiler_stats {
+    unsigned dropped_samples_from_manual_disablement{0};
+    unsigned dropped_samples_from_exceptions{0};
+    unsigned dropped_samples_from_buffer_full{0};
+    unsigned dropped_samples_from_mutex_contention{0};
+
+    void clear_dropped() {
+        dropped_samples_from_manual_disablement = 0;
+        dropped_samples_from_exceptions = 0;
+        dropped_samples_from_buffer_full = 0;
+        dropped_samples_from_mutex_contention = 0;
+    }
+
+    unsigned sum_dropped() const {
+        return dropped_samples_from_manual_disablement
+            + dropped_samples_from_buffer_full
+            + dropped_samples_from_exceptions
+            + dropped_samples_from_mutex_contention;
+    }
+};
+
+class cpu_profiler {
+private:
+    circular_buffer_fixed_capacity<cpu_profiler_trace, max_number_of_traces> _traces;
+    // The operations in `_traces` are not reentrant. Therefore a mutex is used to ensure
+    // that an interrupt cannot access `_traces` if the interrupted thread was already
+    // accessing it.
+    signal_mutex _traces_mutex;
+    cpu_profiler_config _cfg;
+    std::chrono::nanoseconds _last_set_timeout{}; // value-initialized: the constructor does not set it
+    cpu_profiler_stats _stats;
+    bool _is_stopped{true};
+
+
+    bool is_enabled() const;
+    std::chrono::nanoseconds period() const;
+    std::chrono::nanoseconds get_next_timeout();
+
+protected:
+    friend reactor;
+
+public:
+    static int signal_number() { return SIGRTMIN + 2; }
+
+    cpu_profiler(cpu_profiler_config cfg) : _cfg(cfg) {}
+
+    // Allows for the sampling period of the profiler to be adjusted
+    // and the profiler to be enabled and disabled.
+    void update_config(cpu_profiler_config cfg);
+    // Stops the profiler if running and prevents it from starting until
+    // `start()` is explicitly called.
+    void stop();
+    // Allows the profiler to run when it's enabled via the `cpu_profiler_config`.
+    void start();
+    void on_signal();
+    size_t results(std::vector<cpu_profiler_trace>& results_buffer);
+
+    virtual ~cpu_profiler() = default;
+    virtual void arm_timer(std::chrono::nanoseconds) = 0;
+    virtual void disarm_timer() = 0;
+    virtual bool is_spurious_signal() { return false; }
+    virtual std::optional<linux_perf_event::kernel_backtrace>
+    try_get_kernel_backtrace() { return std::nullopt; }
+};
+
+class cpu_profiler_posix_timer : public cpu_profiler {
+    posix_timer _timer;
+public:
+    cpu_profiler_posix_timer(cpu_profiler_config cfg)
+            : cpu_profiler(cfg)
+            // CLOCK_MONOTONIC is used here in place of CLOCK_THREAD_CPUTIME_ID.
+            // This is since for intervals of ~5ms or less CLOCK_THREAD_CPUTIME_ID
+            // fires 200-600% after its configured time. Therefore it is not granular
+            // enough for cases where the reactor is configured to sleep when idle and
+            // is only active for short intervals. CLOCK_MONOTONIC doesn't suffer from
+            // this issue.
+            , _timer({signal_number()}, CLOCK_MONOTONIC) {}
+
+    virtual ~cpu_profiler_posix_timer() override = default;
+    virtual void arm_timer(std::chrono::nanoseconds) override;
+    virtual void disarm_timer() override;
+};
+
+class cpu_profiler_linux_perf_event : public cpu_profiler {
+    linux_perf_event _perf_event;
+public:
+    static std::unique_ptr<cpu_profiler_linux_perf_event> try_make(cpu_profiler_config);
+    cpu_profiler_linux_perf_event(linux_perf_event perf_event, cpu_profiler_config cfg)
+            : cpu_profiler(cfg)
+            , _perf_event(std::move(perf_event)) {}
+
+    virtual ~cpu_profiler_linux_perf_event() override = default;
+    virtual void arm_timer(std::chrono::nanoseconds) override;
+    virtual void disarm_timer() override;
+    virtual bool is_spurious_signal() override;
+    virtual std::optional<linux_perf_event::kernel_backtrace>
+    try_get_kernel_backtrace() override;
+};
+
+std::unique_ptr<cpu_profiler> make_cpu_profiler(cpu_profiler_config cfg = {false, std::chrono::milliseconds(100)});
+
+}
+}
diff --git a/include/seastar/core/internal/signal_mutex.hh b/include/seastar/core/internal/signal_mutex.hh
new file mode 100644
index 00000000000..e48841cc772
--- /dev/null
+++ b/include/seastar/core/internal/signal_mutex.hh
@@ -0,0 +1,52 @@
+/*
+ * This file is open source software, licensed to you under the terms
+ * of the Apache License, Version 2.0 (the "License").  See the NOTICE file
+ * distributed with this work for additional information regarding copyright
+ * ownership.  You may not use this file except in compliance with the License.
+ *
+ * You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+/*
+ * Copyright (C) 2025 ScyllaDB
+ */
+
+#pragma once
+
+#include <atomic>
+#include <optional>
+
+namespace seastar::internal {
+
+/// A lightweight mutex designed to work with interrupts
+/// utilizing only compiler barriers.
+class signal_mutex {
+public:
+    class guard {
+    private:
+        signal_mutex* _mutex;
+        guard(signal_mutex* m) : _mutex(m) {}
+        friend class signal_mutex;
+    public:
+        guard(guard&& o) noexcept : _mutex(o._mutex) { o._mutex = nullptr; } // source guard gives up its mutex pointer
+        ~guard();
+    };
+
+    // Returns a `guard` if the lock was acquired.
+    // Otherwise returns a nullopt.
+    std::optional<guard> try_lock();
+
+private:
+    friend class guard;
+    std::atomic_bool _mutex{false}; // explicit initial state; presumably false == unlocked (confirm in signal_mutex.cc)
+};
+
+} // namespace seastar::internal
diff --git a/include/seastar/core/internal/stall_detector.hh b/include/seastar/core/internal/stall_detector.hh
index cdee5b825fa..f65ab9eb96e 100644
--- a/include/seastar/core/internal/stall_detector.hh
+++ b/include/seastar/core/internal/stall_detector.hh
@@ -32,6 +32,7 @@
 #include <seastar/core/posix.hh>
 #include <seastar/core/metrics_registration.hh>
 #include <seastar/core/scheduling.hh>
+#include <seastar/core/internal/timers.hh>
 
 namespace seastar {
 
@@ -94,85 +95,25 @@ public:
 };
 
 class cpu_stall_detector_posix_timer : public cpu_stall_detector {
-    timer_t _timer;
+    posix_timer _timer;
 public:
     explicit cpu_stall_detector_posix_timer(cpu_stall_detector_config cfg = {});
-    virtual ~cpu_stall_detector_posix_timer() override;
+    virtual ~cpu_stall_detector_posix_timer() override = default;
 private:
     virtual void arm_timer() override;
     virtual void start_sleep() override;
 };
 
 class cpu_stall_detector_linux_perf_event : public cpu_stall_detector {
-    file_desc _fd;
-    bool _enabled = false;
-    uint64_t _current_period = 0;
-    struct ::perf_event_mmap_page* _mmap;
-    char* _data_area;
-    size_t _data_area_mask;
-    // after the detector has been armed (i.e., _enabled is true), this
-    // is the moment at or after which the next signal is expected to occur
-    // and can be used for detecting spurious signals
-    sched_clock::time_point _next_signal_time{};
-private:
-    class data_area_reader {
-        cpu_stall_detector_linux_perf_event& _p;
-        const char* _data_area;
-        size_t _data_area_mask;
-        uint64_t _head;
-        uint64_t _tail;
-    public:
-        explicit data_area_reader(cpu_stall_detector_linux_perf_event& p)
-                : _p(p)
-                , _data_area(p._data_area)
-                , _data_area_mask(p._data_area_mask) {
-            _head = _p._mmap->data_head;
-            _tail = _p._mmap->data_tail;
-            std::atomic_thread_fence(std::memory_order_acquire); // required after reading data_head
-        }
-        ~data_area_reader() {
-            std::atomic_thread_fence(std::memory_order_release); // not documented, but probably required before writing data_tail
-            _p._mmap->data_tail = _tail;
-        }
-        uint64_t read_u64() {
-            uint64_t ret;
-            // We cannot wrap around if the 8-byte unit is aligned
-            std::copy_n(_data_area + (_tail & _data_area_mask), 8, reinterpret_cast<char*>(&ret));
-            _tail += 8;
-            return ret;
-        }
-        template <typename S>
-        S read_struct() {
-            static_assert(sizeof(S) % 8 == 0);
-            S ret;
-            char* p = reinterpret_cast<char*>(&ret);
-            for (size_t i = 0; i != sizeof(S); i += 8) {
-                uint64_t w = read_u64();
-                std::copy_n(reinterpret_cast<const char*>(&w), 8, p + i);
-            }
-            return ret;
-        }
-        void skip(uint64_t bytes_to_skip) {
-            _tail += bytes_to_skip;
-        }
-        // skip all the remaining data in the buffer, as-if calling read until
-        // have_data returns false (but much faster)
-        void skip_all() {
-            _tail = _head;
-        }
-        bool have_data() const {
-            return _head != _tail;
-        }
-    };
-
-    virtual void maybe_report_kernel_trace(backtrace_buffer& buf) override;
+    linux_perf_event _perf_event;
 public:
     static std::unique_ptr<cpu_stall_detector_linux_perf_event> try_make(cpu_stall_detector_config cfg = {});
-    explicit cpu_stall_detector_linux_perf_event(file_desc fd, cpu_stall_detector_config cfg = {});
-    ~cpu_stall_detector_linux_perf_event();
+    explicit cpu_stall_detector_linux_perf_event(linux_perf_event perf_event, cpu_stall_detector_config cfg = {});
+    virtual ~cpu_stall_detector_linux_perf_event() override = default;
     virtual void arm_timer() override;
     virtual void start_sleep() override;
     virtual bool is_spurious_signal() override;
+    virtual void maybe_report_kernel_trace(backtrace_buffer& buf) override;
 };
 
 std::unique_ptr<cpu_stall_detector> make_cpu_stall_detector(cpu_stall_detector_config cfg = {});
diff --git a/include/seastar/core/internal/timers.hh b/include/seastar/core/internal/timers.hh
new file mode 100644
index 00000000000..ec4995bfe34
--- /dev/null
+++ b/include/seastar/core/internal/timers.hh
@@ -0,0 +1,146 @@
+/*
+ * This file is open source software, licensed to you under the terms
+ * of the Apache License, Version 2.0 (the "License").  See the NOTICE file
+ * distributed with this work for additional information regarding copyright
+ * ownership.  You may not use this file except in compliance with the License.
+ *
+ * You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+/*
+ * Copyright (C) 2023 ScyllaDB
+ */
+
+#pragma once
+
+#ifndef SEASTAR_MODULE
+#include <atomic>
+#include <chrono>
+#include <cstdint>
+#include <optional>
+#include <functional>
+
+#include <linux/perf_event.h>
+#endif
+
+#include <seastar/core/posix.hh>
+#include <seastar/core/scheduling.hh>
+
+namespace seastar {
+namespace internal {
+
+struct timer_cfg {
+    int signal_number;
+};
+
+class posix_timer {
+    timer_t _timer;
+public:
+    explicit posix_timer(timer_cfg cfg, clockid_t clock_id = CLOCK_THREAD_CPUTIME_ID);
+    virtual ~posix_timer();
+    void arm_timer(std::chrono::nanoseconds);
+    void disarm_timer();
+};
+
+class linux_perf_event {
+    file_desc _fd;
+    bool _enabled = false;
+    uint64_t _current_period = 0;
+    struct ::perf_event_mmap_page* _mmap;
+    char* _data_area;
+    size_t _data_area_mask;
+    // after the detector has been armed (i.e., _enabled is true), this
+    // is the moment at or after which the next signal is expected to occur
+    // and can be used for detecting spurious signals
+    sched_clock::time_point _next_signal_time{};
+private:
+    class data_area_reader {
+        std::reference_wrapper<linux_perf_event> _p;
+        const char* _data_area;
+        size_t _data_area_mask;
+        uint64_t _head;
+        uint64_t _tail;
+    public:
+        explicit data_area_reader(linux_perf_event& p)
+                : _p(p)
+                , _data_area(p._data_area)
+                , _data_area_mask(p._data_area_mask) {
+            _head = _p.get()._mmap->data_head;
+            _tail = _p.get()._mmap->data_tail;
+            std::atomic_thread_fence(std::memory_order_acquire); // required after reading data_head
+        }
+        data_area_reader(data_area_reader&& o)
+                : _p(o._p)
+                , _data_area(o._data_area)
+                , _data_area_mask(o._data_area_mask)
+                , _head(o._head)
+                , _tail(o._tail) {
+            o._data_area = nullptr;
+        }
+        ~data_area_reader() {
+            if(_data_area != nullptr) {
+                std::atomic_thread_fence(std::memory_order_release); // not documented, but probably required before writing data_tail
+                _p.get()._mmap->data_tail = _tail;
+            }
+        }
+        uint64_t read_u64() {
+
+            uint64_t ret;
+            // We cannot wrap around if the 8-byte unit is aligned
+            std::copy_n(_data_area + (_tail & _data_area_mask), 8, reinterpret_cast<char*>(&ret));
+            _tail += 8;
+            return ret;
+        }
+        template <typename S>
+        S read_struct() {
+            static_assert(sizeof(S) % 8 == 0);
+            S ret;
+            char* p = reinterpret_cast<char*>(&ret);
+            for (size_t i = 0; i != sizeof(S); i += 8) {
+                uint64_t w = read_u64();
+                std::copy_n(reinterpret_cast<const char*>(&w), 8, p + i);
+            }
+            return ret;
+        }
+        void skip(uint64_t bytes_to_skip) {
+            _tail += bytes_to_skip;
+        }
+        // skip all the remaining data in the buffer, as-if calling read until
+        // have_data returns false (but much faster)
+        void skip_all() {
+            _tail = _head;
+        }
+        bool have_data() const {
+            return _head != _tail;
+        }
+    };
+
+    explicit linux_perf_event(file_desc fd);
+public:
+
+    class kernel_backtrace {
+        data_area_reader _reader;
+    public:
+        kernel_backtrace(data_area_reader reader) : _reader(std::move(reader)) {}
+        void read_backtrace(std::function<void(uintptr_t)>);
+    };
+
+    linux_perf_event(linux_perf_event&&);
+    static linux_perf_event try_make(timer_cfg cfg);
+    ~linux_perf_event();
+    void arm_timer(std::chrono::nanoseconds);
+    void disarm_timer();
+    bool is_spurious_signal();
+    std::optional<kernel_backtrace> try_get_kernel_backtrace();
+};
+
+}
+}
diff --git a/include/seastar/core/io_queue.hh b/include/seastar/core/io_queue.hh
index 69411e901f4..d07db79feb4 100644
--- a/include/seastar/core/io_queue.hh
+++ b/include/seastar/core/io_queue.hh
@@ -23,6 +23,7 @@
 
 #include <boost/container/static_vector.hpp>
 #include <chrono>
+#include <limits>
 #include <memory>
 #include <vector>
 #include <sys/uio.h>
@@ -192,6 +193,13 @@ public:
         std::chrono::milliseconds stall_threshold = std::chrono::milliseconds(100);
         std::chrono::microseconds tau = std::chrono::milliseconds(5);
         std::optional<uint32_t> physical_block_size; // Override for disks that lie about their physical block size
+
+        // Original values of io-properties (if available)
+        size_t read_bytes_rate = std::numeric_limits<size_t>::max();
+        size_t write_bytes_rate = std::numeric_limits<size_t>::max();
+        size_t read_req_rate = std::numeric_limits<size_t>::max();
+        size_t write_req_rate = std::numeric_limits<size_t>::max();
+        bool max_cost_function = true;
     };
 
     io_queue(io_group_ptr group, internal::io_sink& sink);
diff --git a/include/seastar/core/memory.hh b/include/seastar/core/memory.hh
index 05c66bcce7e..e2762464a0a 100644
--- a/include/seastar/core/memory.hh
+++ b/include/seastar/core/memory.hh
@@ -184,6 +184,17 @@ public:
     }
 };
 
+// Within the scope of this object, the allocator will not abort (when it
+// would normally do so, i.e., when abort_on_allocation_failure is true),
+// but rather fall back to the system allocator.
+struct scoped_system_alloc_fallback {
+    scoped_system_alloc_fallback() noexcept;
+    ~scoped_system_alloc_fallback() noexcept;
+
+    scoped_system_alloc_fallback(const scoped_system_alloc_fallback&) = delete;
+    scoped_system_alloc_fallback& operator=(const scoped_system_alloc_fallback&) = delete;
+};
+
 // Disables heap profiling as long as this object is alive.
 // Can be nested, in which case the profiling is re-enabled when all
 // the objects go out of scope.
@@ -300,6 +311,7 @@ class statistics {
     uint64_t _reclaims;
     uint64_t _large_allocs;
     uint64_t _failed_allocs;
+    uint64_t _fallback_allocs;
 
     uint64_t _foreign_mallocs;
     uint64_t _foreign_frees;
@@ -307,11 +319,11 @@ class statistics {
 private:
     statistics(uint64_t mallocs, uint64_t frees, uint64_t cross_cpu_frees,
             uint64_t total_memory, uint64_t free_memory, uint64_t total_bytes_allocated, uint64_t reclaims,
-            uint64_t large_allocs, uint64_t failed_allocs,
+            uint64_t large_allocs, uint64_t failed_allocs, uint64_t fallback_allocs,
             uint64_t foreign_mallocs, uint64_t foreign_frees, uint64_t foreign_cross_frees)
         : _mallocs(mallocs), _frees(frees), _cross_cpu_frees(cross_cpu_frees)
         , _total_memory(total_memory), _free_memory(free_memory), _total_bytes_allocated(total_bytes_allocated), _reclaims(reclaims)
-        , _large_allocs(large_allocs), _failed_allocs(failed_allocs)
+        , _large_allocs(large_allocs), _failed_allocs(failed_allocs), _fallback_allocs(fallback_allocs)
         , _foreign_mallocs(foreign_mallocs), _foreign_frees(foreign_frees)
         , _foreign_cross_frees(foreign_cross_frees) {}
 public:
@@ -337,13 +349,18 @@ public:
     /// Number of allocations which violated the large allocation threshold
     uint64_t large_allocations() const { return _large_allocs; }
     /// Number of allocations which failed, i.e., where the required memory could not be obtained
-    /// even after reclaim was attempted
+    /// even after reclaim was attempted and which did not fall back (see fallback_allocations())
     uint64_t failed_allocations() const { return _failed_allocs; }
-    /// Number of foreign allocations
+    /// Number of allocations which fell back to the system allocator, i.e., because they were
+    /// in a fallback allocation scope. These are not counted in failed_allocations.
+    uint64_t fallback_allocations() const { return _fallback_allocs; }
+    /// Number of foreign allocations, which are all allocations which use the system allocator.
+    /// These include allocations on alien threads, allocations (even on reactor threads) before
+    /// the allocator is initialized and allocations in a fallback allocation scope.
     uint64_t foreign_mallocs() const { return _foreign_mallocs; }
-    /// Number of foreign frees
+    /// Number of foreign frees (frees of non-seastar-heap pointers) on alien threads
     uint64_t foreign_frees() const { return _foreign_frees; }
-    /// Number of foreign frees on reactor threads
+    /// Number of foreign frees (frees of non-seastar-heap pointers) on reactor threads
     uint64_t foreign_cross_frees() const { return _foreign_cross_frees; }
     friend statistics stats();
 };
diff --git a/include/seastar/core/metrics.hh b/include/seastar/core/metrics.hh
index cd3c5749c5c..ba25db36a52 100644
--- a/include/seastar/core/metrics.hh
+++ b/include/seastar/core/metrics.hh
@@ -435,6 +435,7 @@ public:
     virtual metric_groups_def& add_metric(group_name_type name, const metric_definition& md) = 0;
     virtual metric_groups_def& add_group(group_name_type name, const std::initializer_list<metric_definition>& l) = 0;
     virtual metric_groups_def& add_group(group_name_type name, const std::vector<metric_definition>& l) = 0;
+    virtual int get_handle() const = 0;
 };
 
 escaped_string shard();
@@ -649,6 +650,13 @@ impl::metric_definition_impl make_total_operations(metric_name_type name,
     return make_counter(name, std::forward<T>(val), d, labels).set_type("total_operations");
 }
 
+/*!
+ * \brief Update the aggregation labels of a metric family
+ */
+void update_aggregate_labels(const group_name_type& group_name,
+                             const metric_name_type& metric_name,
+                             const std::vector<label>& aggregate_labels);
+
 /*! @} */
 }
 }
diff --git a/include/seastar/core/metrics_api.hh b/include/seastar/core/metrics_api.hh
index e47fc035c80..2ef073438c7 100644
--- a/include/seastar/core/metrics_api.hh
+++ b/include/seastar/core/metrics_api.hh
@@ -41,6 +41,9 @@ namespace impl {
 
 using internalized_labels_ref = lw_shared_ptr<const labels_type>;
 
+
+int default_handle();
+
 }
 }
 }
@@ -230,6 +233,8 @@ inline bool operator<(const internalized_holder& lhs, const internalized_holder&
 
 
 class impl;
+using metric_implementations = std::unordered_map<int, ::seastar::shared_ptr<impl>>;
+metric_implementations& get_metric_implementations();
 
 class registered_metric final {
     metric_info _info;
@@ -250,6 +255,11 @@ public:
     void set_skip_when_empty(skip_when_empty skip) noexcept {
         _info.should_skip_when_empty = skip;
     }
+
+    skip_when_empty get_skip_when_empty() const {
+        return _info.should_skip_when_empty;
+    }
+
     const metric_id& get_id() const {
         return _info.id;
     }
@@ -270,16 +280,18 @@ using metric_instances = std::map<internalized_holder, register_ref, std::less<>
 using metrics_registration = std::vector<register_ref>;
 
 class metric_groups_impl : public metric_groups_def {
+    int _handle;
     metrics_registration _registration;
     shared_ptr<impl> _impl; // keep impl alive while metrics are registered
 public:
-    metric_groups_impl();
+    explicit metric_groups_impl(int handle = default_handle());
     ~metric_groups_impl();
     metric_groups_impl(const metric_groups_impl&) = delete;
     metric_groups_impl(metric_groups_impl&&) = default;
     metric_groups_impl& add_metric(group_name_type name, const metric_definition& md);
     metric_groups_impl& add_group(group_name_type name, const std::initializer_list<metric_definition>& l);
     metric_groups_impl& add_group(group_name_type name, const std::vector<metric_definition>& l);
+    int get_handle() const;
 };
 
 class metric_family {
@@ -451,6 +463,7 @@ class impl {
     std::vector<relabel_config> _relabel_configs;
     std::vector<metric_family_config> _metric_family_configs;
     internalized_set _internalized_labels;
+    std::unordered_multimap<seastar::sstring, int> _metric_families_to_replicate;
 public:
     value_map& get_value_map() {
         return _value_map;
@@ -462,6 +475,7 @@ public:
 
     register_ref add_registration(const metric_id& id, const metric_type& type, metric_function f, const description& d, bool enabled, skip_when_empty skip, const std::vector<std::string>& aggregate_labels);
     internalized_labels_ref internalize_labels(labels_type labels);
+    void update_aggregate_labels(const metric_id& id, const std::vector<label>& aggregate_labels);
     void remove_registration(const metric_id& id);
     future<> stop() {
         return make_ready_future<>();
@@ -492,6 +506,7 @@ public:
     const std::vector<relabel_config>& get_relabel_configs() const noexcept {
         return _relabel_configs;
     }
+
     const std::vector<metric_family_config>& get_metric_family_configs() const noexcept {
         return _metric_family_configs;
     }
@@ -500,19 +515,49 @@ public:
 
     void update_aggregate(metric_family_info& mf) const noexcept;
 
+    // Set the metrics families to be replicated from this metrics::impl.
+    // All metrics families that match one of the keys of
+    // the 'metric_families_to_replicate' argument will be replicated
+    // on the metrics::impl identified by the corresponding value.
+    //
+    // If this function was called previously, any previously
+    // replicated metrics will be removed before the provided ones are
+    // replicated.
+    //
+    // Metric replication spans the full life cycle of this class.
+    // Newly registered metrics that belong to a replicated family
+    // will be replicated too, and unregistering a replicated metric will
+    // unregister the replica.
+    void set_metric_families_to_replicate(
+            std::unordered_multimap<seastar::sstring, int> metric_families_to_replicate);
+
 private:
     void gc_internalized_labels();
     bool apply_relabeling(const relabel_config& rc, metric_info& info);
+    void replicate_metric_family(const seastar::sstring& name,
+                                 int destination_handle) const;
+    void replicate_metric_if_required(const shared_ptr<registered_metric>& metric) const;
+    void replicate_metric(const shared_ptr<registered_metric>& metric,
+                          const metric_family& family,
+                          const shared_ptr<impl>& destination,
+                          int destination_handle) const;
+
+    void remove_metric_replica_family(const seastar::sstring& name,
+                                      int destination_handle) const;
+    void remove_metric_replica(const metric_id& id,
+                               const shared_ptr<impl>& destination) const;
+    void remove_metric_replica_if_required(const metric_id& id) const;
 };
 
-const value_map& get_value_map();
+const value_map& get_value_map(int handle = default_handle());
 using values_reference = shared_ptr<values_copy>;
 
-foreign_ptr<values_reference> get_values();
+foreign_ptr<values_reference> get_values(int handle = default_handle());
+
+shared_ptr<impl> get_local_impl(int handle = default_handle());
 
-shared_ptr<impl> get_local_impl();
 
-void unregister_metric(const metric_id & id);
+void unregister_metric(const metric_id & id, int handle = default_handle());
 
 /*!
  * \brief initialize metric group
@@ -520,7 +565,7 @@ void unregister_metric(const metric_id & id);
  * Create a metric_group_def.
  * No need to use it directly.
  */
-std::unique_ptr<metric_groups_def> create_metric_groups();
+std::unique_ptr<metric_groups_def> create_metric_groups(int handle = default_handle());
 
 }
 
@@ -537,7 +582,7 @@ struct options : public program_options::option_group {
 /*!
  * \brief set the metrics configuration
  */
-future<> configure(const options& opts);
+future<> configure(const options& opts, int handle = default_handle());
 
 /*!
  * \brief Perform relabeling and operation on metrics dynamically.
@@ -615,5 +660,12 @@ void set_metric_family_configs(const std::vector<metric_family_config>& metrics_
  * This function returns a vector of the current metrics family config
  */
 const std::vector<metric_family_config>& get_metric_family_configs();
+
+/*!
+ * \brief replicate metric families across internal metrics implementations
+ */
+future<>
+replicate_metric_families(int source_handle, std::unordered_multimap<seastar::sstring, int> metric_families_to_replicate);
+
 }
 }
diff --git a/include/seastar/core/metrics_registration.hh b/include/seastar/core/metrics_registration.hh
index 52ef7a30e35..4324492adfc 100644
--- a/include/seastar/core/metrics_registration.hh
+++ b/include/seastar/core/metrics_registration.hh
@@ -51,13 +51,17 @@ namespace seastar {
 namespace metrics {
 
 namespace impl {
+int default_handle();
 class metric_groups_def;
 struct metric_definition_impl;
 class metric_groups_impl;
 }
 
 
+int default_handle();
+
 using group_name_type = sstring; /*!< A group of logically related metrics */
+using metric_name_type = sstring; /*!< A single metric name */
 class metric_groups;
 
 class metric_definition {
@@ -90,7 +94,7 @@ public:
 class metric_groups {
     std::unique_ptr<impl::metric_groups_def> _impl;
 public:
-    metric_groups() noexcept;
+    explicit metric_groups(int handle = default_handle()) noexcept;
     metric_groups(metric_groups&&) = default;
     virtual ~metric_groups();
     metric_groups& operator=(metric_groups&&) = default;
@@ -99,7 +103,7 @@ public:
      *
      * combine the constructor with the add_group functionality.
      */
-    metric_groups(std::initializer_list<metric_group_definition> mg);
+    metric_groups(std::initializer_list<metric_group_definition> mg, int handle = default_handle());
 
     /*!
      * \brief Add metrics belonging to the same group.
@@ -155,7 +159,7 @@ public:
  */
 class metric_group : public metric_groups {
 public:
-    metric_group() noexcept;
+    explicit metric_group(int handle = default_handle()) noexcept;
     metric_group(const metric_group&) = delete;
     metric_group(metric_group&&) = default;
     virtual ~metric_group();
@@ -166,7 +170,7 @@ public:
      *
      *
      */
-    metric_group(const group_name_type& name, std::initializer_list<metric_definition> l);
+    metric_group(const group_name_type& name, std::initializer_list<metric_definition> l, int handle = default_handle());
 };
 
 
diff --git a/include/seastar/core/polymorphic_temporary_buffer.hh b/include/seastar/core/polymorphic_temporary_buffer.hh
index 7fe09625ae4..8c1d1a71c59 100644
--- a/include/seastar/core/polymorphic_temporary_buffer.hh
+++ b/include/seastar/core/polymorphic_temporary_buffer.hh
@@ -37,7 +37,7 @@ temporary_buffer<CharType> make_temporary_buffer(std::pmr::polymorphic_allocator
         return temporary_buffer<CharType>(size);
     }
     CharType *buffer = allocator->allocate(size);
-    return temporary_buffer<CharType>(buffer, size,
+    return temporary_buffer<CharType>::maybe_unsafe_from_deleter(buffer, size,
         make_deleter(deleter(), [allocator, buffer, size] () mutable { allocator->deallocate(buffer, size); }));
 }
 
diff --git a/include/seastar/core/prometheus.hh b/include/seastar/core/prometheus.hh
index 6144daa87c1..f9e225ce723 100644
--- a/include/seastar/core/prometheus.hh
+++ b/include/seastar/core/prometheus.hh
@@ -55,12 +55,15 @@ struct config {
     std::optional<metrics::label_instance> label; //!< A label that will be added to all metrics, we advice not to use it and set it on the prometheus server
     sstring prefix = "seastar"; //!< a prefix that will be added to metric names
     bool allow_protobuf = false; // protobuf support is experimental and off by default
+    int handle = metrics::default_handle(); //!< Handle that specifies which metric implementation to query
+    sstring route = "/metrics"; //!< Name of the route on which to expose the metrics
 };
 
 future<> start(httpd::http_server_control& http_server, config ctx);
 
-/// \defgroup add_prometheus_routes adds a /metrics endpoint that returns prometheus metrics
-///    both in txt format and in protobuf according to the prometheus spec
+/// \defgroup add_prometheus_routes adds a specified endpoint (defaults to /metrics) that returns prometheus metrics
+///    in txt format and in protobuf according to the prometheus spec
+
 /// @{
 future<> add_prometheus_routes(sharded<httpd::http_server>& server, config ctx);
 future<> add_prometheus_routes(httpd::http_server& server, config ctx);
diff --git a/include/seastar/core/reactor.hh b/include/seastar/core/reactor.hh
index 721c496f2c2..323241f8c78 100644
--- a/include/seastar/core/reactor.hh
+++ b/include/seastar/core/reactor.hh
@@ -111,11 +111,13 @@ class reactor_backend_selector;
 
 class reactor_backend;
 struct pollfn;
+struct cpu_profiler_trace;
 
 namespace internal {
 
 class reactor_stall_sampler;
 class cpu_stall_detector;
+class cpu_profiler;
 class buffer_allocator;
 class priority_class;
 class poller;
@@ -253,6 +255,7 @@ private:
     uint64_t _polls = 0;
     metrics::internal::time_estimated_histogram _stalls_histogram;
     std::unique_ptr<internal::cpu_stall_detector> _cpu_stall_detector;
+    std::unique_ptr<internal::cpu_profiler> _cpu_profiler;
 
     timer<>::set_t _timers;
     timer<>::set_t::timer_list_t _expired_timers;
@@ -766,6 +769,21 @@ public:
     void update_blocked_reactor_notify_ms(std::chrono::milliseconds ms);
     std::chrono::milliseconds get_blocked_reactor_notify_ms() const;
 
+    bool get_cpu_profiler_enabled();
+    void set_cpu_profiler_enabled(bool);
+    std::chrono::nanoseconds get_cpu_profiler_period();
+    void set_cpu_profiler_period(std::chrono::nanoseconds);
+    /// Copies all profiler samples that were collected since the function
+    /// was last called into `results_buffer`.
+    ///
+    /// Returns the number of samples that had to be dropped since the function
+    /// was last called due to a full internal buffer.
+    ///
+    /// Note: All existing data in `results_buffer` will be overwritten. And if
+    /// `results_buffer` does not have enough capacity to hold all samples, its
+    /// capacity will be increased internally. The capacity is never shrunk though.
+    size_t profiler_results(std::vector<cpu_profiler_trace>& results_buffer);
+
     class test {
     public:
         static void with_allow_abandoned_failed_futures(unsigned count, noncopyable_function<void ()> func);
diff --git a/include/seastar/core/reactor_config.hh b/include/seastar/core/reactor_config.hh
index 5664367d6a7..2f7e594e152 100644
--- a/include/seastar/core/reactor_config.hh
+++ b/include/seastar/core/reactor_config.hh
@@ -54,8 +54,13 @@ class network_stack_factory;
 struct reactor_options : public program_options::option_group {
     /// \brief Select cryptographic provider backend.
     ///
-    /// Available providers:
-    /// * gnutls (default)
+    /// In dual-backend builds (\c SEASTAR_TLS_DUAL_BACKEND), accepts:
+    /// * gnutls
+    /// * openssl
+    ///
+    /// In single-backend builds the only valid value is the backend that was
+    /// compiled in; the option is kept for CLI compatibility but is otherwise
+    /// a no-op (the provider is a compile-time-fixed static singleton).
     program_options::selection_value<crypto_provider_factory> crypto_provider;
     /// \brief Select network stack to use.
     ///
@@ -115,6 +120,14 @@ struct reactor_options : public program_options::option_group {
     ///
     /// Default: \p true.
     program_options::value<bool> blocked_reactor_report_format_oneline;
+    /// \brief The sample period for the reactor profiler, in milliseconds.
+    ///
+    /// Default 100.
+    program_options::value<unsigned> profiler_sample_period_ms;
+    /// \brief Optionally enable the profiler.
+    ///
+    /// Default false.
+    program_options::value<bool> profiler_enabled;
     /// \brief Allow using buffered I/O if DMA is not available (reduces performance).
     program_options::value<> relaxed_dma;
     /// \brief Use the Linux NOWAIT AIO feature, which reduces reactor stalls due
diff --git a/include/seastar/core/scheduling.hh b/include/seastar/core/scheduling.hh
index b5d76d537e1..85413c9ecc9 100644
--- a/include/seastar/core/scheduling.hh
+++ b/include/seastar/core/scheduling.hh
@@ -426,6 +426,13 @@ public:
     friend unsigned internal::scheduling_group_index(scheduling_group sg) noexcept;
     friend scheduling_group internal::scheduling_group_from_index(unsigned index) noexcept;
 
+    struct stats {
+        sched_clock::duration runtime;
+        sched_clock::duration waittime;
+        sched_clock::duration starvetime;
+    };
+    stats get_stats() const noexcept;
+
     template<typename SpecificValType, typename Mapper, typename Reducer, typename Initial>
     requires requires(SpecificValType specific_val, Mapper mapper, Reducer reducer, Initial initial) {
         {reducer(initial, mapper(specific_val))} -> std::convertible_to<Initial>;
diff --git a/include/seastar/core/scollectd.hh b/include/seastar/core/scollectd.hh
index cab55657f8b..ce1d283c99a 100644
--- a/include/seastar/core/scollectd.hh
+++ b/include/seastar/core/scollectd.hh
@@ -371,7 +371,7 @@ struct options : public program_options::option_group {
     /// \endcond
 };
 
-void configure(const options&);
+void configure(const options&, int handle = seastar::metrics::default_handle());
 void remove_polled_metric(const type_instance_id &);
 
 class plugin_instance_metrics;
@@ -390,8 +390,8 @@ class plugin_instance_metrics;
  */
 struct registration {
     registration() = default;
-    registration(const type_instance_id& id);
-    registration(type_instance_id&& id);
+    registration(const type_instance_id& id, int handle = seastar::metrics::default_handle());
+    registration(type_instance_id&& id, int handle = seastar::metrics::default_handle());
     registration(const registration&) = delete;
     registration(registration&&) = default;
     ~registration();
@@ -779,8 +779,8 @@ seastar::metrics::impl::metric_id to_metrics_id(const type_instance_id & id);
  */
 template<typename Arg>
 [[deprecated("Use the metrics layer")]] static type_instance_id add_polled_metric(const type_instance_id & id, description d,
-        Arg&& arg, bool enabled = true) {
-    seastar::metrics::impl::get_local_impl()->add_registration(to_metrics_id(id), arg.type, seastar::metrics::impl::make_function(arg.value, arg.type), d, enabled);
+        Arg&& arg, bool enabled = true, int handle = seastar::metrics::default_handle()) {
+    seastar::metrics::impl::get_local_impl(handle)->add_registration(to_metrics_id(id), arg.type, seastar::metrics::impl::make_function(arg.value, arg.type), d, enabled);
     return id;
 }
 /*!
diff --git a/include/seastar/core/sstring.hh b/include/seastar/core/sstring.hh
index 3517669c971..265247e55b7 100644
--- a/include/seastar/core/sstring.hh
+++ b/include/seastar/core/sstring.hh
@@ -544,7 +544,7 @@ public:
             auto size = u.external.size;
             u.external.str = nullptr;
             u.external.size = 0;
-            return temporary_buffer<char_type>(ptr, size, make_free_deleter(ptr));
+            return temporary_buffer<char_type>::maybe_unsafe_from_deleter(ptr, size, make_free_deleter(ptr));
         } else {
             auto buf = temporary_buffer<char_type>(u.internal.size);
             std::copy(u.internal.str, u.internal.str + u.internal.size, buf.get_write());
diff --git a/include/seastar/core/temporary_buffer.hh b/include/seastar/core/temporary_buffer.hh
index 4b17f9d4f1e..4b741505693 100644
--- a/include/seastar/core/temporary_buffer.hh
+++ b/include/seastar/core/temporary_buffer.hh
@@ -36,6 +36,15 @@
 
 namespace seastar {
 
+/*
+ * The custom-deleter constructor of temporary_buffer has been made private to
+ * better ensure the safety of cross-shard sharing the temporary_buffer.
+ *
+ * The forward declarations here are to allow for some manually verified, pre-existing,
+ * code to still access the newly-private constructor.
+ */
+
+
 /// \addtogroup memory-module
 /// @{
 
@@ -95,6 +104,17 @@ public:
         x._size = 0;
     }
 
+    /// @brief Create a temporary buffer from a buffer pointer and deleter.
+    ///
+    /// In the Redpanda fork, this operation is potentially unsafe as deleters
+    /// may be invoked on _any_ thread, so a deleter must be safe to call in
+    /// this way. In seastar upstream, temporary_buffer is not safe to share
+    /// across threads, so deleters are called in a more restricted way.
+    static temporary_buffer maybe_unsafe_from_deleter(CharType* buf, size_t size, deleter&& d) noexcept {
+        return temporary_buffer(buf, size, std::move(d));
+    }
+
+private:
     /// Creates a \c temporary_buffer with a specific deleter.
     ///
     /// \param buf beginning of the buffer held by this \c temporary_buffer
@@ -103,6 +123,8 @@ public:
     ///          will be destroyed when there are no longer any users for the buffer.
     temporary_buffer(CharType* buf, size_t size, deleter d) noexcept
         : _buffer(buf), _size(size), _deleter(std::move(d)) {}
+
+public:
     /// Creates a `temporary_buffer` containing a copy of the provided data
     ///
     /// \param src  data buffer to be copied
diff --git a/include/seastar/http/exception.hh b/include/seastar/http/exception.hh
index eaef705074e..b7962492b1a 100644
--- a/include/seastar/http/exception.hh
+++ b/include/seastar/http/exception.hh
@@ -41,6 +41,16 @@ public:
             : _msg(msg), _status(status) {
     }
 
+    /**
+     * A base_exception with a content_type is specifying a full response body, whereas
+     * a base_exception with only a _status is specifying a string that may be wrapped
+     * in e.g. a json_exception.
+     */
+    base_exception(const std::string& msg, http::reply::status_type status, const std::string &content_type)
+            : _msg(msg), _status(status), _content_type(content_type) {
+    }
+
+
     virtual const char* what() const noexcept {
         return _msg.c_str();
     }
@@ -52,9 +62,14 @@ public:
     virtual const std::string& str() const {
         return _msg;
     }
+
+    virtual const std::string& content_type() const {
+        return _content_type;
+    }
 private:
     std::string _msg;
     http::reply::status_type _status;
+    std::string _content_type;
 
 };
 
@@ -63,10 +78,22 @@ private:
  */
 class redirect_exception : public base_exception {
 public:
-    redirect_exception(const std::string& url, http::reply::status_type status = http::reply::status_type::moved_permanently)
-            : base_exception("", status), url(url) {
+    redirect_exception(const std::string& url, http::reply::status_type status = http::reply::status_type::moved_permanently, const std::optional<int>& retry_after = std::nullopt)
+            : base_exception("", status), url(url), retry_after(retry_after) {
+    }
+
+    http::reply to_reply() const {
+        http::reply reply{};
+        reply.add_header("Location", url);
+        if (retry_after.has_value()) {
+            reply.add_header("Retry-After", std::to_string(retry_after.value()));
+        }
+        reply.set_status(status());
+        return reply;
     }
+
     std::string url;
+    std::optional<int> retry_after;
 };
 
 /**
diff --git a/include/seastar/http/httpd.hh b/include/seastar/http/httpd.hh
index 181392dd4f1..2f572a25640 100644
--- a/include/seastar/http/httpd.hh
+++ b/include/seastar/http/httpd.hh
@@ -72,29 +72,32 @@ class connection : public boost::intrusive::list_base_hook<> {
     queue<std::unique_ptr<http::reply>> _replies { 10 };
     bool _done = false;
     const bool _tls;
+    int _listener_idx;
 public:
-    [[deprecated("use connection(http_server&, connected_socket&&, bool tls)")]]
-    connection(http_server& server, connected_socket&& fd, socket_address, bool tls)
-            : connection(server, std::move(fd), tls) {}
-    connection(http_server& server, connected_socket&& fd, bool tls)
+    [[deprecated("use connection(http_server&, connected_socket&&, bool tls, int listener_idx)")]]
+    connection(http_server& server, connected_socket&& fd, socket_address, bool tls, int listener_idx)
+            : connection(server, std::move(fd), tls, listener_idx) {}
+    connection(http_server& server, connected_socket&& fd, bool tls, int listener_idx)
             : _server(server)
             , _fd(std::move(fd))
             , _read_buf(_fd.input())
             , _write_buf(_fd.output())
             , _client_addr(_fd.remote_address())
             , _server_addr(_fd.local_address())
-            , _tls(tls) {
+            , _tls(tls)
+            , _listener_idx(listener_idx) {
         on_new_connection();
     }
     connection(http_server& server, connected_socket&& fd,
-            socket_address client_addr, socket_address server_addr, bool tls)
+            socket_address client_addr, socket_address server_addr, bool tls, int listener_idx)
             : _server(server)
             , _fd(std::move(fd))
             , _read_buf(_fd.input())
             , _write_buf(_fd.output())
             , _client_addr(std::move(client_addr))
             , _server_addr(std::move(server_addr))
-            , _tls(tls) {
+            , _tls(tls)
+            , _listener_idx(listener_idx) {
         on_new_connection();
     }
     ~connection();
@@ -112,7 +115,7 @@ public:
     future<> start_response();
 
     future<bool> generate_reply(std::unique_ptr<http::request> req);
-    void generate_error_reply_and_close(std::unique_ptr<http::request> req, http::reply::status_type status, const sstring& msg);
+    void generate_error_reply_and_close(std::unique_ptr<http::request> req, http::reply::status_type status, const sstring& msg, const sstring &content_type={});
 
     output_stream<char>& out();
 };
diff --git a/include/seastar/http/request.hh b/include/seastar/http/request.hh
index 50791fb72c4..f6119e5baf7 100644
--- a/include/seastar/http/request.hh
+++ b/include/seastar/http/request.hh
@@ -69,7 +69,8 @@ struct request {
     // deprecated: it is used to store last value of query parameters, but will be removed in the future
     [[deprecated("Use helper methods instead")]] std::unordered_map<sstring, sstring> query_parameters;
     httpd::parameters param;
-    [[deprecated("use content_stream (server-side) / write_body (client-side) instead")]]
+    // undo this deprecation until CORE-15051 is addressed
+    // [[deprecated("use content_stream (server-side) / write_body (client-side) instead")]]
     sstring content; // server-side deprecated: use content_stream instead
     /*
      * The handler should read the contents of this stream till reaching eof (i.e., the end of this request's content). Failing to do so
@@ -81,6 +82,7 @@ struct request {
     std::unordered_map<sstring, sstring> chunk_extensions;
     sstring protocol_name = "http";
     http::body_writer_type body_writer; // for client
+    int listener_idx = 0; // index of the accepting listener, see get_listener_idx(); 0 until assigned
 
     using query_parameters_type = std::unordered_map<sstring, std::vector<sstring>, seastar::internal::string_view_hash, std::equal_to<>>;
 private:
@@ -243,6 +245,13 @@ public:
     bool is_form_post() const {
         return content_type_class == ctclass::app_x_www_urlencoded;
     }
+    /**
+     * Get index of listener which accepted connection receiving this request
+     * @return position of listener in server _listeners vector
+     */
+    int get_listener_idx() const {
+        return listener_idx;
+    }
 
     bool should_keep_alive() const {
         if (_version == "0.9") {
diff --git a/include/seastar/net/api.hh b/include/seastar/net/api.hh
index 10f2e63c42a..1dcfde4c7a2 100644
--- a/include/seastar/net/api.hh
+++ b/include/seastar/net/api.hh
@@ -22,6 +22,7 @@
 #pragma once
 
 #include <chrono>
+#include <cstddef>
 #include <memory>
 #include <vector>
 #include <cstring>
@@ -192,6 +193,12 @@ struct connected_socket_input_stream_config final {
     unsigned max_buffer_size = 128 * 1024;
 };
 
+/// Certificate information (serial number and expiry)
+struct cert_info {
+    std::vector<std::byte> serial;
+    time_t expiry;
+};
+
 /// Distinguished name
 struct session_dn {
     sstring subject;
diff --git a/include/seastar/net/packet.hh b/include/seastar/net/packet.hh
index a26bbb91e33..dd6607af5ff 100644
--- a/include/seastar/net/packet.hh
+++ b/include/seastar/net/packet.hh
@@ -298,7 +298,7 @@ public:
         }
         while (idx < nr_frags()) {
             auto&& f = frag(idx++);
-            func(temporary_buffer<char>(f.base, f.size, _impl->_deleter.share()));
+            func(temporary_buffer<char>::maybe_unsafe_from_deleter(f.base, f.size, _impl->_deleter.share()));
         }
     }
     std::vector<temporary_buffer<char>> release() {
diff --git a/include/seastar/net/stack.hh b/include/seastar/net/stack.hh
index d6ad82fca9f..80d76c25713 100644
--- a/include/seastar/net/stack.hh
+++ b/include/seastar/net/stack.hh
@@ -46,8 +46,8 @@ public:
     virtual keepalive_params get_keepalive_parameters() const = 0;
     virtual void set_sockopt(int level, int optname, const void* data, size_t len) = 0;
     virtual int get_sockopt(int level, int optname, void* data, size_t len) const = 0;
-    virtual socket_address local_address() const noexcept = 0;
-    virtual socket_address remote_address() const noexcept = 0;
+    virtual socket_address local_address() const = 0;
+    virtual socket_address remote_address() const = 0;
     virtual future<> wait_input_shutdown() = 0;
 };
 
diff --git a/include/seastar/net/tls.hh b/include/seastar/net/tls.hh
index 7c726a242c8..ed9f6fe69d3 100644
--- a/include/seastar/net/tls.hh
+++ b/include/seastar/net/tls.hh
@@ -48,10 +48,31 @@ class socket_address;
  * Relatively thin SSL wrapper for socket IO.
  * (Can be expanded to other IO forms).
  *
- * The current underlying mechanism is
- * gnutls, however, all interfaces are kept
- * agnostic, so in theory it could be replaced
- * with OpenSSL or similar.
+ * Two underlying mechanisms are supported, GnuTLS and OpenSSL. Each one can
+ * be enabled or disabled at build time (\c Seastar_GNUTLS, \c Seastar_OPENSSL).
+ * When both are compiled in (\c SEASTAR_TLS_DUAL_BACKEND), the active backend
+ * is chosen at reactor startup via the \c --crypto-provider option; when only
+ * one is compiled in, that backend is fixed for the lifetime of the program.
+ *
+ * The interfaces here are kept agnostic so that either backend can be used
+ * without changes to client code.
+ *
+ * \section backend_lifetime When backend-dependent state is valid
+ *
+ * Several entry points below expose state that comes from the active backend
+ * (\ref error_category, \ref backend_name, the \c ERROR_* globals, and any
+ * function that internally creates a TLS session, credentials, or DH params).
+ *
+ * - In **single-backend** builds the backend is fixed at compile time. All
+ *   of these entry points are valid at any time, including from static
+ *   initializers and from unit tests that never start a reactor. The
+ *   \c ERROR_* globals are additionally declared \c const and statically
+ *   initialized to the backend's constants.
+ * - In **dual-backend** builds the backend is installed by
+ *   \c smp::configure() at reactor startup. Calling any backend-dependent
+ *   entry point before that point is undefined; the \c ERROR_* globals in
+ *   particular are zero-initialized and silently read as 0. Build with a
+ *   single TLS backend if you need them to be valid unconditionally.
  *
  */
 namespace tls {
@@ -199,7 +220,23 @@ namespace tls {
          */
         future<> set_system_trust();
 
-        // TODO add methods for certificate verification
+        /**
+         * Retrieve information about the loaded certificate(s).
+         *
+         * Returns a std::vector of cert_info, each extracted from a loaded
+         * certificate. If no certificates have been loaded, the returned
+         * optional is empty.
+         */
+        std::optional<std::vector<cert_info>> get_cert_info() const noexcept;
+
+        /**
+         * Retrieve information about the currently loaded trust list.
+         *
+         * Returns a std::vector of cert_info, each extracted from a CA in the
+         * trust list. If no trust list has been loaded, the returned optional
+         * is empty.
+         */
+        std::optional<std::vector<cert_info>> get_trust_list_info() const noexcept;
 
         /**
          * TLS handshake priority string. See gnutls docs and syntax at
@@ -344,6 +381,7 @@ namespace tls {
 
     using reload_callback = std::function<void(const std::unordered_set<sstring>&, std::exception_ptr)>;
     using reload_callback_ex = std::function<future<>(const credentials_builder&, const std::unordered_set<sstring>&, std::exception_ptr)>;
+    using reload_callback_with_creds = std::function<void(const std::unordered_set<sstring> &, const certificate_credentials &, std::exception_ptr, std::optional<blob>)>;
 
     /**
      * Intentionally "primitive", and more importantly, copyable
@@ -410,6 +448,11 @@ namespace tls {
 
         future<shared_ptr<certificate_credentials>> build_reloadable_certificate_credentials(reload_callback, std::optional<std::chrono::milliseconds> tolerance = {}) const;
         future<shared_ptr<server_credentials>> build_reloadable_server_credentials(reload_callback, std::optional<std::chrono::milliseconds> tolerance = {}) const;
+
+        future<shared_ptr<certificate_credentials>> build_reloadable_certificate_credentials(reload_callback_with_creds, std::optional<std::chrono::milliseconds> tolerance = {}) const;
+        future<shared_ptr<server_credentials>> build_reloadable_server_credentials(reload_callback_with_creds, std::optional<std::chrono::milliseconds> tolerance = {}) const;
+
+        std::optional<blob> get_trust_file_blob() const;
     private:
         friend class reloadable_credentials_base;
 
@@ -575,6 +618,13 @@ namespace tls {
      */
     future<std::optional<session_dn>> get_dn_information(connected_socket& socket);
 
+    enum class dn_format {
+        legacy, // legacy format
+        rfc2253
+    };
+
+    future<std::optional<session_dn>> get_dn_information(connected_socket& socket, dn_format format);
+
     /**
      * Force a re-handshake (session key renegotiotion on TLS1.3).
      * Can only be called on a server side socket.
@@ -696,39 +746,49 @@ namespace tls {
     std::ostream& operator<<(std::ostream&, subject_alt_name_type);
 
     /**
-     * Error handling.
+     * The error_category instance used by exceptions thrown by TLS.
      *
-     * The error_category instance used by exceptions thrown by TLS
+     * See \ref backend_lifetime for when this is valid to call.
      */
     const std::error_category& error_category();
 
     /**
      * Returns the name of the active TLS backend (e.g. "gnutls", "openssl").
+     *
+     * See \ref backend_lifetime for when this is valid to call.
      */
     const char* backend_name();
 
     /**
-     * The more common error codes encountered in TLS.
-     * Not an exhaustive list. Add exports as needed.
+     * The more common error codes encountered in TLS. Not an exhaustive
+     * list — add exports as needed.
+     *
+     * See \ref backend_lifetime for when these are valid to read.
      */
-    extern int ERROR_UNKNOWN_COMPRESSION_ALGORITHM;
-    extern int ERROR_UNKNOWN_CIPHER_TYPE;
-    extern int ERROR_INVALID_SESSION;
-    extern int ERROR_UNEXPECTED_HANDSHAKE_PACKET;
-    extern int ERROR_UNKNOWN_CIPHER_SUITE;
-    extern int ERROR_UNKNOWN_ALGORITHM;
-    extern int ERROR_UNSUPPORTED_SIGNATURE_ALGORITHM;
-    extern int ERROR_SAFE_RENEGOTIATION_FAILED;
-    extern int ERROR_UNSAFE_RENEGOTIATION_DENIED;
-    extern int ERROR_UNKNOWN_SRP_USERNAME;
-    extern int ERROR_PREMATURE_TERMINATION;
-    extern int ERROR_PUSH;
-    extern int ERROR_PULL;
-    extern int ERROR_UNEXPECTED_PACKET;
-    extern int ERROR_UNSUPPORTED_VERSION;
-    extern int ERROR_NO_CIPHER_SUITES;
-    extern int ERROR_DECRYPTION_FAILED;
-    extern int ERROR_MAC_VERIFY_FAILED;
+#ifdef SEASTAR_TLS_DUAL_BACKEND
+#define SEASTAR_TLS_ERROR_QUALIFIERS extern
+#else
+#define SEASTAR_TLS_ERROR_QUALIFIERS extern const
+#endif
+    SEASTAR_TLS_ERROR_QUALIFIERS int ERROR_UNKNOWN_COMPRESSION_ALGORITHM;
+    SEASTAR_TLS_ERROR_QUALIFIERS int ERROR_UNKNOWN_CIPHER_TYPE;
+    SEASTAR_TLS_ERROR_QUALIFIERS int ERROR_INVALID_SESSION;
+    SEASTAR_TLS_ERROR_QUALIFIERS int ERROR_UNEXPECTED_HANDSHAKE_PACKET;
+    SEASTAR_TLS_ERROR_QUALIFIERS int ERROR_UNKNOWN_CIPHER_SUITE;
+    SEASTAR_TLS_ERROR_QUALIFIERS int ERROR_UNKNOWN_ALGORITHM;
+    SEASTAR_TLS_ERROR_QUALIFIERS int ERROR_UNSUPPORTED_SIGNATURE_ALGORITHM;
+    SEASTAR_TLS_ERROR_QUALIFIERS int ERROR_SAFE_RENEGOTIATION_FAILED;
+    SEASTAR_TLS_ERROR_QUALIFIERS int ERROR_UNSAFE_RENEGOTIATION_DENIED;
+    SEASTAR_TLS_ERROR_QUALIFIERS int ERROR_UNKNOWN_SRP_USERNAME;
+    SEASTAR_TLS_ERROR_QUALIFIERS int ERROR_PREMATURE_TERMINATION;
+    SEASTAR_TLS_ERROR_QUALIFIERS int ERROR_PUSH;
+    SEASTAR_TLS_ERROR_QUALIFIERS int ERROR_PULL;
+    SEASTAR_TLS_ERROR_QUALIFIERS int ERROR_UNEXPECTED_PACKET;
+    SEASTAR_TLS_ERROR_QUALIFIERS int ERROR_UNSUPPORTED_VERSION;
+    SEASTAR_TLS_ERROR_QUALIFIERS int ERROR_NO_CIPHER_SUITES;
+    SEASTAR_TLS_ERROR_QUALIFIERS int ERROR_DECRYPTION_FAILED;
+    SEASTAR_TLS_ERROR_QUALIFIERS int ERROR_MAC_VERIFY_FAILED;
+#undef SEASTAR_TLS_ERROR_QUALIFIERS
 }
 }
 
diff --git a/include/seastar/rpc/rpc_impl.hh b/include/seastar/rpc/rpc_impl.hh
index 8a73d312447..6c2a6c3e77d 100644
--- a/include/seastar/rpc/rpc_impl.hh
+++ b/include/seastar/rpc/rpc_impl.hh
@@ -684,12 +684,12 @@ auto recv_helper(uint64_t verb, signature<Ret (InArgs...)> sig, Func&& func, Wan
                                                                  gate::holder guard) mutable {
         auto memory_consumed = client->estimate_request_size(data.size);
         if (memory_consumed > client->max_request_size()) {
-            auto err = format("request size {:d} large than memory limit {:d}, verb {}", memory_consumed, client->max_request_size(), verb);
+            auto err = ::seastar::format("request size {:d} large than memory limit {:d}, verb {}", memory_consumed, client->max_request_size(), verb);
             client->get_logger()(client->peer_address(), err);
             // FIXME: future is discarded
             (void)try_with_gate(client->get_server().reply_gate(), [verb, client, timeout, msg_id, err = std::move(err)] {
                 return reply<Serializer>(wait_style(), futurize<Ret>::make_exception_future(std::runtime_error(err.c_str())), verb, msg_id, client, timeout, std::nullopt).handle_exception([verb, client, msg_id] (std::exception_ptr eptr) {
-                    client->get_logger()(client->info(), msg_id, seastar::format("got exception while processing an oversized message: {} for verb {}", eptr, verb));
+                    client->get_logger()(client->info(), msg_id, ::seastar::format("got exception while processing an oversized message: {} for verb {}", eptr, verb));
                 });
             }).handle_exception_type([] (gate_closed_exception&) {/* ignore */});
             return make_ready_future();
@@ -703,11 +703,11 @@ auto recv_helper(uint64_t verb, signature<Ret (InArgs...)> sig, Func&& func, Wan
                         auto start = rpc_clock_type::now();
                         return apply(func, client->info(), timeout, WantClientInfo(), WantTimePoint(), signature(), std::move(args)).then_wrapped([verb, client, timeout, msg_id, permit = std::move(permit), start] (futurize_t<Ret> ret) mutable {
                             return reply<Serializer>(wait_style(), std::move(ret), verb, msg_id, client, timeout, rpc_clock_type::now() - start).handle_exception([verb, permit = std::move(permit), client, msg_id] (std::exception_ptr eptr) {
-                                client->get_logger()(client->info(), msg_id, seastar::format("got exception while processing a message: {}, verb {}", eptr, verb));
+                                client->get_logger()(client->info(), msg_id, ::seastar::format("got exception while processing a message: {}, verb {}", eptr, verb));
                             });
                         });
                     } catch (...) {
-                        client->get_logger()(client->info(), msg_id, seastar::format("caught exception while processing a message: {}, verb {}", std::current_exception(), verb));
+                        client->get_logger()(client->info(), msg_id, ::seastar::format("caught exception while processing a message: {}, verb {}", std::current_exception(), verb));
                         return make_ready_future();
                     }
                 }).handle_exception_type([g = std::move(g)] (gate_closed_exception&) {/* ignore */});
diff --git a/include/seastar/util/assert.hh b/include/seastar/util/assert.hh
index 2c8eba9018d..e3a7ffc5962 100644
--- a/include/seastar/util/assert.hh
+++ b/include/seastar/util/assert.hh
@@ -34,3 +34,11 @@ namespace seastar::internal {
                                            __PRETTY_FUNCTION__);      \
         }                                                             \
     } while (0)
+
+/// Like SEASTAR_ASSERT(), but only active when SEASTAR_DEBUG is defined
+/// (Debug, Sanitize, and Fuzz build modes). Compiles to nothing otherwise.
+#ifdef SEASTAR_DEBUG
+#define SEASTAR_DEBUG_ASSERT(x) SEASTAR_ASSERT(x)
+#else
+#define SEASTAR_DEBUG_ASSERT(x) do { (void)sizeof(x); } while (0)
+#endif
diff --git a/include/seastar/util/backtrace.hh b/include/seastar/util/backtrace.hh
index 36795999a4f..83306dd12a7 100644
--- a/include/seastar/util/backtrace.hh
+++ b/include/seastar/util/backtrace.hh
@@ -25,6 +25,7 @@
 #include <seastar/core/sstring.hh>
 #include <seastar/core/scheduling.hh>
 #include <seastar/core/shared_ptr.hh>
+#include <seastar/core/internal/signal_mutex.hh>
 #include <seastar/util/assert.hh>
 
 #if __has_include(<execinfo.h>)
@@ -57,6 +58,17 @@ bool operator==(const frame& a, const frame& b) noexcept;
 // will be considered as part of the executable.
 frame decorate(uintptr_t addr) noexcept;
 
+
+// Wrapper for ::backtrace which takes a signal-safe thread-local mutex before
+// calling ::backtrace, to avoid concurrent backtrace calls on the same thread,
+// which is known to crash. If the lock cannot be obtained, no backtrace is taken
+// and this method returns 0.
+#ifdef HAVE_EXECINFO
+int guarded_backtrace(void **array, int size) noexcept;
+#endif
+
+
+
 // Invokes func for each frame passing it as argument.
 // incremental=false is the default mode and simply calls ::backtrace once
 // and then calls func for each frame. If the ::backtrace call crashes,
@@ -74,7 +86,7 @@ void backtrace(Func&& func, bool incremental = false) noexcept(noexcept(func(fra
 
     if (incremental) {
         for (size_t last_frame = 1; last_frame <= max_backtrace; ++last_frame) {
-            int n = ::backtrace(buffer, last_frame);
+            int n = guarded_backtrace(buffer, last_frame);
             if (n < static_cast<int>(last_frame)) {
                 return;
             }
@@ -82,7 +94,7 @@ void backtrace(Func&& func, bool incremental = false) noexcept(noexcept(func(fra
             func(decorate(ip - 1));
         }
     } else {
-        int n = ::backtrace(buffer, max_backtrace);
+        int n = guarded_backtrace(buffer, max_backtrace);
         for (int i = 0; i < n; ++i) {
             auto ip = reinterpret_cast<uintptr_t>(buffer[i]);
             func(decorate(ip - 1));
@@ -122,6 +134,10 @@ public:
     bool operator!=(const simple_backtrace& o) const noexcept {
         return !(*this == o);
     }
+
+    bool is_empty() const noexcept {
+        return _frames.empty();
+    }
 };
 
 using shared_backtrace = seastar::lw_shared_ptr<simple_backtrace>;
diff --git a/include/seastar/util/log.hh b/include/seastar/util/log.hh
index 8cc8bd5bf56..f8d178c9064 100644
--- a/include/seastar/util/log.hh
+++ b/include/seastar/util/log.hh
@@ -298,6 +298,25 @@ public:
         }
     }
 
+    /// \cond internal
+    /// logs to desired level if enabled, otherwise we ignore the log line
+    ///
+    /// \param writer a function which writes directly to the underlying log buffer
+    /// \param fmt - optional logger::format_info passed down the call chain.
+    ///
+    /// This is a low level method for use cases where it is very important to
+    /// avoid any allocations. The \arg writer will be passed an
+    /// internal::log_buf::inserter_iterator that allows it to write into the log
+    /// buffer directly, avoiding the use of any intermediary buffers.
+    void log(log_level level, log_writer& writer, format_info_t<> fmt = {}) noexcept {
+        if (is_enabled(level)) {
+            try {
+                do_log(level, writer);
+            } catch (...) {
+                failed_to_log(std::current_exception(), "", fmt.loc);
+            }
+        }
+    }
     /// logs to desired level if enabled, otherwise we ignore the log line
     ///
     /// \param writer a function which writes directly to the underlying log buffer
diff --git a/src/core/cpu_profiler.cc b/src/core/cpu_profiler.cc
new file mode 100644
index 00000000000..b920cf846f8
--- /dev/null
+++ b/src/core/cpu_profiler.cc
@@ -0,0 +1,247 @@
+/*
+ * This file is open source software, licensed to you under the terms
+ * of the Apache License, Version 2.0 (the "License").  See the NOTICE file
+ * distributed with this work for additional information regarding copyright
+ * ownership.  You may not use this file except in compliance with the License.
+ *
+ * You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+/*
+ * Copyright (C) 2023 ScyllaDB
+ */
+
+#include <chrono>
+#include <optional>
+#include <random>
+
+#include <seastar/core/internal/cpu_profiler.hh>
+#include <seastar/core/scheduling.hh>
+#include <seastar/util/log.hh>
+
+namespace seastar {
+seastar::logger cpu_profiler_logger("cpu_profiler");
+
+namespace internal {
+
+using namespace std::chrono_literals;
+
+namespace {
+thread_local bool force_drop_stacktraces = false;
+}
+
+void profiler_drop_stacktraces(bool should_drop) noexcept {
+    force_drop_stacktraces = should_drop;
+}
+
+/**
+ * The profiler breaks sample periods into windows of size _cfg.period.
+ * I.e, [1ns, _cfg.period), [_cfg.period, 2*_cfg.period)... etc. And it
+ * will ensure that a sample is taken exactly once per window. The goal
+ * of this function is to randomly select a point in the window to sample.
+ * This avoids potential bias from sampling at the same point in time every
+ * window.
+ */
+std::chrono::nanoseconds cpu_profiler::get_next_timeout() {
+    using ns_rep = std::chrono::nanoseconds::rep;
+    static thread_local std::mt19937_64 gen = std::mt19937_64(std::default_random_engine()());
+
+    auto remaining_time_for_last_profiler_period = _cfg.period - _last_set_timeout;
+
+    std::uniform_int_distribution<ns_rep> profiler_dist{0, _cfg.period / 1ns};
+    auto rwait = profiler_dist(gen);
+    _last_set_timeout = std::chrono::nanoseconds(rwait);
+
+    // The interrupt needs to be at least 1ns for perf_event
+    auto wait = std::max(_last_set_timeout + remaining_time_for_last_profiler_period, 1ns);
+    return wait;
+}
+
+bool cpu_profiler::is_enabled() const {
+    return _cfg.enabled;
+}
+
+std::chrono::nanoseconds cpu_profiler::period() const {
+    return _cfg.period;
+}
+
+void cpu_profiler::update_config(cpu_profiler_config cfg) {
+    auto is_stopped = _is_stopped;
+    stop();
+    _cfg = cfg;
+    // Don't start the profiler if it's been explicitly
+    // stopped elsewhere.
+    if (!is_stopped) {
+        start();
+    }
+}
+
+void cpu_profiler::stop() {
+    if (_is_stopped) {
+        return;
+    }
+    if (_cfg.enabled) {
+        disarm_timer();
+    }
+    _is_stopped = true;
+}
+
+void cpu_profiler::start() {
+    _is_stopped = false;
+    if (_cfg.enabled) {
+        _last_set_timeout = _cfg.period;
+        auto next = get_next_timeout();
+        arm_timer(next);
+    }
+}
+
+void cpu_profiler::on_signal() {
+    if (is_spurious_signal()) {
+        return;
+    }
+
+    // During exception handling in libgcc there is a critical section
+    // where the stack is being modified so execution can be returned to
+    // a handler for the exception. This modification isn't captured by
+    // the eh_frames for the program though. So when libgcc's backtrace
+    // enters the partially modified stack it will follow invalid addresses
+    // and cause a segfault. To avoid this we check if any exception
+    // is currently being unwound and avoid taking a profiling sample if so.
+    //
+    // Note: this only protects against C++ exceptions, therefore foreign
+    // exceptions or long jumps could still cause segfaults within the profiler.
+    const bool no_uncaught_exceptions = std::uncaught_exceptions() == 0;
+
+    if (force_drop_stacktraces) {
+        _stats.dropped_samples_from_manual_disablement++;
+    } else if (!no_uncaught_exceptions) {
+        _stats.dropped_samples_from_exceptions++;
+    } else if (auto guard_opt = _traces_mutex.try_lock(); guard_opt.has_value()) {
+        // Skip the sample if the main thread is currently reading
+        // _traces. This case shouldn't happen often though.
+
+        // The oldest trace will be overridden if the circular
+        // buffer is full so update the bookkeeping to indicate
+        // this.
+        if (_traces.size() == _traces.capacity()) {
+            _traces.pop_front();
+            _stats.dropped_samples_from_buffer_full++;
+        }
+        _traces.emplace_back();
+        _traces.back().user_backtrace = current_backtrace_tasklocal();
+        _traces.back().sg = current_scheduling_group();
+
+        if (_traces.back().user_backtrace.is_empty()) {
+            // An empty backtrace implies that there was some issue collecting
+            // the backtrace. Currently the most likely reason is that another
+            // backtrace was being collected when the profiler interrupted the
+            // process.
+            _stats.dropped_samples_from_mutex_contention++;
+        }
+
+        auto kernel_bt = try_get_kernel_backtrace();
+        if (kernel_bt) {
+            auto& kernel_vec = _traces.back().kernel_backtrace;
+
+            kernel_bt->read_backtrace([&] (uintptr_t addr) {
+                if((kernel_vec.size() + 1) <= kernel_vec.max_size()) {
+                    kernel_vec.push_back(addr);
+                }
+            });
+        }
+    } else {
+        _stats.dropped_samples_from_mutex_contention++;
+    }
+
+    auto next = get_next_timeout();
+    arm_timer(next);
+}
+
+size_t cpu_profiler::results(std::vector<cpu_profiler_trace>& results_buffer) {
+    // Since this is not called in the interrupt it should always succeed
+    // in acquiring the lock.
+    auto guard_opt = _traces_mutex.try_lock();
+    if (!guard_opt.has_value()) {
+        results_buffer.clear();
+        return 0;
+    }
+
+    results_buffer.assign(_traces.cbegin(), _traces.cend());
+    _traces.clear();
+
+    auto dropped_samples = _stats.sum_dropped();
+    _stats.clear_dropped();
+
+    return dropped_samples;
+}
+
+void cpu_profiler_posix_timer::arm_timer(std::chrono::nanoseconds ns) {
+    return _timer.arm_timer(ns);
+}
+
+void cpu_profiler_posix_timer::disarm_timer() {
+    return _timer.disarm_timer();
+}
+
+bool cpu_profiler_linux_perf_event::is_spurious_signal() {
+    return _perf_event.is_spurious_signal();
+}
+
+std::optional<linux_perf_event::kernel_backtrace>
+cpu_profiler_linux_perf_event::try_get_kernel_backtrace() {
+    return _perf_event.try_get_kernel_backtrace();
+}
+
+void cpu_profiler_linux_perf_event::arm_timer(std::chrono::nanoseconds ns) {
+    _perf_event.arm_timer(ns);
+}
+
+void cpu_profiler_linux_perf_event::disarm_timer() {
+    _perf_event.disarm_timer();
+}
+
+std::unique_ptr<cpu_profiler_linux_perf_event>
+cpu_profiler_linux_perf_event::try_make(cpu_profiler_config cfg) {
+    return std::make_unique<cpu_profiler_linux_perf_event>(
+            linux_perf_event::try_make({signal_number()}), std::move(cfg));
+}
+
+std::unique_ptr<cpu_profiler> make_cpu_profiler(cpu_profiler_config cfg) {
+    // Prefer the perf_event-based profiler; on failure fall back to a posix timer.
+    std::unique_ptr<cpu_profiler> profiler;
+
+    try {
+        profiler = cpu_profiler_linux_perf_event::try_make(cfg);
+    } catch (const std::system_error& e) {
+        // This failure occurs when /proc/sys/kernel/perf_event_paranoid is set
+        // to 2 or higher, and is expected since most distributions set it that
+        // way as of 2023. In this case we log a different message and only at INFO
+        // level on shard 0.
+        if (e.code() == std::error_code(EACCES, std::system_category())) {
+            cpu_profiler_logger.info0("Perf-based cpu profiler creation failed (EACCESS), "
+                    "try setting /proc/sys/kernel/perf_event_paranoid to 1 or less to "
+                    "enable kernel backtraces: falling back to posix timer.");
+        } else {
+            cpu_profiler_logger.warn("Creation of perf_event based cpu profiler failed: falling back to posix timer: {}", e.what());
+        }
+    } catch (...) {
+        cpu_profiler_logger.warn("Creation of perf_event based cpu profiler failed: falling back to posix timer: {}", std::current_exception());
+    }
+
+    if (!profiler) {
+        profiler = std::make_unique<cpu_profiler_posix_timer>(cfg);
+    }
+
+    return profiler;
+}
+
+} // namespace internal
+} // namespace seastar
diff --git a/src/core/crypto.cc b/src/core/crypto.cc
index 0a6ce42866e..47d494f4822 100644
--- a/src/core/crypto.cc
+++ b/src/core/crypto.cc
@@ -20,21 +20,48 @@
  */
 
 #include "crypto.hh"
+#include <seastar/util/assert.hh>
 #include <memory>
 
 namespace seastar::internal::crypto {
 
+#ifdef SEASTAR_TLS_DUAL_BACKEND
+
+// Dual-backend build: the active provider is selected at reactor startup
+// (--crypto-provider) and installed via set_provider() from smp::configure().
 static std::unique_ptr<crypto_provider> the_provider;
 
 crypto_provider& provider() {
+    SEASTAR_DEBUG_ASSERT(the_provider != nullptr);
     return *the_provider;
 }
 
 void set_provider(std::unique_ptr<crypto_provider> p) {
+    SEASTAR_ASSERT(the_provider == nullptr);
     the_provider = std::move(p);
     provider().get_tls_backend().init_error_codes();
 }
 
+void reset_provider() {
+    the_provider.reset();
+}
+
+#else // single-backend
+
+// Single-backend build: the provider is fixed at compile time. Use a
+// function-local static so provider() works at any time, including before
+// reactor startup. No set_provider() is compiled or needed.
+crypto_provider& provider() {
+#ifdef SEASTAR_HAVE_GNUTLS
+    static auto instance = create_gnutls_provider();
+#else // SEASTAR_HAVE_OPENSSL
+    static auto instance = create_openssl_provider();
+#endif
+    return *instance;
+}
+
+#endif // SEASTAR_TLS_DUAL_BACKEND
+
 md5_hasher make_md5_hasher() {
     return provider().make_md5_hasher();
 }
diff --git a/src/core/crypto.hh b/src/core/crypto.hh
index 46a1a1998fa..223207a2d11 100644
--- a/src/core/crypto.hh
+++ b/src/core/crypto.hh
@@ -73,6 +73,11 @@ public:
     virtual std::unique_ptr<tls::dh_params_impl> make_dh_params(const tls::blob&, tls::x509_crt_format) = 0;
 
     /// \brief Initialize backend-specific TLS error code constants.
+    ///
+    /// In dual-backend builds this fills in the legacy \c tls::ERROR_*
+    /// globals from the active backend's values. In single-backend builds
+    /// the globals are \c const, statically initialized in the backend's
+    /// own translation unit, and this method is a no-op.
     virtual void init_error_codes() = 0;
 
     /// \brief Return the name of this TLS backend (e.g. "gnutls", "openssl").
@@ -106,16 +111,37 @@ public:
 
 /// \brief Return the process-wide crypto provider.
 ///
-/// Must be called after set_provider().  The returned reference
-/// remains valid for the lifetime of the process.
+/// In dual-backend builds, must be called after \ref set_provider(). The
+/// returned reference remains valid for the lifetime of the process.
+/// In single-backend builds the provider is fixed at compile time, lazily
+/// created on first call, and \ref provider() works at any time including
+/// from static initializers / before reactor startup.
 crypto_provider& provider();
 
+#ifdef SEASTAR_TLS_DUAL_BACKEND
 /// \brief Install the process-wide crypto provider.
 ///
-/// Must be called exactly once, before any call to provider().
-/// Ownership is transferred to the crypto subsystem.
+/// Must be called exactly once per \c set_provider / \c reset_provider
+/// cycle, before any call to \ref provider(). Ownership is transferred
+/// to the crypto subsystem.
+///
+/// Only compiled in dual-backend builds. In single-backend builds the
+/// provider is fixed at compile time and \ref provider() handles the
+/// lifetime internally.
 void set_provider(std::unique_ptr<crypto_provider> p);
 
+/// \brief Tear down the process-wide crypto provider installed by
+/// \ref set_provider.
+///
+/// Called from \c smp::cleanup() so that a subsequent \c app::run()
+/// (and the \c smp::configure() it triggers) starts from a clean slate
+/// and can call \ref set_provider again. Safe to call when no provider
+/// is installed.
+///
+/// Only compiled in dual-backend builds.
+void reset_provider();
+#endif
+
 #ifdef SEASTAR_HAVE_GNUTLS
 /// \brief Create a GnuTLS-backed crypto provider.
 std::unique_ptr<crypto_provider> create_gnutls_provider();
diff --git a/src/core/disk_params.cc b/src/core/disk_params.cc
index fa1abab1385..a3db216b8c2 100644
--- a/src/core/disk_params.cc
+++ b/src/core/disk_params.cc
@@ -67,7 +67,10 @@ struct convert<seastar::internal::disk_params> {
         if (node["rate_factor"]) {
             mp.rate_factor = node["rate_factor"].as<float>();
         }
+        if (node["max_cost_function"]) {
+            mp.max_cost_function = node["max_cost_function"].as<bool>();
+        }
         return true;
     }
 };
 }
@@ -203,6 +206,12 @@ struct io_queue::config disk_config_params::generate_config(const disk_params& p
     cfg.stall_threshold = stall_threshold();
     cfg.physical_block_size = p.physical_block_size;
 
+    cfg.read_bytes_rate = p.read_bytes_rate;
+    cfg.write_bytes_rate = p.write_bytes_rate;
+    cfg.read_req_rate = p.read_req_rate;
+    cfg.write_req_rate = p.write_req_rate;
+    cfg.max_cost_function = p.max_cost_function;
+
     return cfg;
 }
 
diff --git a/src/core/fstream.cc b/src/core/fstream.cc
index 176b6789d52..1d87284d1d7 100644
--- a/src/core/fstream.cc
+++ b/src/core/fstream.cc
@@ -328,7 +328,7 @@ class file_data_source_impl : public data_source_impl {
                     if (start < pos) {
                         tmp.trim_front(pos - start);
                     }
-                    return make_ready_future<temporary_buffer<char>>(temporary_buffer<char>(reinterpret_cast<char*>(tmp.get_write()), tmp.size(), tmp.release()));
+                    return make_ready_future<temporary_buffer<char>>(temporary_buffer<char>::maybe_unsafe_from_deleter(reinterpret_cast<char*>(tmp.get_write()), tmp.size(), tmp.release()));
                 }
             }));
             _remain -= end - _pos;
diff --git a/src/core/io_queue.cc b/src/core/io_queue.cc
index 696faf94117..7f1a6a95253 100644
--- a/src/core/io_queue.cc
+++ b/src/core/io_queue.cc
@@ -37,6 +37,7 @@
 #include <seastar/core/io_queue.hh>
 #include <seastar/core/io_intent.hh>
 #include <seastar/core/reactor.hh>
+#include <seastar/core/smp.hh>
 #include <seastar/core/when_all.hh>
 #include <seastar/core/metrics.hh>
 #include <seastar/core/internal/io_desc.hh>
@@ -861,7 +862,7 @@ void io_queue::register_stats(sstring name, priority_class_data& pc) {
     }
 
     new_metrics.add_group("io_queue", std::move(metrics));
-    pc.metric_groups = std::exchange(new_metrics, {});
+    pc.metric_groups = std::exchange(new_metrics, sm::metric_groups{});
 }
 
 io_queue::priority_class_data& io_queue::find_or_create_class(internal::priority_class pc) {
@@ -977,7 +978,14 @@ double internal::request_tokens(io_direction_and_length dnl, const io_queue::con
 
     const auto& m = mult[dnl.rw_idx()];
 
-    return double(m.weight) / cfg.req_count_rate + double(m.size) * (dnl.length() >> io_queue::block_size_shift) / cfg.blocks_count_rate;
+    // See https://redpandadata.atlassian.net/wiki/x/CgAIGw#io-queue-cost-function
+    double iops_cost = double(m.weight) / cfg.req_count_rate;
+    double tp_cost = double(m.size) * (dnl.length() >> io_queue::block_size_shift) / cfg.blocks_count_rate;
+    if (cfg.max_cost_function) {
+        return std::max(iops_cost, tp_cost);
+    } else {
+        return iops_cost + tp_cost;
+    }
 }
 
 fair_queue_entry::capacity_t io_queue::request_capacity(io_direction_and_length dnl) const noexcept {
diff --git a/src/core/memory.cc b/src/core/memory.cc
index 819fafdf218..a5b3e96e070 100644
--- a/src/core/memory.cc
+++ b/src/core/memory.cc
@@ -156,6 +156,21 @@ thread_local constinit int abort_on_alloc_failure_suppressed = 0;
 
 }
 
+static thread_local int fallback_to_system_nest_count = 0;
+
+scoped_system_alloc_fallback::scoped_system_alloc_fallback() noexcept {
+    ++fallback_to_system_nest_count;
+}
+
+scoped_system_alloc_fallback::~scoped_system_alloc_fallback() noexcept {
+    --fallback_to_system_nest_count;
+    SEASTAR_ASSERT(fallback_to_system_nest_count >= 0);
+}
+
+void enable_abort_on_allocation_failure() {
+    set_abort_on_allocation_failure(true);
+}
+
 static std::pmr::polymorphic_allocator<char> static_malloc_allocator{std::pmr::get_default_resource()};;
 std::pmr::polymorphic_allocator<char>* malloc_allocator{&static_malloc_allocator};
 
@@ -238,7 +253,7 @@ std::atomic<bool> use_transparent_hugepages = true;
 namespace alloc_stats {
 
 enum class types { allocs, frees, cross_cpu_frees, total_bytes_allocated, reclaims, large_allocs, failed_allocs,
-    foreign_mallocs, foreign_frees, foreign_cross_frees, enum_size };
+    foreign_mallocs, foreign_frees, foreign_cross_frees, fallback_allocs, enum_size };
 
 using stats_array = std::array<uint64_t, static_cast<std::size_t>(types::enum_size)>;
 using stats_atomic_array = std::array<std::atomic_uint64_t, static_cast<std::size_t>(types::enum_size)>;
@@ -533,6 +548,10 @@ static_assert(object_size_with_alloc_site(max_small_allocation - sizeof(allocati
 static_assert(object_size_with_alloc_site(max_small_allocation - sizeof(allocation_site_ptr) - 2) == max_small_allocation - 2, "");
 #endif
 
+// if not, do_test_fallback_alloc needs to be updated to use a size
+// larger than the small alloc threshold
+static_assert(max_small_allocation < 32 * 1024);
+
 struct cross_cpu_free_item {
     cross_cpu_free_item* next;
 };
@@ -862,7 +881,11 @@ cpu_pages::allocate_large_and_trim(unsigned n_pages, bool should_sample) {
 void
 cpu_pages::warn_large_allocation(size_t size) {
     alloc_stats::increment_local(alloc_stats::types::large_allocs);
-    seastar_memory_logger.warn("oversized allocation: {} bytes. This is non-fatal, but could lead to latency and/or fragmentation issues. Please report: at {}", size, current_backtrace());
+    if (fallback_to_system_nest_count) {
+        seastar_memory_logger.debug("large allocation: {} bytes (in scoped fallback mode)", size);
+    } else {
+        seastar_memory_logger.warn("oversized allocation: {} bytes. This is non-fatal, but could lead to latency and/or fragmentation issues. Please report: at {}", size, current_backtrace());
+    }
 }
 
 allocation_site_ptr
@@ -1169,7 +1192,7 @@ static void free_slowpath(void* obj, S size) {
 void
 cpu_pages::do_foreign_free(void* ptr) {
     // handles:
-    // 1) non-seastar pointers
+    // 1) non-seastar pointers (including system fallback allocs)
     // 2) cross-shard frees
     // 3) null pointer
 
@@ -1655,6 +1678,20 @@ static inline void* finish_allocation(void* ptr, size_t size) {
     return ptr;
 }
 
+static void * maybe_system_fallback(void *ptr, size_t align, size_t size) {
+    const bool have_system_func = align ? static_cast<bool>(original_aligned_alloc_func) : static_cast<bool>(original_malloc_func);
+    if (ptr || !fallback_to_system_nest_count || !have_system_func) {
+        // allocation succeeded, or we are outside a fallback scope, or no system function is known
+        return ptr;
+    }
+    // we are in a fallback scope and the allocation failed: call the system allocator instead;
+    // fallback allocs count as foreign allocs because they also count as foreign frees
+    alloc_stats::increment(alloc_stats::types::foreign_mallocs);
+    alloc_stats::increment(alloc_stats::types::fallback_allocs);
+    return align ? original_aligned_alloc_func(align, size) : original_malloc_func(size);
+}
+
+
 void *allocate_slowpath(size_t size) {
     if (!is_reactor_thread) {
         if (original_malloc_func) {
@@ -1707,7 +1744,9 @@ void *allocate_slowpath(size_t size) {
         }
     } else {
         ptr = allocate_large(size, should_sample);
+        ptr = maybe_system_fallback(ptr, 0, size);
     }
+
     return finish_allocation(ptr, size);
 }
 
@@ -1761,6 +1800,7 @@ void* allocate_aligned(size_t align, size_t size) {
         }
     } else {
         ptr = allocate_large_aligned(align, size, should_sample);
+        ptr = maybe_system_fallback(ptr, align, size);
     }
     return finish_allocation(ptr, size);
 }
@@ -1948,7 +1988,7 @@ configure(std::vector<resource::memory> m, bool mbind,
 statistics stats() {
     return statistics{alloc_stats::get(alloc_stats::types::allocs), alloc_stats::get(alloc_stats::types::frees), alloc_stats::get(alloc_stats::types::cross_cpu_frees),
         cpu_mem.nr_pages * page_size, cpu_mem.nr_free_pages * page_size, alloc_stats::get(alloc_stats::types::total_bytes_allocated), alloc_stats::get(alloc_stats::types::reclaims), alloc_stats::get(alloc_stats::types::large_allocs),
-        alloc_stats::get(alloc_stats::types::failed_allocs), alloc_stats::get(alloc_stats::types::foreign_mallocs), alloc_stats::get(alloc_stats::types::foreign_frees),
+        alloc_stats::get(alloc_stats::types::failed_allocs), alloc_stats::get(alloc_stats::types::fallback_allocs), alloc_stats::get(alloc_stats::types::foreign_mallocs), alloc_stats::get(alloc_stats::types::foreign_frees),
         alloc_stats::get(alloc_stats::types::foreign_cross_frees)};
 }
 
@@ -2719,7 +2759,7 @@ void configure_minimal()
 {}
 
 statistics stats() {
-    return statistics{0, 0, 0, 1 << 30, 1 << 30, 0, 0, 0, 0, 0, 0, 0};
+    return statistics{0, 0, 0, 1 << 30, 1 << 30, 0, 0, 0, 0, 0, 0, 0, 0};
 }
 
 size_t free_memory() {
diff --git a/src/core/metrics.cc b/src/core/metrics.cc
index 1e3bf662177..2dfd4ba0bfd 100644
--- a/src/core/metrics.cc
+++ b/src/core/metrics.cc
@@ -39,16 +39,21 @@ namespace seastar {
 extern seastar::logger seastar_logger;
 namespace metrics {
 
+int default_handle() {
+    return impl::default_handle(); // forward to the impl-level definition of the default handle
+}
+
 double_registration::double_registration(std::string what): std::runtime_error(what) {}
 
-metric_groups::metric_groups() noexcept : _impl(impl::create_metric_groups()) {
+metric_groups::metric_groups(int handle) noexcept : _impl(impl::create_metric_groups(handle)) {
 }
 
 void metric_groups::clear() {
-    _impl = impl::create_metric_groups();
+    const auto current_handle = _impl->get_handle();
+    _impl = impl::create_metric_groups(current_handle);
 }
 
-metric_groups::metric_groups(std::initializer_list<metric_group_definition> mg) : _impl(impl::create_metric_groups()) {
+metric_groups::metric_groups(std::initializer_list<metric_group_definition> mg, int handle) : _impl(impl::create_metric_groups(handle)) {
     for (auto&& i : mg) {
         add_group(i.name, i.metrics);
     }
@@ -61,10 +66,9 @@ metric_groups& metric_groups::add_group(const group_name_type& name, const std::
     _impl->add_group(name, l);
     return *this;
 }
-metric_group::metric_group() noexcept = default;
+metric_group::metric_group(int handle) noexcept : metric_groups(handle) {}
 metric_group::~metric_group() = default;
-metric_group::metric_group(const group_name_type& name, std::initializer_list<metric_definition> l) {
-    add_group(name, l);
+metric_group::metric_group(const group_name_type& name, std::initializer_list<metric_definition> l, int handle) : metric_groups({metric_group_definition(name, l)}, handle) {
 }
 
 metric_group_definition::metric_group_definition(const group_name_type& name, std::initializer_list<metric_definition> l) : name(name), metrics(l) {
@@ -110,11 +114,11 @@ options::options(program_options::option_group* parent_group)
 {
 }
 
-future<> configure(const options& opts) {
+future<> configure(const options& opts, int handle) {
     impl::config c;
     c.hostname = opts.metrics_hostname.get_value();
-    return smp::invoke_on_all([c] {
-        impl::get_local_impl()->set_config(c);
+    return smp::invoke_on_all([c, handle] {
+        impl::get_local_impl(handle)->set_config(c);
     });
 }
 
@@ -197,6 +201,17 @@ bool impl::impl::apply_relabeling(const relabel_config& rc, metric_info& info) {
     return true;
 }
 
+future<>
+replicate_metric_families(
+        int source_handle,
+        std::unordered_multimap<seastar::sstring, int> metric_families_to_replicate) {
+    // The closure is not mutable, so its captures are const and std::move() on
+    // them would silently copy; pass the map as-is so the copy per call is explicit.
+    return smp::invoke_on_all([source_handle, families = std::move(metric_families_to_replicate)] {
+        impl::get_local_impl(source_handle)->set_metric_families_to_replicate(families);
+    });
+}
+
 bool label_instance::operator!=(const label_instance& id2) const {
     auto& id1 = *this;
     return !(id1 == id2);
@@ -330,15 +345,15 @@ metric_definition_impl& metric_definition_impl::set_skip_when_empty(bool skip) n
     return *this;
 }
 
-std::unique_ptr<metric_groups_def> create_metric_groups() {
-    return  std::make_unique<metric_groups_impl>();
+std::unique_ptr<metric_groups_def> create_metric_groups(int handle) {
+    return  std::make_unique<metric_groups_impl>(handle);
 }
 
-metric_groups_impl::metric_groups_impl() {}
+metric_groups_impl::metric_groups_impl(int handle) : _handle(handle) {}
 
 metric_groups_impl::~metric_groups_impl() {
     for (const auto& i : _registration) {
-        unregister_metric(i->info().id);
+        unregister_metric(i->info().id, _handle);
     }
 }
 
@@ -356,14 +371,15 @@ metric_groups_impl& metric_groups_impl::add_metric(group_name_type name, const m
     // than where the actual metrics are added.
     // Hence, the shared_ptr owning shard check would fail so we do it only here.
     if (_impl == nullptr) {
-        _impl = get_local_impl();
+        _impl = get_local_impl(_handle);
     }
 
-    auto internalized_labels = get_local_impl()->internalize_labels(md._impl->labels);
+    auto internalized_labels = get_local_impl(_handle)->internalize_labels(md._impl->labels);
 
     metric_id id(name, md._impl->name, internalized_labels);
 
-    auto reg = get_local_impl()->add_registration(id, md._impl->type, md._impl->f, md._impl->d, md._impl->enabled, md._impl->_skip_when_empty, md._impl->aggregate_labels);
+    auto reg = get_local_impl(_handle)->add_registration(
+            id, md._impl->type, md._impl->f, md._impl->d, md._impl->enabled, md._impl->_skip_when_empty, md._impl->aggregate_labels);
 
     _registration.push_back(std::move(reg));
     return *this;
@@ -383,6 +399,10 @@ metric_groups_impl& metric_groups_impl::add_group(group_name_type name, const st
     return *this;
 }
 
+int metric_groups_impl::get_handle() const {
+    return _handle;
+}
+
 bool metric_id::operator<(
         const metric_id& id2) const {
     return as_tuple() < id2.as_tuple();
@@ -403,14 +423,20 @@ bool metric_id::operator==(
     return as_tuple() == id2.as_tuple();
 }
 
-// Unfortunately, metrics_impl can not be shared because it
-// need to be available before the first users (reactor) will call it
+shared_ptr<impl> get_local_impl(int handle) {
+    auto& impls = get_metric_implementations();
+    auto [it, inserted] = impls.try_emplace(handle);
+
+    if (inserted) {
+        it->second = ::seastar::make_shared<impl>();
+    }
 
-shared_ptr<impl>  get_local_impl() {
-    static thread_local auto the_impl = ::seastar::make_shared<impl>();
-    return the_impl;
+    return it->second;
 }
+
 void impl::remove_registration(const metric_id& id) {
+    remove_metric_replica_if_required(id);
+
     auto i = get_value_map().find(id.full_name());
     if (i != get_value_map().end()) {
         auto j = i->second.find(id.labels());
@@ -425,20 +451,51 @@ void impl::remove_registration(const metric_id& id) {
     }
 }
 
-void unregister_metric(const metric_id & id) {
-    get_local_impl()->remove_registration(id);
+void impl::remove_metric_replica_family(const seastar::sstring& name,
+                                        int destination_handle) const {
+    // Remove every metric of the family `name` from the destination impl.
+    const auto family_it = _value_map.find(name);
+    if (family_it == _value_map.end()) {
+        // No such family in this impl: nothing to do.
+        return;
+    }
+
+    const auto target = get_local_impl(destination_handle);
+    for (const auto& [labels, metric_ptr] : family_it->second) {
+        // The removal is keyed by the id of the local metric.
+        remove_metric_replica(metric_ptr->get_id(), target);
+    }
+}
+
+void impl::remove_metric_replica(const metric_id& id,
+                                 const shared_ptr<impl>& destination) const {
+    destination->remove_registration(id);
+}
+
+void impl::remove_metric_replica_if_required(const metric_id& id) const {
+    // Each matching entry names one destination handle for this metric's family.
+    const auto [first, last] = _metric_families_to_replicate.equal_range(id.full_name());
+    for (auto it = first; it != last; ++it) {
+        const int destination_handle = it->second;
+        remove_metric_replica(id, get_local_impl(destination_handle));
+    }
+}
 
-const value_map& get_value_map() {
-    return get_local_impl()->get_value_map();
+void unregister_metric(const metric_id & id, int handle) {
+    get_local_impl(handle)->remove_registration(id);
 }
 
-foreign_ptr<values_reference> get_values() {
+const value_map& get_value_map(int handle) {
+    return get_local_impl(handle)->get_value_map();
+}
+
+foreign_ptr<values_reference> get_values(int handle) {
     shared_ptr<values_copy> res_ref = ::seastar::make_shared<values_copy>();
     auto& res = *(res_ref.get());
     auto& mv = res.values;
-    res.metadata = get_local_impl()->metadata();
-    auto & functions = get_local_impl()->functions();
+    auto impl = get_local_impl(handle);
+    res.metadata = impl->metadata();
+    auto & functions = impl->functions();
     for (auto&& i : functions) {
         value_vector values;
         for (auto&& v : i) {
@@ -464,6 +521,67 @@ void impl::gc_internalized_labels() {
     }
 }
 
+void
+impl::set_metric_families_to_replicate(
+        std::unordered_multimap<seastar::sstring, int> metric_families_to_replicate) {
+    // Remove all previous metric replica families
+    for (const auto& [name, destination]: _metric_families_to_replicate) {
+        remove_metric_replica_family(name, destination);
+    }
+
+    // Replicate the specified metric families.
+    for (const auto& [name, destination]: metric_families_to_replicate) {
+        replicate_metric_family(name, destination);
+    }
+
+    _metric_families_to_replicate = std::move(metric_families_to_replicate);
+}
+
+void impl::replicate_metric_family(const seastar::sstring& name,
+                                   int destination_handle) const {
+    // Register every metric currently found under `name` with the impl
+    // identified by destination_handle; an unknown family is ignored.
+    const auto family_it = _value_map.find(name);
+    if (family_it == _value_map.end()) {
+        return;
+    }
+    const auto& family = family_it->second;
+    const auto target = get_local_impl(destination_handle);
+    for (const auto& [labels, metric_ptr] : family) {
+        replicate_metric(metric_ptr, family, target, destination_handle);
+    }
+}
+
+void impl::replicate_metric_if_required(const shared_ptr<registered_metric>& metric) const {
+    // Forward the metric to each destination its family is configured to be
+    // replicated to; with no matching entries the loop body never runs.
+    const auto family_name = metric->get_id().full_name();
+    const auto [first, last] = _metric_families_to_replicate.equal_range(family_name);
+    for (auto it = first; it != last; ++it) {
+        const int destination_handle = it->second;
+        // at(): the family is expected to be present in the local value map already.
+        const auto& family = _value_map.at(it->first);
+        replicate_metric(metric, family, get_local_impl(destination_handle), destination_handle);
+    }
+}
+
+void impl::replicate_metric(const shared_ptr<registered_metric>& metric,
+                            const metric_family& family,
+                            const shared_ptr<impl>& destination,
+                            int destination_handle) const {
+    const auto& family_info = family.info();
+    metric_type type = { .base_type = family_info.type,
+                         .type_name = family_info.inherit_type };
+
+    destination->add_registration(metric->get_id(),
+                                  type,
+                                  metric->get_function(),
+                                  family_info.d,
+                                  metric->is_enabled(),
+                                  metric->get_skip_when_empty(),
+                                  family_info.aggregate_labels);
+}
+
 void impl::update_metrics_if_needed() {
     if (_dirty) {
         // Forcing the metadata to an empty initialization
@@ -540,9 +658,24 @@ register_ref impl::add_registration(const metric_id& id, const metric_type& type
     }
     dirty();
 
+    replicate_metric_if_required(rm);
+
     return rm;
 }
 
+void impl::update_aggregate_labels(const metric_id& id,
+                                   const std::vector<label>& aggregate_labels) {
+    const auto family_it = _value_map.find(id.full_name());
+    if (family_it == _value_map.end()) {
+        return; // unknown family: nothing to update
+    }
+    // Replace the family's aggregate label names with the names of the given labels.
+    auto& names = family_it->second.info().aggregate_labels;
+    names.clear();
+    for (const label& l : aggregate_labels) { names.push_back(l.name()); }
+    dirty();
+}
+
 future<metric_relabeling_result> impl::set_relabel_configs(const std::vector<relabel_config>& relabel_configs) {
     _relabel_configs = relabel_configs;
     metric_relabeling_result conflicts{0};
@@ -616,6 +749,11 @@ void impl::set_metric_family_configs(const std::vector<metric_family_config>& fa
         }
     }
 }
+
+int default_handle() {
+    return 0;
+}
+
 }
 
 const bool metric_disabled = false;
@@ -668,5 +806,11 @@ histogram histogram::operator+(histogram&& c) const {
     return std::move(c);
 }
 
+void update_aggregate_labels(const group_name_type& group_name,
+                             const metric_name_type& metric_name,
+                             const std::vector<label>& aggregate_labels) {
+    impl::metric_id id(group_name, metric_name, {});
+    impl::get_local_impl()->update_aggregate_labels(id, aggregate_labels);
+}
 }
 }
diff --git a/src/core/prometheus.cc b/src/core/prometheus.cc
index 7b8b6115ceb..27bbdad9dc0 100644
--- a/src/core/prometheus.cc
+++ b/src/core/prometheus.cc
@@ -561,17 +561,15 @@ class metrics_families_per_shard {
     /** @} */
 };
 
-static future<metrics_families_per_shard> get_map_value() {
-    metrics_families_per_shard vec;
+static future<> get_map_value(metrics_families_per_shard& vec, int handle) {
     vec.resize(this_smp_shard_count());
-    co_await parallel_for_each(std::views::iota(0u, this_smp_shard_count()), [&vec] (auto cpu) {
-        return smp::submit_to(cpu, [] {
-            return mi::get_values();
+    co_await parallel_for_each(std::views::iota(0u, this_smp_shard_count()), [handle, &vec] (auto cpu) {
+        return smp::submit_to(cpu, [handle] {
+            return mi::get_values(handle);
         }).then([&vec, cpu] (auto res) {
             vec[cpu] = std::move(res);
         });
     });
-    co_return vec;
 }
 
 /*!
@@ -1111,7 +1109,8 @@ class metrics_handler : public httpd::handler_base  {
 
     future<> write_body(write_body_args args, output_stream<char>&& out_stream) {
         auto s = std::move(out_stream);
-        auto families = co_await get_map_value();
+        metrics_families_per_shard families;
+        co_await get_map_value(families, _ctx.handle);
         bool use_protobuf = args.use_protobuf_format;
 
         write_context context{
@@ -1138,7 +1137,7 @@ std::function<bool(const mi::labels_type&)> metrics_handler::_true_function = []
 };
 
 future<> add_prometheus_routes(httpd::http_server& server, config ctx) {
-    server._routes.put(httpd::GET, "/metrics", new metrics_handler(ctx));
+    server._routes.put(httpd::GET, ctx.route, new metrics_handler(ctx));
     return make_ready_future<>();
 }
 
diff --git a/src/core/reactor.cc b/src/core/reactor.cc
index 60e86000c67..7af5485737c 100644
--- a/src/core/reactor.cc
+++ b/src/core/reactor.cc
@@ -124,6 +124,7 @@
 #include <seastar/core/make_task.hh>
 #include <seastar/core/memory.hh>
 #include <seastar/core/metrics.hh>
+#include <seastar/core/metrics_api.hh>
 #include <seastar/core/posix.hh>
 #include <seastar/core/prefetch.hh>
 #include <seastar/core/print.hh>
@@ -144,10 +145,12 @@
 #include <seastar/core/with_scheduling_group.hh>
 #include <seastar/core/internal/buffer_allocator.hh>
 #include <seastar/core/disk_params.hh>
+#include <seastar/core/internal/cpu_profiler.hh>
 #include <seastar/core/internal/io_desc.hh>
 #include <seastar/core/internal/uname.hh>
 #include <seastar/core/internal/stall_detector.hh>
 #include <seastar/core/internal/run_in_background.hh>
+#include <seastar/core/internal/timers.hh>
 #include <seastar/coroutine/all.hh>
 #include <seastar/net/native-stack.hh>
 #include <seastar/net/packet.hh>
@@ -169,6 +172,7 @@
 #include "core/reactor_backend.hh"
 #include "core/syscall_result.hh"
 #include "core/thread_pool.hh"
+#include "core/scollectd-impl.hh"
 #include "syscall_work_queue.hh"
 #include "cgroup.hh"
 #ifdef SEASTAR_HAVE_DPDK
@@ -1059,7 +1063,7 @@ reactor::task_queue::register_stats() {
 
     register_net_metrics_for_scheduling_group(new_metrics, _id, group_label);
 
-    _metrics = std::exchange(new_metrics, {});
+    _metrics = std::exchange(new_metrics, sm::metric_groups{});
 }
 
 void
@@ -1118,6 +1122,7 @@ reactor::reactor(std::shared_ptr<seastar::smp> smp, alien::instance& alien, unsi
     , _task_quota_timer(file_desc::timerfd_create(CLOCK_MONOTONIC, TFD_CLOEXEC))
     , _id(id)
     , _cpu_stall_detector(internal::make_cpu_stall_detector())
+    , _cpu_profiler(internal::make_cpu_profiler())
     , _cpu_sched(nullptr, 0)
     , _thread_pool(std::make_unique<thread_pool>(seastar::format("syscall-{}", id), _notify_eventfd)) {
     /*
@@ -1137,6 +1142,7 @@ reactor::reactor(std::shared_ptr<seastar::smp> smp, alien::instance& alien, unsi
     sigset_t mask;
     sigemptyset(&mask);
     sigaddset(&mask, internal::cpu_stall_detector::signal_number());
+    sigaddset(&mask, internal::cpu_profiler::signal_number());
     auto r = ::pthread_sigmask(SIG_UNBLOCK, &mask, NULL);
     SEASTAR_ASSERT(r == 0);
     memory::set_reclaim_hook([this] (std::function<void ()> reclaim_fn) {
@@ -1155,6 +1161,7 @@ reactor::~reactor() {
     sigset_t mask;
     sigemptyset(&mask);
     sigaddset(&mask, internal::cpu_stall_detector::signal_number());
+    sigaddset(&mask, internal::cpu_profiler::signal_number());
     auto r = ::pthread_sigmask(SIG_BLOCK, &mask, NULL);
     SEASTAR_ASSERT(r == 0);
 
@@ -1230,6 +1237,189 @@ void reactor::start_handling_signal() {
 
 namespace internal {
 
+posix_timer::posix_timer(timer_cfg cfg, clockid_t clock_id) {
+    struct sigevent sev = {};
+    sev.sigev_notify = SIGEV_THREAD_ID;
+    sev.sigev_signo = cfg.signal_number;
+#ifndef sigev_notify_thread_id
+#define sigev_notify_thread_id _sigev_un._tid
+#endif
+    sev.sigev_notify_thread_id = syscall(SYS_gettid); // notify the thread that creates the timer
+    // timer_create() returns -1 with the cause in errno; the return value is not an error code.
+    if (timer_create(clock_id, &sev, &_timer) == -1) {
+        throw std::system_error(errno, std::system_category(), "timer_create() failed");
+    }
+}
+
+posix_timer::~posix_timer() {
+    timer_delete(_timer);
+}
+
+void posix_timer::arm_timer(std::chrono::nanoseconds duration) {
+    auto its = posix::to_relative_itimerspec(duration, 0s);
+    timer_settime(_timer, 0, &its, nullptr);
+}
+
+void posix_timer::disarm_timer() {
+    auto its = posix::to_relative_itimerspec(0s,  0s);
+    timer_settime(_timer, 0, &its, nullptr);
+}
+
+static long
+perf_event_open(struct perf_event_attr* hw_event, pid_t pid, int cpu, int group_fd, unsigned long flags) {
+    return syscall(__NR_perf_event_open, hw_event, pid, cpu, group_fd, flags);
+}
+
+linux_perf_event linux_perf_event::try_make(timer_cfg cfg) {
+    ::perf_event_attr pea = {
+        .type = PERF_TYPE_SOFTWARE,
+        .size = sizeof(pea),
+        .config = PERF_COUNT_SW_TASK_CLOCK, // more likely to work on virtual machines than hardware events
+        .sample_period = 1'000'000'000, // Needs non-zero value or PERF_IOC_PERIOD gets confused
+        .sample_type = PERF_SAMPLE_CALLCHAIN,
+        .disabled = 1,
+        .exclude_callchain_user = 1,  // we're using backtrace() to capture the user callchain
+        .wakeup_events = 1,
+    };
+    unsigned long flags = 0;
+    if (internal::kernel_uname().whitelisted({"3.14"})) {
+        flags |= PERF_FLAG_FD_CLOEXEC;
+    }
+    int fd = perf_event_open(&pea, 0, -1, -1, flags);
+    if (fd == -1) {
+        throw std::system_error(errno, std::system_category(), "perf_event_open() failed");
+    }
+    auto desc = file_desc::from_fd(fd);
+    struct f_owner_ex sig_owner = {
+        .type = F_OWNER_TID,
+        .pid = static_cast<pid_t>(syscall(SYS_gettid)),
+    };
+    auto ret1 = ::fcntl(fd, F_SETOWN_EX, &sig_owner);
+    if (ret1 == -1) {
+        abort();
+    }
+    auto ret2 = ::fcntl(fd, F_SETSIG, cfg.signal_number);
+    if (ret2 == -1) {
+        abort();
+    }
+    auto fd_flags = ::fcntl(fd, F_GETFL);
+    if (fd_flags == -1) {
+        abort();
+    }
+    auto ret3 = ::fcntl(fd, F_SETFL, fd_flags | O_ASYNC);
+    if (ret3 == -1) {
+        abort();
+    }
+
+    return linux_perf_event(std::move(desc));
+}
+
+linux_perf_event::linux_perf_event(file_desc fd) : _fd(std::move(fd)) {
+    void* ret = ::mmap(nullptr, 2*getpagesize(), PROT_READ|PROT_WRITE, MAP_SHARED, _fd.get(), 0);
+    if (ret == MAP_FAILED) {
+        abort();
+    }
+    _mmap = static_cast<struct ::perf_event_mmap_page*>(ret);
+    _data_area = reinterpret_cast<char*>(_mmap) + getpagesize();
+    _data_area_mask = getpagesize() - 1;
+}
+
+linux_perf_event::linux_perf_event(linux_perf_event&& o)
+      : _fd(std::move(o._fd))
+      , _enabled(o._enabled)
+      , _current_period(o._current_period)
+      , _mmap(o._mmap)
+      , _data_area(o._data_area)
+      , _data_area_mask(o._data_area_mask)
+      , _next_signal_time(o._next_signal_time) {
+    o._mmap = nullptr;
+}
+
+linux_perf_event::~linux_perf_event() {
+    if (_mmap != nullptr) {
+        ::munmap(_mmap, 2*getpagesize());
+    }
+}
+
+void linux_perf_event::arm_timer(std::chrono::nanoseconds period) {
+    uint64_t ns =  period / 1ns;
+    _next_signal_time = reactor::now() + period;
+
+    // clear out any existing records in the ring buffer, so when we get interrupted next time
+    // we have only the stack associated with that interrupt, and so we don't overflow.
+    data_area_reader(*this).skip_all();
+    if (__builtin_expect(_enabled && _current_period == ns, 1)) {
+        // Common case - we're re-arming with the same period, the counter
+        // is already enabled.
+
+        // We want to set the next interrupt to ns from now, and somewhat oddly the
+        // way to do this is PERF_EVENT_IOC_PERIOD, even with the same period as
+        // already configured, see the code at:
+        //
+        // https://elixir.bootlin.com/linux/v5.15.86/source/kernel/events/core.c#L5636
+        //
+        // This change is intentional: kernel commit bad7192b842c83e580747ca57104dd51fe08c223
+        // so we can presumably rely on it.
+        _fd.ioctl(PERF_EVENT_IOC_PERIOD, ns);
+
+    } else {
+        // Uncommon case - we're moving from disabled to enabled, or changing
+        // the period. Issue more calls and be careful.
+        _fd.ioctl(PERF_EVENT_IOC_DISABLE, 0); // avoid false alarms while we modify stuff
+        _fd.ioctl(PERF_EVENT_IOC_PERIOD, ns);
+        _fd.ioctl(PERF_EVENT_IOC_RESET, 0);
+        _fd.ioctl(PERF_EVENT_IOC_ENABLE, 0);
+        _enabled = true;
+        _current_period = ns;
+    }
+}
+
+void linux_perf_event::disarm_timer() {
+    _fd.ioctl(PERF_EVENT_IOC_DISABLE, 0);
+    _enabled = false;
+}
+
+bool linux_perf_event::is_spurious_signal() {
+    // If the current time is before the expected signal time, it is
+    // probably a spurious signal. One reason this could occur is that
+    // PERF_EVENT_IOC_PERIOD does not reset the current overflow point
+    // on kernels prior to 3.14 (or 3.7 on Arm).
+    return reactor::now() < _next_signal_time;
+}
+
+void linux_perf_event::kernel_backtrace::read_backtrace(std::function<void (uintptr_t)> fn) {
+    if (_reader.have_data()) {
+        auto nr = _reader.read_u64();
+        for (uint64_t i = 0; i < nr; ++i) {
+            // TODO: the first u64 here will be a non-address token
+            // used by perf to indicate which type of callchain this is.
+            // Should we check that it is PERF_CONTEXT_KERNEL and skip
+            // outputting that value as it's not an address?
+            // See: https://github.com/torvalds/linux/commit/f9188e023c248d73f
+            fn(uintptr_t(_reader.read_u64()));
+        }
+    }
+}
+
+std::optional<linux_perf_event::kernel_backtrace> linux_perf_event::try_get_kernel_backtrace() {
+    // Walk the records in the perf data area until a sample record is found;
+    // the reader is then handed over, positioned just past that record's header.
+    data_area_reader reader(*this);
+
+    while (reader.have_data()) {
+        const ::perf_event_header header = reader.read_struct<perf_event_header>();
+
+        if (header.type == PERF_RECORD_SAMPLE) {
+            return {kernel_backtrace{std::move(reader)}};
+        }
+        // Not a sample: skip the rest of this record (the header has been consumed already).
+        reader.skip(header.size - sizeof(header));
+    }
+
+    // Ran out of data without seeing a sample record.
+    return std::nullopt;
+}
+
 cpu_stall_detector::cpu_stall_detector(cpu_stall_detector_config cfg)
         : _shard_id(this_shard_id()) {
     // glib's backtrace() calls dlopen("libgcc_s.so.1") once to resolve unwind related symbols.
@@ -1247,23 +1437,8 @@ cpu_stall_detector::cpu_stall_detector(cpu_stall_detector_config cfg)
     // note: if something is added here that can, it should take care to destroy _timer.
 }
 
-cpu_stall_detector_posix_timer::cpu_stall_detector_posix_timer(cpu_stall_detector_config cfg) : cpu_stall_detector(cfg) {
-    struct sigevent sev = {};
-    sev.sigev_notify = SIGEV_THREAD_ID;
-    sev.sigev_signo = signal_number();
-#ifndef sigev_notify_thread_id
-#define sigev_notify_thread_id _sigev_un._tid
-#endif
-    sev.sigev_notify_thread_id = syscall(SYS_gettid);
-    int err = timer_create(CLOCK_THREAD_CPUTIME_ID, &sev, &_timer);
-    if (err) {
-        throw std::system_error(std::error_code(err, std::system_category()));
-    }
-}
-
-cpu_stall_detector_posix_timer::~cpu_stall_detector_posix_timer() {
-    timer_delete(_timer);
-}
+cpu_stall_detector_posix_timer::cpu_stall_detector_posix_timer(cpu_stall_detector_config cfg)
+    : cpu_stall_detector(cfg), _timer({signal_number()}) { }
 
 cpu_stall_detector_config
 cpu_stall_detector::get_config() const {
@@ -1332,8 +1507,8 @@ cpu_stall_detector::reset_suppression_state(sched_clock::time_point now) {
 }
 
 void cpu_stall_detector_posix_timer::arm_timer() {
-    auto its = posix::to_relative_itimerspec(_threshold * _report_at + _slack, 0s);
-    timer_settime(_timer, 0, &its, nullptr);
+    std::chrono::nanoseconds dur = _threshold * _report_at + _slack;
+    _timer.arm_timer(dur);
 }
 
 void cpu_stall_detector::start_task_run(sched_clock::time_point now) {
@@ -1354,153 +1529,52 @@ void cpu_stall_detector::end_task_run(sched_clock::time_point now) {
 }
 
 void cpu_stall_detector_posix_timer::start_sleep() {
-    auto its = posix::to_relative_itimerspec(0s,  0s);
-    timer_settime(_timer, 0, &its, nullptr);
+    _timer.disarm_timer();
     _rearm_timer_at = reactor::now();
 }
 
 void cpu_stall_detector::end_sleep() {
 }
 
-static long
-perf_event_open(struct perf_event_attr* hw_event, pid_t pid, int cpu, int group_fd, unsigned long flags) {
-    return syscall(__NR_perf_event_open, hw_event, pid, cpu, group_fd, flags);
-}
-
-cpu_stall_detector_linux_perf_event::cpu_stall_detector_linux_perf_event(file_desc fd, cpu_stall_detector_config cfg)
-        : cpu_stall_detector(cfg), _fd(std::move(fd)) {
-    void* ret = ::mmap(nullptr, 2*getpagesize(), PROT_READ|PROT_WRITE, MAP_SHARED, _fd.get(), 0);
-    if (ret == MAP_FAILED) {
-        abort();
-    }
-    _mmap = static_cast<struct ::perf_event_mmap_page*>(ret);
-    _data_area = reinterpret_cast<char*>(_mmap) + getpagesize();
-    _data_area_mask = getpagesize() - 1;
-}
-
-cpu_stall_detector_linux_perf_event::~cpu_stall_detector_linux_perf_event() {
-    ::munmap(_mmap, 2*getpagesize());
+cpu_stall_detector_linux_perf_event::cpu_stall_detector_linux_perf_event(linux_perf_event perf_event, cpu_stall_detector_config cfg)
+        : cpu_stall_detector(cfg), _perf_event(std::move(perf_event)) {
 }
 
 void
 cpu_stall_detector_linux_perf_event::arm_timer() {
     auto period = _threshold * _report_at + _slack;
-    uint64_t ns =  period / 1ns;
-    _next_signal_time = reactor::now() + period;
-
-    // clear out any existing records in the ring buffer, so when we get interrupted next time
-    // we have only the stack associated with that interrupt, and so we don't overflow.
-    data_area_reader(*this).skip_all();
-    if (__builtin_expect(_enabled && _current_period == ns, 1)) {
-        // Common case - we're re-arming with the same period, the counter
-        // is already enabled.
-
-        // We want to set the next interrupt to ns from now, and somewhat oddly the
-        // way to do this is PERF_EVENT_IOC_PERIOD, even with the same period as
-        // already configured, see the code at:
-        //
-        // https://elixir.bootlin.com/linux/v5.15.86/source/kernel/events/core.c#L5636
-        //
-        // Ths change is intentional: kernel commit bad7192b842c83e580747ca57104dd51fe08c223
-        // so we can resumably rely on it.
-        _fd.ioctl(PERF_EVENT_IOC_PERIOD, ns);
-
-    } else {
-        // Uncommon case - we're moving from disabled to enabled, or changing
-        // the period. Issue more calls and be careful.
-        _fd.ioctl(PERF_EVENT_IOC_DISABLE, 0); // avoid false alarms while we modify stuff
-        _fd.ioctl(PERF_EVENT_IOC_PERIOD, ns);
-        _fd.ioctl(PERF_EVENT_IOC_RESET, 0);
-        _fd.ioctl(PERF_EVENT_IOC_ENABLE, 0);
-        _enabled = true;
-        _current_period = ns;
-    }
+    _perf_event.arm_timer(period);
 }
 
 void
 cpu_stall_detector_linux_perf_event::start_sleep() {
-    _fd.ioctl(PERF_EVENT_IOC_DISABLE, 0);
-    _enabled = false;
+    _perf_event.disarm_timer();
 }
 
 bool
 cpu_stall_detector_linux_perf_event::is_spurious_signal() {
-    // If the current time is before the expected signal time, it is
-    // probably a spurious signal. One reason this could occur is that
-    // PERF_EVENT_IOC_PERIOD does not reset the current overflow point
-    // on kernels prior to 3.14 (or 3.7 on Arm).
-    return reactor::now() < _next_signal_time;
+    return _perf_event.is_spurious_signal();
 }
 
 void
 cpu_stall_detector_linux_perf_event::maybe_report_kernel_trace(backtrace_buffer& buf) {
-    data_area_reader reader(*this);
-    auto current_record = [&] () -> ::perf_event_header {
-        return reader.read_struct<perf_event_header>();
-    };
-
-    while (reader.have_data()) {
-        auto record = current_record();
-
-        if (record.type != PERF_RECORD_SAMPLE) {
-            reader.skip(record.size - sizeof(record));
-            continue;
-        }
+    auto kernel_bt = _perf_event.try_get_kernel_backtrace();
+    if(kernel_bt) {
+        // Write into the caller's `buf`; a shadowing local would lose the trace.
+        buf.append("kernel callstack:");
+        // Emit every frame of the sampled call chain as " 0x<hex>" on one line.
+        kernel_bt->read_backtrace([&] (uintptr_t addr) {
+            buf.append(" 0x");
+            buf.append_hex(addr);
+        });
 
-        auto nr = reader.read_u64();
-        if (nr > 0) {
-            buf.append("kernel callstack:");
-            for (uint64_t i = 0; i < nr; ++i) {
-                buf.append(" 0x");
-                buf.append_hex(uintptr_t(reader.read_u64()));
-            }
-            buf.append("\n");
-        }
-    };
+        buf.append("\n");
+    }
 }
 
 std::unique_ptr<cpu_stall_detector_linux_perf_event>
 cpu_stall_detector_linux_perf_event::try_make(cpu_stall_detector_config cfg) {
-    ::perf_event_attr pea = {
-        .type = PERF_TYPE_SOFTWARE,
-        .size = sizeof(pea),
-        .config = PERF_COUNT_SW_TASK_CLOCK, // more likely to work on virtual machines than hardware events
-        .sample_period = 1'000'000'000, // Needs non-zero value or PERF_IOC_PERIOD gets confused
-        .sample_type = PERF_SAMPLE_CALLCHAIN,
-        .disabled = 1,
-        .exclude_callchain_user = 1,  // we're using backtrace() to capture the user callchain
-        .wakeup_events = 1,
-    };
-    unsigned long flags = 0;
-    if (internal::kernel_uname().whitelisted({"3.14"})) {
-        flags |= PERF_FLAG_FD_CLOEXEC;
-    }
-    int fd = perf_event_open(&pea, 0, -1, -1, flags);
-    if (fd == -1) {
-        throw std::system_error(errno, std::system_category(), "perf_event_open() failed");
-    }
-    auto desc = file_desc::from_fd(fd);
-    struct f_owner_ex sig_owner = {
-        .type = F_OWNER_TID,
-        .pid = static_cast<pid_t>(syscall(SYS_gettid)),
-    };
-    auto ret1 = ::fcntl(fd, F_SETOWN_EX, &sig_owner);
-    if (ret1 == -1) {
-        abort();
-    }
-    auto ret2 = ::fcntl(fd, F_SETSIG, signal_number());
-    if (ret2 == -1) {
-        abort();
-    }
-    auto fd_flags = ::fcntl(fd, F_GETFL);
-    if (fd_flags == -1) {
-        abort();
-    }
-    auto ret3 = ::fcntl(fd, F_SETFL, fd_flags | O_ASYNC);
-    if (ret3 == -1) {
-        abort();
-    }
-    return std::make_unique<cpu_stall_detector_linux_perf_event>(std::move(desc), std::move(cfg));
+    return std::make_unique<cpu_stall_detector_linux_perf_event>(linux_perf_event::try_make({signal_number()}), std::move(cfg));
 }
 
 
@@ -1613,8 +1687,32 @@ void reactor::test::set_max_task_backlog(unsigned value) noexcept {
 }
 
 void
-reactor::block_notifier(int) {
-    engine()._cpu_stall_detector->on_signal();
+reactor::block_notifier(int signal) {
+    if(signal == internal::cpu_stall_detector::signal_number()) {
+        engine()._cpu_stall_detector->on_signal();
+    } else {
+        engine()._cpu_profiler->on_signal();
+    }
+}
+
+bool reactor::get_cpu_profiler_enabled() {
+    return _cpu_profiler->is_enabled();
+}
+
+void reactor::set_cpu_profiler_enabled(bool b) {
+    _cpu_profiler->update_config({b, _cpu_profiler->period()});
+}
+
+std::chrono::nanoseconds reactor::get_cpu_profiler_period() {
+    return _cpu_profiler->period();
+}
+
+void reactor::set_cpu_profiler_period(std::chrono::nanoseconds ns) {
+    _cpu_profiler->update_config({_cpu_profiler->is_enabled(), ns});
+}
+
+size_t reactor::profiler_results(std::vector<cpu_profiler_trace>& results_buffer) {
+    return _cpu_profiler->results(results_buffer);
 }
 
 class crypto_provider_factory {
@@ -1646,6 +1744,11 @@ void reactor::configure(const reactor_options& opts) {
     csdc.oneline = opts.blocked_reactor_report_format_oneline.get_value();
     _cpu_stall_detector->update_config(csdc);
 
+    internal::cpu_profiler_config prof_cfg;
+    prof_cfg.enabled = opts.profiler_enabled.get_value();
+    prof_cfg.period = std::chrono::milliseconds(opts.profiler_sample_period_ms.get_value());
+    _cpu_profiler->update_config(prof_cfg);
+
     if (_cfg.no_poll_aio) {
         _aio_eventfd = pollable_fd(file_desc::eventfd(0, 0));
     }
@@ -3069,8 +3172,7 @@ reactor::wakeup() {
     _sleeping.store(false, std::memory_order_relaxed);
 
     uint64_t one = 1;
-    auto res = ::write(_notify_eventfd.get(), &one, sizeof(one));
-    SEASTAR_ASSERT(res == sizeof(one) && "write(2) failed on _reactor._notify_eventfd");
+    (void)::write(_notify_eventfd.get(), &one, sizeof(one));
 }
 
 void reactor::start_aio_eventfd_loop() {
@@ -3080,7 +3182,7 @@ void reactor::start_aio_eventfd_loop() {
     future<> loop_done = repeat([this] {
         return _aio_eventfd->readable().then([this] {
             char garbage[8];
-            std::ignore = ::read(_aio_eventfd->get_fd(), garbage, 8); // totally uninteresting
+            (void)::read(_aio_eventfd->get_fd(), garbage, 8); // totally uninteresting
             return _stopping ? stop_iteration::yes : stop_iteration::no;
         });
     });
@@ -3095,8 +3197,7 @@ void reactor::stop_aio_eventfd_loop() {
         return;
     }
     uint64_t one = 1;
-    auto res = ::write(_aio_eventfd->get_fd(), &one, 8);
-    SEASTAR_ASSERT(res == 8 && "write(2) failed on _reactor._aio_eventfd");
+    (void)::write(_aio_eventfd->get_fd(), &one, 8);
 }
 
 inline
@@ -3372,11 +3473,25 @@ int reactor::do_run() {
     _task_quota_timer.timerfd_settime(0, its);
     auto& task_quote_itimerspec = its;
 
+    // Ensure that the same signal isn't being used more than once.
+    auto set_signal = [](sigset_t* mask, int s) {
+        SEASTAR_ASSERT(!sigismember(mask, s));
+        sigaddset(mask, s);
+    };
+
+    sigset_t block_mask;
+    sigemptyset(&block_mask);
+    set_signal(&block_mask, internal::cpu_stall_detector::signal_number());
+    set_signal(&block_mask, internal::cpu_profiler::signal_number());
+
     struct sigaction sa_block_notifier = {};
     sa_block_notifier.sa_handler = &reactor::block_notifier;
     sa_block_notifier.sa_flags = SA_RESTART;
+    sa_block_notifier.sa_mask = block_mask;
     auto r = sigaction(internal::cpu_stall_detector::signal_number(), &sa_block_notifier, nullptr);
     SEASTAR_ASSERT(r == 0);
+    r = sigaction(internal::cpu_profiler::signal_number(), &sa_block_notifier, nullptr);
+    SEASTAR_ASSERT(r == 0);
 
     bool idle = false;
 
@@ -3386,6 +3501,7 @@ int reactor::do_run() {
     const noncopyable_function<bool()> pure_check_for_work = [this] () {
         return pure_poll_once() || have_more_tasks();
     };
+    _cpu_profiler->start();
     while (true) {
         _cpu_sched.run_some_tasks();
         if (_stopped) {
@@ -3425,10 +3541,12 @@ int reactor::do_run() {
                         struct itimerspec zero_itimerspec = {};
                         _task_quota_timer.timerfd_settime(0, zero_itimerspec);
                         _cpu_stall_detector->start_sleep();
+                        _cpu_profiler->stop();
 
                         wait_and_process_events();
                         pollers_exit_interrupt_mode();
 
+                        _cpu_profiler->start();
                         _cpu_stall_detector->end_sleep();
                         // We may have slept for a while, so freshen idle_end
                         idle_end = now();
@@ -3456,6 +3574,8 @@ int reactor::do_run() {
     if (_id == 0) {
         _smp->join_all();
     }
+
+    _cpu_profiler->stop();
     // To prevent ordering issues from rising, destroy the I/O queue explicitly at this point.
     // This is needed because the reactor is destroyed from the thread_local destructors. If
     // the I/O queue happens to use any other infrastructure that is also kept this way (for
@@ -3928,7 +4048,6 @@ static program_options::selection_value<crypto_provider_factory> create_crypto_p
 #ifdef SEASTAR_HAVE_GNUTLS
     candidates.push_back({"gnutls", {new crypto_provider_factory(internal::crypto::create_gnutls_provider), deleter}, {}});
 #endif
-
 #ifdef SEASTAR_HAVE_OPENSSL
     candidates.push_back({"openssl", {new crypto_provider_factory(internal::crypto::create_openssl_provider), deleter}, {}});
 #endif
@@ -3994,6 +4113,8 @@ reactor_options::reactor_options(program_options::option_group* parent_group)
     , blocked_reactor_notify_ms(*this, "blocked-reactor-notify-ms", 25, "threshold in miliseconds over which the reactor is considered blocked if no progress is made")
     , blocked_reactor_reports_per_minute(*this, "blocked-reactor-reports-per-minute", 5, "Maximum number of backtraces reported by stall detector per minute")
     , blocked_reactor_report_format_oneline(*this, "blocked-reactor-report-format-oneline", true, "Print a simplified backtrace on a single line")
+    , profiler_sample_period_ms(*this, "profiler-sample-period-ms", 100, "Profiler sample rate")
+    , profiler_enabled(*this, "profiler-enabled", false, "Enable the profiler")
     , relaxed_dma(*this, "relaxed-dma", "allow using buffered I/O if DMA is not available (reduces performance)")
     , linux_aio_nowait(*this, "linux-aio-nowait", internal::kernel_uname().whitelisted({"4.13"}), // base version where this works
                 "use the Linux NOWAIT AIO feature, which reduces reactor stalls due to aio (autodetected)")
@@ -4061,6 +4182,12 @@ smp_options::smp_options(program_options::option_group* parent_group)
 {
 }
 
+thread_local metrics::impl::metric_implementations metric_impls;
+
+metrics::impl::metric_implementations& metrics::impl::get_metric_implementations() {
+    return metric_impls;
+}
+
 struct reactor_deleter {
     void operator()(reactor* p) {
         p->~reactor();
@@ -4141,6 +4268,9 @@ void smp::cleanup() noexcept {
     _shard_to_numa_node_mapping = decltype(_shard_to_numa_node_mapping)();
     reactor_holder.reset();
     local_engine = nullptr;
+#ifdef SEASTAR_TLS_DUAL_BACKEND
+    internal::crypto::reset_provider();
+#endif
 }
 
 void smp::cleanup_cpu() {
@@ -4341,9 +4471,15 @@ unsigned smp::adjust_max_networking_aio_io_control_blocks(unsigned network_iocbs
 
 void smp::configure(const smp_options& smp_opts, const reactor_options& reactor_opts)
 {
+#ifdef SEASTAR_TLS_DUAL_BACKEND
     // Install the crypto provider before anything else, so it is
     // available to all reactors from the moment they start.
+    //
+    // Only present in dual-backend builds; in single-backend builds the
+    // provider is a static singleton in src/core/crypto.cc and needs no
+    // installation step.
     internal::crypto::set_provider(reactor_opts.crypto_provider.get_selected_candidate()());
+#endif
 
     bool use_transparent_hugepages = !reactor_opts.overprovisioned;
 
@@ -5299,6 +5435,16 @@ future<> destroy_scheduling_supergroup(scheduling_supergroup sg) noexcept {
     });
 }
 
+scheduling_group::stats
+scheduling_group::get_stats() const noexcept {
+    const auto& queue = *engine()._task_queues[_id].get();
+    return {
+        .runtime = queue._runtime,
+        .waittime = queue._waittime,
+        .starvetime = queue._starvetime
+    };
+}
+
 future<scheduling_group>
 create_scheduling_group(sstring name, sstring shortname, float shares, scheduling_supergroup parent) noexcept {
     auto sg = co_await smp::submit_to(0, [name, shortname, shares, parent] {
diff --git a/src/core/reactor_backend.cc b/src/core/reactor_backend.cc
index 04b334961fa..c39f055769d 100644
--- a/src/core/reactor_backend.cc
+++ b/src/core/reactor_backend.cc
@@ -328,6 +328,7 @@ bool aio_storage_context::can_sleep() const {
 
 aio_general_context::aio_general_context(size_t nr)
         : iocbs(new iocb*[nr])
+        , begin(iocbs.get())
         , last(iocbs.get())
         , end(iocbs.get() + nr)
 {
@@ -339,32 +340,50 @@ aio_general_context::~aio_general_context() {
 }
 
 void aio_general_context::queue(linux_abi::iocb* iocb) {
-    SEASTAR_ASSERT(last < end);
-    *last++ = iocb;
+    if (last < end) {
+        *last++ = iocb;
+    } else {
+        iocbs_backlog.push_back(iocb);
+    }
 }
 
 size_t aio_general_context::flush() {
-    auto begin = iocbs.get();
-    using clock = std::chrono::steady_clock;
-    constexpr clock::time_point no_time_point = clock::time_point(clock::duration(0));
-    auto retry_until = no_time_point;
+    auto original_begin = begin;
     while (begin != last) {
         auto r = io_submit(io_context, last - begin, begin);
-        if (__builtin_expect(r > 0, true)) {
-            begin += r;
-            continue;
+        if (__builtin_expect(r <= 0, false)) {
+            // EAGAIN is expected here when "Insufficient resources are available to queue any iocbs" (see io_submit(2)).
+            // This indicates overload on the kernel internal queue.
+            // Returning early below will allow us to reap completions to free up resources for further iocbs.
+            // Abort on any other error, as those indicate an internal error on our side.
+            if (r < 0 && errno != EAGAIN) {
+                on_fatal_internal_error(seastar_logger, format("aio_general_context::flush: io_submit failed with unexpected system error: {}", errno));
+            }
+            break;
         }
-        // errno == EAGAIN is expected here. We don't explicitly assert that
-        // since the assert below prevents an endless loop for any reason.
-        if (retry_until == no_time_point) {
-            // allow retrying for 1 second
-            retry_until = clock::now() + 1s;
-        } else {
-            SEASTAR_ASSERT(clock::now() < retry_until);
+        begin += r;
+    }
+
+    auto nr = begin - original_begin;
+
+    if (nr != 0 && begin == last) {
+        // If we have successfully committed all iocbs (begin == last) then we
+        // reset the pointers. Further, at this point we move iocbs from the
+        // backlog to the main `iocbs` array if there are any.
+        // We only do this once `iocbs` is fully empty to get batching behaviour
+        // and avoid degenerate cases where only one element gets submitted
+        // which would result in excessive shifting of the elements in `iocbs`
+        // array or the backlog.
+        begin = iocbs.get();
+        last = iocbs.get();
+
+        if (!iocbs_backlog.empty()) {
+            auto max_to_copy = std::min(size_t(end - begin), iocbs_backlog.size());
+            last = std::move(iocbs_backlog.begin(), iocbs_backlog.begin() + max_to_copy, begin);
+            iocbs_backlog.erase(iocbs_backlog.begin(), iocbs_backlog.begin() + max_to_copy);
         }
     }
-    auto nr = last - iocbs.get();
-    last = iocbs.get();
+
     return nr;
 }
 
@@ -1970,15 +1989,15 @@ reactor_backend_selector reactor_backend_selector::default_backend() {
 
 std::vector<reactor_backend_selector> reactor_backend_selector::available() {
     std::vector<reactor_backend_selector> ret;
+    if (has_enough_aio_nr() && detect_aio_poll()) {
+        ret.push_back(reactor_backend_selector("linux-aio"));
+    }
+    ret.push_back(reactor_backend_selector("epoll"));
 #ifdef SEASTAR_HAVE_URING
     if (detect_io_uring()) {
         ret.push_back(reactor_backend_selector("io_uring"));
     }
 #endif
-    if (has_enough_aio_nr() && detect_aio_poll()) {
-        ret.push_back(reactor_backend_selector("linux-aio"));
-    }
-    ret.push_back(reactor_backend_selector("epoll"));
     return ret;
 }
 
diff --git a/src/core/reactor_backend.hh b/src/core/reactor_backend.hh
index 99cbb9752bc..edbcc9056cd 100644
--- a/src/core/reactor_backend.hh
+++ b/src/core/reactor_backend.hh
@@ -50,8 +50,12 @@ struct aio_general_context {
     ~aio_general_context();
     internal::linux_abi::aio_context_t io_context{};
     std::unique_ptr<internal::linux_abi::iocb*[]> iocbs;
+    internal::linux_abi::iocb** begin;
     internal::linux_abi::iocb** last;
     internal::linux_abi::iocb** const end;
+    // In case `iocbs` is full, queue here. Use std::deque to avoid oversized
+    // allocations.
+    std::deque<internal::linux_abi::iocb*> iocbs_backlog;
     void queue(internal::linux_abi::iocb* iocb);
     // submit all queued iocbs and return their count.
     size_t flush();
diff --git a/src/core/scollectd.cc b/src/core/scollectd.cc
index 7e20dccc2ab..fc5d82de8cd 100644
--- a/src/core/scollectd.cc
+++ b/src/core/scollectd.cc
@@ -84,12 +84,12 @@ registration::~registration() {
     unregister();
 }
 
-registration::registration(const type_instance_id& id)
-: _id(id), _impl(seastar::metrics::impl::get_local_impl()) {
+registration::registration(const type_instance_id& id, int handle)
+: _id(id), _impl(seastar::metrics::impl::get_local_impl(handle)) {
 }
 
-registration::registration(type_instance_id&& id)
-: _id(std::move(id)), _impl(seastar::metrics::impl::get_local_impl()) {
+registration::registration(type_instance_id&& id, int handle)
+: _id(std::move(id)), _impl(seastar::metrics::impl::get_local_impl(handle)) {
 }
 
 seastar::metrics::impl::metric_id to_metrics_id(const type_instance_id & id) {
@@ -542,7 +542,7 @@ future<> send_metric(const type_instance_id & id,
     return get_impl().send_metric(id, values);
 }
 
-void configure(const options& opts) {
+void configure(const options& opts, int handle) {
     bool enable = opts.collectd.get_value();
     if (!enable) {
         return;
@@ -551,7 +551,7 @@ void configure(const options& opts) {
     auto period = std::chrono::milliseconds(opts.collectd_poll_period.get_value());
 
     auto host = (opts.collectd_hostname.get_value() == "")
-            ? seastar::metrics::impl::get_local_impl()->get_config().hostname
+            ? seastar::metrics::impl::get_local_impl(handle)->get_config().hostname
             : sstring(opts.collectd_hostname.get_value());
 
     // Now create send loops on each cpu
diff --git a/src/core/signal_mutex.cc b/src/core/signal_mutex.cc
new file mode 100644
index 00000000000..308ef0897f1
--- /dev/null
+++ b/src/core/signal_mutex.cc
@@ -0,0 +1,50 @@
+/*
+ * This file is open source software, licensed to you under the terms
+ * of the Apache License, Version 2.0 (the "License").  See the NOTICE file
+ * distributed with this work for additional information regarding copyright
+ * ownership.  You may not use this file except in compliance with the License.
+ *
+ * You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+/*
+ * Copyright (C) 2025 ScyllaDB
+ */
+
+#include <seastar/core/internal/signal_mutex.hh>
+
+namespace seastar::internal {
+
+signal_mutex::guard::~guard() {
+    if (_mutex == nullptr) {
+        return;
+    }
+    // Ensure the subsequent store isn't hoisted by the
+    // compiler into the critical section it's intended to
+    // protect.
+    std::atomic_signal_fence(std::memory_order_release);
+    _mutex->_mutex.store(false, std::memory_order_relaxed);
+}
+
+std::optional<signal_mutex::guard> signal_mutex::try_lock() {
+    if (!_mutex.load(std::memory_order_relaxed)) {
+        _mutex.store(true, std::memory_order_relaxed);
+        // Ensure that this load-then-store sequence isn't
+        // mixed by the compiler into the critical section
+        // it's intended to protect.
+        std::atomic_signal_fence(std::memory_order_acq_rel);
+        return {guard(this)};
+    }
+
+    return std::nullopt;
+}
+
+} // namespace seastar::internal
diff --git a/src/core/thread_pool.cc b/src/core/thread_pool.cc
index 7321c7b874b..10e7cf76bdb 100644
--- a/src/core/thread_pool.cc
+++ b/src/core/thread_pool.cc
@@ -62,8 +62,7 @@ void thread_pool::work(sstring name) {
             std::atomic_thread_fence(std::memory_order_seq_cst);
             if (_main_thread_idle.load(std::memory_order_relaxed)) {
                 uint64_t one = 1;
-                auto res = ::write(_notify_eventfd.get(), &one, 8);
-                SEASTAR_ASSERT(res == 8 && "write(2) failed on _reactor._notify_eventfd");
+                (void)::write(_notify_eventfd.get(), &one, 8);
             }
         }
     }
diff --git a/src/http/client.cc b/src/http/client.cc
index 47e10d48b3c..7b76070a9e0 100644
--- a/src/http/client.cc
+++ b/src/http/client.cc
@@ -40,7 +40,7 @@
 #include <seastar/util/string_utils.hh>
 
 namespace seastar {
-logger http_log("http");
+logger http_log("seastar_http_client");
 namespace http {
 namespace internal {
 
diff --git a/src/http/httpd.cc b/src/http/httpd.cc
index 1784e9960af..3b78c4b81f2 100644
--- a/src/http/httpd.cc
+++ b/src/http/httpd.cc
@@ -188,11 +188,14 @@ static void set_header_connection(http::reply& resp, bool keep_alive) {
     }
 }
 
-void connection::generate_error_reply_and_close(std::unique_ptr<http::request> req, http::reply::status_type status, const sstring& msg) {
+void connection::generate_error_reply_and_close(std::unique_ptr<http::request> req, http::reply::status_type status, const sstring& msg, const sstring &content_type) {
     auto resp = std::make_unique<http::reply>();
     // TODO: Handle HTTP/2.0 when it releases
     resp->set_version(req->_version);
     resp->set_status(status, msg);
+    if (!content_type.empty()) {
+        resp->set_content_type(content_type);
+    }
     set_header_connection(*resp, false);
     _done = true;
     _replies.push(std::move(resp));
@@ -210,6 +213,7 @@ future<> connection::read_one() {
 
         req->_server_address = this->_server_addr;
         req->_client_address = this->_client_addr;
+        req->listener_idx = _listener_idx;
 
         if (_tls) {
             req->protocol_name = "https";
@@ -278,7 +282,7 @@ future<> connection::read_one() {
                     // before passing the request to handler - when we were parsing chunks
                     auto err_req = std::make_unique<http::request>();
                     err_req->_version = version;
-                    generate_error_reply_and_close(std::move(err_req), e.status(), e.str());
+                    generate_error_reply_and_close(std::move(err_req), e.status(), e.str(), e.content_type());
                 });
             });
         });
@@ -478,7 +482,7 @@ future<> http_server::do_accept_one(int which, bool tls) {
     }
     auto local_address = ar.connection.local_address();
     auto conn = std::make_unique<connection>(*this, std::move(ar.connection),
-            std::move(ar.remote_address), std::move(local_address), tls);
+            std::move(ar.remote_address), std::move(local_address), tls, which);
     (void)try_with_gate(_task_gate, [conn = std::move(conn)]() mutable {
         return conn->process().handle_exception([conn = std::move(conn)] (std::exception_ptr ex) {
             hlogger.error("request error: {}", ex);
diff --git a/src/http/routes.cc b/src/http/routes.cc
index 1c006e98a48..618c4656b31 100644
--- a/src/http/routes.cc
+++ b/src/http/routes.cc
@@ -75,10 +75,14 @@ std::unique_ptr<http::reply> routes::exception_reply(std::exception_ptr eptr) {
         }
         std::rethrow_exception(eptr);
     } catch (const redirect_exception& _e) {
-       rep.reset(new http::reply());
-       rep->add_header("Location", _e.url).set_status(_e.status());
+       *rep = _e.to_reply();
     } catch (const base_exception& e) {
-        rep->set_status(e.status(), internal::to_json(e));
+        if (e.content_type().size()) {
+            rep->set_status(e.status(), e.str());
+            rep->set_content_type(e.content_type());
+        } else {
+            rep->set_status(e.status(), internal::to_json(e));
+        }
     } catch (...) {
         rep->set_status(http::reply::status_type::internal_server_error,
                 internal::to_json(std::current_exception()));
@@ -96,6 +100,9 @@ future<std::unique_ptr<http::reply> > routes::handle(const sstring& path, std::u
             handler->verify_mandatory_params(*req);
             auto r =  handler->handle(path, std::move(req), std::move(rep));
             return r.handle_exception(_general_handler);
+        } catch (const redirect_exception& _e) {
+            *rep = _e.to_reply();
+            rep->done("json");
         } catch (...) {
             rep = exception_reply(std::current_exception());
         }
diff --git a/src/net/native-stack-impl.hh b/src/net/native-stack-impl.hh
index 496d9e90de9..0d5db010052 100644
--- a/src/net/native-stack-impl.hh
+++ b/src/net/native-stack-impl.hh
@@ -117,8 +117,8 @@ public:
     keepalive_params get_keepalive_parameters() const override;
     int get_sockopt(int level, int optname, void* data, size_t len) const override;
     void set_sockopt(int level, int optname, const void* data, size_t len) override;
-    socket_address local_address() const noexcept override;
-    socket_address remote_address() const noexcept override;
+    socket_address local_address() const override;
+    socket_address remote_address() const override;
     virtual future<> wait_input_shutdown() override;
 };
 
@@ -179,7 +179,7 @@ public:
         if (_cur_frag != _buf.nr_frags()) {
             auto& f = _buf.fragments()[_cur_frag++];
             return make_ready_future<temporary_buffer<char>>(
-                    temporary_buffer<char>(f.base, f.size,
+                    temporary_buffer<char>::maybe_unsafe_from_deleter(f.base, f.size,
                             make_deleter(deleter(), [p = _buf.share()] () mutable {})));
         }
         return _conn->wait_for_data().then([this] {
@@ -301,12 +301,12 @@ int native_connected_socket_impl<Protocol>::get_sockopt(int level, int optname,
 }
 
 template<typename Protocol>
-socket_address native_connected_socket_impl<Protocol>::local_address() const noexcept {
+socket_address native_connected_socket_impl<Protocol>::local_address() const {
     return {_conn->local_ip(), _conn->local_port()};
 }
 
 template<typename Protocol>
-socket_address native_connected_socket_impl<Protocol>::remote_address() const noexcept {
+socket_address native_connected_socket_impl<Protocol>::remote_address() const {
     return {_conn->foreign_ip(), _conn->foreign_port()};
 }
 
diff --git a/src/net/posix-stack.cc b/src/net/posix-stack.cc
index ed6b190d71b..e7d88ba69d5 100644
--- a/src/net/posix-stack.cc
+++ b/src/net/posix-stack.cc
@@ -258,7 +258,7 @@ static void shutdown_socket_fd(pollable_fd& fd, int how) noexcept {
         // EBADF (invalid file descriptor) -- irretrievable
         fd.shutdown(how);
     } catch (...) {
-        on_internal_error(seastar_logger, seastar::format("socket shutdown({}, {}) failed: {}", fd.get_file_desc().fdinfo(), how, std::current_exception()));
+        on_internal_error(seastar_logger, ::seastar::format("socket shutdown({}, {}) failed: {}", fd.get_file_desc().fdinfo(), how, std::current_exception()));
     }
 }
 
@@ -313,10 +313,10 @@ class posix_connected_socket_impl : public connected_socket_impl {
     int get_sockopt(int level, int optname, void* data, size_t len) const override {
         return _ops->get_sockopt(_fd.get_file_desc(), level, optname, data, len);
     }
-    socket_address local_address() const noexcept override {
+    socket_address local_address() const override {
         return _ops->local_address(_fd.get_file_desc());
     }
-    socket_address remote_address() const noexcept override {
+    socket_address remote_address() const override {
         return _ops->remote_address(_fd.get_file_desc());
     }
     future<> wait_input_shutdown() override {
@@ -1155,7 +1155,7 @@ class posix_datagram : public datagram_impl {
     virtual socket_address get_dst() override { return _dst; }
     virtual uint16_t get_dst_port() override {
         if (_dst.family() != AF_INET && _dst.family() != AF_INET6) {
-            throw std::runtime_error(format("get_dst_port() called on non-IP address: {}", _dst));
+            throw std::runtime_error(::seastar::format("get_dst_port() called on non-IP address: {}", _dst));
         }
         return _dst.port();
     }
@@ -1179,7 +1179,7 @@ posix_datagram_channel::receive() {
         auto sg_id = internal::scheduling_group_index(current_scheduling_group());
         bytes_received[sg_id] += size;
         return make_ready_future<datagram>(datagram(std::make_unique<posix_datagram>(
-            _recv._src_addr, dst ? *dst : _address, temporary_buffer<char>(_recv._buffer, size, make_deleter([buf = _recv._buffer] { delete[] buf; })))));
+            _recv._src_addr, dst ? *dst : _address, temporary_buffer<char>::maybe_unsafe_from_deleter(_recv._buffer, size, make_deleter([buf = _recv._buffer] { delete[] buf; })))));
     }).handle_exception([p = _recv._buffer](auto ep) {
         delete[] p;
         return make_exception_future<datagram>(std::move(ep));
diff --git a/src/net/tls-impl.cc b/src/net/tls-impl.cc
index 4303b3aebb0..0b6f1119da1 100644
--- a/src/net/tls-impl.cc
+++ b/src/net/tls-impl.cc
@@ -284,6 +284,30 @@ void tls::certificate_credentials::enable_tls_renegotiation() {
     _impl->enable_tls_renegotiation();
 }
 
+// Never throws: a missing impl or any exception from the backend is reported as std::nullopt.
+std::optional<std::vector<cert_info>> tls::certificate_credentials::get_cert_info() const noexcept {
+    if (!_impl) {
+        return std::nullopt;
+    }
+    try {
+        return _impl->get_x509_info();
+    } catch (...) {
+        return std::nullopt;
+    }
+}
+
+// Never throws: a missing impl or any exception from the backend is reported as std::nullopt.
+std::optional<std::vector<cert_info>> tls::certificate_credentials::get_trust_list_info() const noexcept {
+    if (!_impl) {
+        return std::nullopt;
+    }
+    try {
+        return _impl->get_x509_trust_list_info();
+    } catch (...) {
+        return std::nullopt;
+    }
+}
+
 tls::server_credentials::server_credentials()
 {}
 
@@ -701,6 +725,30 @@ future<shared_ptr<tls::server_credentials>> tls::credentials_builder::build_relo
     }, tolerance);
 }
 
+// Adapts a credentials-taking callback to reload_callback_ex; credentials are rebuilt on every call.
+tls::reload_callback_ex wrap_reload_callback(tls::reload_callback_with_creds cb) {
+    return [user_cb = std::move(cb)](const tls::credentials_builder& b,
+                                     const std::unordered_set<sstring>& changed, std::exception_ptr err) {
+        auto built = b.build_certificate_credentials();
+        return futurize_invoke(user_cb, changed, *built, err, b.get_trust_file_blob());
+    };
+}
+
+future<shared_ptr<tls::certificate_credentials>> tls::credentials_builder::build_reloadable_certificate_credentials(reload_callback_with_creds cb, std::optional<std::chrono::milliseconds> tolerance) const {
+    return build_reloadable_certificate_credentials(wrap_reload_callback(std::move(cb)), tolerance); // adapt cb via wrap_reload_callback(), then reuse the overload taking the wrapped callback
+}
+
+future<shared_ptr<tls::server_credentials>> tls::credentials_builder::build_reloadable_server_credentials(reload_callback_with_creds cb, std::optional<std::chrono::milliseconds> tolerance) const {
+    return build_reloadable_server_credentials(wrap_reload_callback(std::move(cb)), tolerance); // adapt cb via wrap_reload_callback(), then reuse the overload taking the wrapped callback
+}
+
+std::optional<tls::blob> tls::credentials_builder::get_trust_file_blob() const {
+    const auto entry = _blobs.find(x509_trust_key);
+    if (entry == _blobs.end()) {
+        return std::nullopt; // nothing is stored under x509_trust_key
+    }
+    return std::make_optional<tls::blob>(std::any_cast<const x509_simple&>(entry->second).data);
+}
+
 const std::error_category& tls::error_category() {
     return internal::crypto::provider().get_tls_backend().error_category();
 }
@@ -787,6 +835,10 @@ future<std::optional<session_dn>> tls::get_dn_information(connected_socket& sock
     return get_tls_socket(socket)->get_distinguished_name();
 }
 
+future<std::optional<session_dn>> tls::get_dn_information(connected_socket& socket, dn_format format) {
+    return get_tls_socket(socket)->get_distinguished_name(format); // format is handed to the TLS socket as-is
+}
+
 future<std::vector<tls::subject_alt_name>> tls::get_alt_name_information(connected_socket& socket, std::unordered_set<subject_alt_name_type> types) {
     return get_tls_socket(socket)->get_alt_name_information(std::move(types));
 }
@@ -825,8 +877,16 @@ future<> tls::force_rehandshake(connected_socket& socket) {
 
 } // namespace seastar
 
-// Error code globals — initialized at startup by the active backend's
-// init_error_codes() method, called from smp::configure().
+#ifdef SEASTAR_TLS_DUAL_BACKEND
+// Dual-backend build: the error code globals are zero-initialized here and
+// filled in at reactor startup by the active backend's init_error_codes()
+// method (called from smp::configure() via internal::crypto::set_provider()).
+// Accessing them before reactor startup silently reads as 0 — build with a
+// single TLS backend if you need them to be valid at any time.
+//
+// In single-backend builds these globals are instead defined as `const` and
+// statically initialized in the backend's own tls_<backend>.cc, so they are
+// valid at any time including from static initializers.
 int seastar::tls::ERROR_UNKNOWN_COMPRESSION_ALGORITHM = 0;
 int seastar::tls::ERROR_UNKNOWN_CIPHER_TYPE = 0;
 int seastar::tls::ERROR_INVALID_SESSION = 0;
@@ -845,3 +905,4 @@ int seastar::tls::ERROR_UNSUPPORTED_VERSION = 0;
 int seastar::tls::ERROR_NO_CIPHER_SUITES = 0;
 int seastar::tls::ERROR_DECRYPTION_FAILED = 0;
 int seastar::tls::ERROR_MAC_VERIFY_FAILED = 0;
+#endif // SEASTAR_TLS_DUAL_BACKEND
diff --git a/src/net/tls-impl.hh b/src/net/tls-impl.hh
index 6003a1d8e5e..db6bdb7c923 100644
--- a/src/net/tls-impl.hh
+++ b/src/net/tls-impl.hh
@@ -160,6 +160,10 @@ public:
     virtual void set_maximum_tls_version(tls_version) {}
     virtual void enable_tls_renegotiation() {}
 
+    // Certificate info accessors — the defaults return an empty list for backends that don't implement them.
+    virtual std::vector<cert_info> get_x509_info() const { return {}; }
+    virtual std::vector<cert_info> get_x509_trust_list_info() const { return {}; }
+
     // Flag for lazy system trust loading.
     bool _load_system_trust = false;
 };
@@ -178,6 +182,7 @@ public:
     virtual void close() = 0;
     virtual seastar::net::connected_socket_impl& socket() const = 0;
     virtual future<std::optional<session_dn>> get_distinguished_name() = 0;
+    virtual future<std::optional<session_dn>> get_distinguished_name(dn_format) = 0;
     virtual future<std::vector<subject_alt_name>> get_alt_name_information(
         std::unordered_set<subject_alt_name_type> types) = 0;
     virtual future<bool> is_resumed() = 0;
@@ -264,6 +269,9 @@ public:
     future<std::optional<session_dn>> get_distinguished_name() {
         return _session->get_distinguished_name();
     }
+    future<std::optional<session_dn>> get_distinguished_name(dn_format format) {
+        return _session->get_distinguished_name(format); // forwarded unchanged to the underlying session
+    }
     future<std::vector<subject_alt_name>> get_alt_name_information(std::unordered_set<subject_alt_name_type> types) {
         return _session->get_alt_name_information(std::move(types));
     }
diff --git a/src/net/tls_gnutls.cc b/src/net/tls_gnutls.cc
index 0da8983ba4e..c8564092db1 100644
--- a/src/net/tls_gnutls.cc
+++ b/src/net/tls_gnutls.cc
@@ -32,6 +32,7 @@
 #include <numeric>
 
 #include <seastar/util/assert.hh>
+#include <seastar/util/defer.hh>
 
 #include <netinet/in.h>
 #include <sys/stat.h>
@@ -312,6 +313,15 @@ struct gnutls_datum : public gnutls_datum_t {
 
 namespace tls {
 
+static std::vector<std::byte> extract_x509_serial(gnutls_x509_crt_t cert) {
+    // Fixed 128-byte scratch buffer that receives the certificate's serial number.
+    std::vector<std::byte> bytes(128);
+    size_t written = bytes.size(); // passed in as the buffer size, updated by the call
+    gtls_chk(gnutls_x509_crt_get_serial(cert, bytes.data(), &written));
+    bytes.resize(written); // keep only the length the call reported
+    return bytes;
+}
+
 class gnutls_provider_certificate_credentials_impl: public gnutlsobj, public credentials_impl {
 public:
     gnutls_provider_certificate_credentials_impl()
@@ -434,6 +444,50 @@ class gnutls_provider_certificate_credentials_impl: public gnutlsobj, public cre
     friend class credentials_builder;
     friend class session;
 
+    // Reports serial number and expiry for each certificate of the credential entry at index 0.
+    std::vector<cert_info> get_x509_info() const override {
+        gnutls_x509_crt_t *chain{};
+        unsigned int chain_len{};
+        gtls_chk(gnutls_certificate_get_x509_crt(*this, 0, &chain, &chain_len));
+        // The deferred action deinitializes every returned certificate, then frees the array.
+        auto release_chain = defer([&chain, chain_len]() noexcept {
+            for (unsigned int n = 0; n != chain_len; ++n) {
+                gnutls_x509_crt_deinit(chain[n]);
+            }
+            gnutls_free(chain);
+        });
+        std::vector<cert_info> infos;
+        infos.reserve(chain_len);
+        for (unsigned int n = 0; n != chain_len; ++n) {
+            gnutls_x509_crt_t crt = chain[n];
+            infos.push_back(cert_info{
+                .serial = extract_x509_serial(crt),
+                .expiry = gnutls_x509_crt_get_expiration_time(crt),
+            });
+        }
+        return infos;
+    }
+
+    // Reports serial number and expiry for every CA certificate in the trust list.
+    std::vector<cert_info> get_x509_trust_list_info() const override {
+        gnutls_x509_trust_list_t tlist{};
+        gnutls_certificate_get_trust_list(*this, &tlist);
+        gnutls_x509_trust_list_iter_t iter{};
+        // Only matters when a throw abandons the walk early; skipped once iter is null again.
+        auto free_iter = defer([&iter]() noexcept { if (iter) { gnutls_x509_trust_list_iter_deinit(iter); } });
+        std::vector<cert_info> result;
+        for (;;) {
+            gnutls_x509_crt_t cert{};
+            const int rc = gnutls_x509_trust_list_iter_get_ca(tlist, &iter, &cert);
+            if (rc == GNUTLS_E_REQUESTED_DATA_NOT_AVAILABLE) {
+                return result; // walked past the last entry
+            }
+            gtls_chk(rc); // any other error leaves cert unusable: fail instead of looping on it
+            auto free_cert = defer([cert]() noexcept { gnutls_x509_crt_deinit(cert); });
+            result.push_back(cert_info{.serial = extract_x509_serial(cert), .expiry = gnutls_x509_crt_get_expiration_time(cert)});
+        }
+    }
+
     bool need_load_system_trust() const {
         return _load_system_trust;
     }
@@ -1194,6 +1248,12 @@ class session : public enable_shared_from_this<session>, public tls::session_imp
             return extract_dn_information();
         });
     }
+    future<std::optional<session_dn>> get_distinguished_name(dn_format) override {
+        // The dn_format argument is deliberately ignored: GnuTLS does not provide a mechanism to change the format.
+        return state_checked_access([this] {
+            return extract_dn_information();
+        });
+    }
     future<std::vector<subject_alt_name>> get_alt_name_information(std::unordered_set<subject_alt_name_type> types) override {
         return state_checked_access([this](std::unordered_set<subject_alt_name_type> types) {
             std::vector<subject_alt_name> res;
@@ -1405,24 +1465,57 @@ std::unique_ptr<tls::dh_params_impl> tls::gnutls::make_dh_params(const tls::blob
 }
 
 void tls::gnutls::init_error_codes() {
-    tls::ERROR_UNKNOWN_COMPRESSION_ALGORITHM = GNUTLS_E_UNKNOWN_COMPRESSION_ALGORITHM;
-    tls::ERROR_UNKNOWN_CIPHER_TYPE = GNUTLS_E_UNKNOWN_CIPHER_TYPE;
-    tls::ERROR_INVALID_SESSION = GNUTLS_E_INVALID_SESSION;
-    tls::ERROR_UNEXPECTED_HANDSHAKE_PACKET = GNUTLS_E_UNEXPECTED_HANDSHAKE_PACKET;
-    tls::ERROR_UNKNOWN_CIPHER_SUITE = GNUTLS_E_UNKNOWN_CIPHER_SUITE;
-    tls::ERROR_UNKNOWN_ALGORITHM = GNUTLS_E_UNKNOWN_ALGORITHM;
+#ifdef SEASTAR_TLS_DUAL_BACKEND
+    // In dual-backend builds the globals are mutable, zero at static-init
+    // time, and the active backend fills them in here at smp::configure()
+    // time. In single-backend builds these globals are declared `const` and
+    // statically initialized below; this function is a no-op.
+    tls::ERROR_UNKNOWN_COMPRESSION_ALGORITHM   = GNUTLS_E_UNKNOWN_COMPRESSION_ALGORITHM;
+    tls::ERROR_UNKNOWN_CIPHER_TYPE             = GNUTLS_E_UNKNOWN_CIPHER_TYPE;
+    tls::ERROR_INVALID_SESSION                 = GNUTLS_E_INVALID_SESSION;
+    tls::ERROR_UNEXPECTED_HANDSHAKE_PACKET     = GNUTLS_E_UNEXPECTED_HANDSHAKE_PACKET;
+    tls::ERROR_UNKNOWN_CIPHER_SUITE            = GNUTLS_E_UNKNOWN_CIPHER_SUITE;
+    tls::ERROR_UNKNOWN_ALGORITHM               = GNUTLS_E_UNKNOWN_ALGORITHM;
     tls::ERROR_UNSUPPORTED_SIGNATURE_ALGORITHM = GNUTLS_E_UNSUPPORTED_SIGNATURE_ALGORITHM;
-    tls::ERROR_SAFE_RENEGOTIATION_FAILED = GNUTLS_E_SAFE_RENEGOTIATION_FAILED;
-    tls::ERROR_UNSAFE_RENEGOTIATION_DENIED = GNUTLS_E_UNSAFE_RENEGOTIATION_DENIED;
-    tls::ERROR_UNKNOWN_SRP_USERNAME = GNUTLS_E_UNKNOWN_SRP_USERNAME;
-    tls::ERROR_PREMATURE_TERMINATION = GNUTLS_E_PREMATURE_TERMINATION;
-    tls::ERROR_PUSH = GNUTLS_E_PUSH_ERROR;
-    tls::ERROR_PULL = GNUTLS_E_PULL_ERROR;
-    tls::ERROR_UNEXPECTED_PACKET = GNUTLS_E_UNEXPECTED_PACKET;
-    tls::ERROR_UNSUPPORTED_VERSION = GNUTLS_E_UNSUPPORTED_VERSION_PACKET;
-    tls::ERROR_NO_CIPHER_SUITES = GNUTLS_E_NO_CIPHER_SUITES;
-    tls::ERROR_DECRYPTION_FAILED = GNUTLS_E_DECRYPTION_FAILED;
-    tls::ERROR_MAC_VERIFY_FAILED = GNUTLS_E_MAC_VERIFY_FAILED;
+    tls::ERROR_SAFE_RENEGOTIATION_FAILED       = GNUTLS_E_SAFE_RENEGOTIATION_FAILED;
+    tls::ERROR_UNSAFE_RENEGOTIATION_DENIED     = GNUTLS_E_UNSAFE_RENEGOTIATION_DENIED;
+    tls::ERROR_UNKNOWN_SRP_USERNAME            = GNUTLS_E_UNKNOWN_SRP_USERNAME;
+    tls::ERROR_PREMATURE_TERMINATION           = GNUTLS_E_PREMATURE_TERMINATION;
+    tls::ERROR_PUSH                            = GNUTLS_E_PUSH_ERROR;
+    tls::ERROR_PULL                            = GNUTLS_E_PULL_ERROR;
+    tls::ERROR_UNEXPECTED_PACKET               = GNUTLS_E_UNEXPECTED_PACKET;
+    tls::ERROR_UNSUPPORTED_VERSION             = GNUTLS_E_UNSUPPORTED_VERSION_PACKET;
+    tls::ERROR_NO_CIPHER_SUITES                = GNUTLS_E_NO_CIPHER_SUITES;
+    tls::ERROR_DECRYPTION_FAILED               = GNUTLS_E_DECRYPTION_FAILED;
+    tls::ERROR_MAC_VERIFY_FAILED               = GNUTLS_E_MAC_VERIFY_FAILED;
+#endif
 }
 
+#ifndef SEASTAR_TLS_DUAL_BACKEND
+// Single-backend build (GnuTLS only): the legacy ERROR_* globals are declared
+// `const` in <seastar/net/tls.hh> (via SEASTAR_TLS_ERROR_CONST), and defined
+// here with static initializers tied to the GnuTLS constants. As a result
+// they are valid at any time including from static initializers and before
+// reactor startup. In dual-backend builds these globals are mutable, defined
+// in tls-impl.cc, and filled in at reactor startup by init_error_codes().
+const int tls::ERROR_UNKNOWN_COMPRESSION_ALGORITHM   = GNUTLS_E_UNKNOWN_COMPRESSION_ALGORITHM;
+const int tls::ERROR_UNKNOWN_CIPHER_TYPE             = GNUTLS_E_UNKNOWN_CIPHER_TYPE;
+const int tls::ERROR_INVALID_SESSION                 = GNUTLS_E_INVALID_SESSION;
+const int tls::ERROR_UNEXPECTED_HANDSHAKE_PACKET     = GNUTLS_E_UNEXPECTED_HANDSHAKE_PACKET;
+const int tls::ERROR_UNKNOWN_CIPHER_SUITE            = GNUTLS_E_UNKNOWN_CIPHER_SUITE;
+const int tls::ERROR_UNKNOWN_ALGORITHM               = GNUTLS_E_UNKNOWN_ALGORITHM;
+const int tls::ERROR_UNSUPPORTED_SIGNATURE_ALGORITHM = GNUTLS_E_UNSUPPORTED_SIGNATURE_ALGORITHM;
+const int tls::ERROR_SAFE_RENEGOTIATION_FAILED       = GNUTLS_E_SAFE_RENEGOTIATION_FAILED;
+const int tls::ERROR_UNSAFE_RENEGOTIATION_DENIED     = GNUTLS_E_UNSAFE_RENEGOTIATION_DENIED;
+const int tls::ERROR_UNKNOWN_SRP_USERNAME            = GNUTLS_E_UNKNOWN_SRP_USERNAME;
+const int tls::ERROR_PREMATURE_TERMINATION           = GNUTLS_E_PREMATURE_TERMINATION;
+const int tls::ERROR_PUSH                            = GNUTLS_E_PUSH_ERROR;
+const int tls::ERROR_PULL                            = GNUTLS_E_PULL_ERROR;
+const int tls::ERROR_UNEXPECTED_PACKET               = GNUTLS_E_UNEXPECTED_PACKET;
+const int tls::ERROR_UNSUPPORTED_VERSION             = GNUTLS_E_UNSUPPORTED_VERSION_PACKET;
+const int tls::ERROR_NO_CIPHER_SUITES                = GNUTLS_E_NO_CIPHER_SUITES;
+const int tls::ERROR_DECRYPTION_FAILED               = GNUTLS_E_DECRYPTION_FAILED;
+const int tls::ERROR_MAC_VERIFY_FAILED               = GNUTLS_E_MAC_VERIFY_FAILED;
+#endif // !SEASTAR_TLS_DUAL_BACKEND
+
 } // namespace seastar
diff --git a/src/net/tls_gnutls.hh b/src/net/tls_gnutls.hh
index 3464d7b08f1..050f788b5d7 100644
--- a/src/net/tls_gnutls.hh
+++ b/src/net/tls_gnutls.hh
@@ -65,6 +65,12 @@ std::unique_ptr<dh_params_impl> make_dh_params(dh_params::level);
 std::unique_ptr<dh_params_impl> make_dh_params(const blob&, x509_crt_format);
 
 /// Initialize TLS error codes with GnuTLS values.
+///
+/// In dual-backend builds (\c SEASTAR_TLS_DUAL_BACKEND) the legacy
+/// \c seastar::tls::ERROR_* globals are zero at static-init time and this
+/// function fills them in at reactor startup. In single-backend builds the
+/// globals are statically initialized to their GnuTLS values and this is a
+/// no-op.
 void init_error_codes();
 
 } // namespace seastar::tls::gnutls
diff --git a/src/net/tls_openssl.cc b/src/net/tls_openssl.cc
index a0a61d1f982..1e39f27d94c 100644
--- a/src/net/tls_openssl.cc
+++ b/src/net/tls_openssl.cc
@@ -347,6 +347,26 @@ class openssl_provider_dh_params_impl : public tls::dh_params_impl {
 
 namespace tls {
 
+// Copies the raw bytes of the certificate's serial number, keeping at most
+// the first 160 bytes.
+static std::vector<std::byte> extract_x509_serial(X509* cert) {
+    constexpr size_t max_len = 160;
+    const ASN1_INTEGER *asn1_serial = X509_get_serialNumber(cert);
+    const auto *first = reinterpret_cast<std::byte*>(asn1_serial->data);
+    const size_t len = std::min(max_len, static_cast<size_t>(asn1_serial->length));
+    return std::vector<std::byte>(first, first + len);
+}
+
+// Returns the certificate's notAfter as seconds since the epoch (UTC), or -1 if it is absent or unparseable.
+static time_t extract_x509_expiry(X509* cert) {
+    const ASN1_TIME *not_after = X509_get0_notAfter(cert);
+    tm tm_struct{};
+    if (not_after == nullptr || ASN1_TIME_to_tm(not_after, &tm_struct) != 1) {
+        return -1;
+    }
+    return timegm(&tm_struct); // tm holds UTC; mktime() would wrongly apply the local time zone
+}
+
 class openssl_provider_certificate_credentials_impl : public tls::credentials_impl {
     struct certkey_pair {
         x509_ptr cert;
@@ -694,6 +714,34 @@ class openssl_provider_certificate_credentials_impl : public tls::credentials_im
         return _load_system_trust;
     }
 
+    // Reports serial number and expiry of the configured certificate; empty when none is set.
+    std::vector<cert_info> get_x509_info() const override {
+        X509* const own_cert = _cert_and_key.cert.get();
+        if (own_cert == nullptr) {
+            return {};
+        }
+        std::vector<cert_info> infos;
+        infos.push_back(cert_info{.serial = extract_x509_serial(own_cert), .expiry = extract_x509_expiry(own_cert)});
+        return infos;
+    }
+
+    // Reports serial number and expiry for each X509 certificate object in the store.
+    std::vector<cert_info> get_x509_trust_list_info() const override {
+        STACK_OF(X509_OBJECT) *objects = X509_STORE_get0_objects(_creds.get());
+        const int count = sk_X509_OBJECT_num(objects);
+        std::vector<cert_info> infos;
+        for (int idx = 0; idx < count; ++idx) {
+            X509_OBJECT *entry = sk_X509_OBJECT_value(objects, idx);
+            if (X509_OBJECT_get_type(entry) != X509_LU_X509) {
+                continue; // skip store objects that are not certificates
+            }
+            X509 *ca = X509_OBJECT_get0_X509(entry);
+            infos.push_back(cert_info{.serial = extract_x509_serial(ca),
+                                      .expiry = extract_x509_expiry(ca)});
+        }
+        return infos;
+    }
+
     certkey_pair _cert_and_key;
     session_ticket_keys _session_ticket_keys;
     x509_ptr _last_cert;
@@ -1509,6 +1557,10 @@ class openssl_session : public enable_shared_from_this<openssl_session>, public
     }
 
     future<std::optional<session_dn>> get_distinguished_name() override {
+        return get_distinguished_name(dn_format::legacy);
+    }
+
+    future<std::optional<session_dn>> get_distinguished_name(dn_format format) override {
         using result_t = std::optional<session_dn>;
         if (_error) {
             return make_exception_future<result_t>(_error);
@@ -1519,9 +1571,9 @@ class openssl_session : public enable_shared_from_this<openssl_session>, public
         }
         if (!connected()) {
             return handshake().then(
-              [this]() mutable { return get_distinguished_name(); });
+              [this, format]() mutable { return get_distinguished_name(format); });
         }
-        result_t dn = extract_dn_information(is_verification_error::no);
+        result_t dn = extract_dn_information(is_verification_error::no, format);
         return make_ready_future<result_t>(std::move(dn));
     }
 
@@ -1651,6 +1703,10 @@ class openssl_session : public enable_shared_from_this<openssl_session>, public
         char buf[256];
         ERR_error_string_n(err, buf, sizeof(buf));
         tls_log.warn("{} stale error on queue before {}: {}", *this, operation, buf);
+        // OpenSSL's API contract is too loose, and the impact too wide
+        // (e.g., low-priority HTTPS traffic could crash the whole process)
+        // to terminate in release builds. Use plain assert() which fires only in debug.
+        assert(0 && "stale errors on OpenSSL error queue");
     }
 
     std::vector<subject_alt_name> do_get_alt_name_information(const x509_ptr &peer_cert,
@@ -1790,7 +1846,7 @@ class openssl_session : public enable_shared_from_this<openssl_session>, public
 
     using is_verification_error = bool_class<struct is_verification_error_tag>;
 
-    std::optional<session_dn> extract_dn_information(is_verification_error verification_error = is_verification_error::no) const {
+    std::optional<session_dn> extract_dn_information(is_verification_error verification_error = is_verification_error::no, dn_format format = dn_format::legacy) const {
         const auto peer_cert = [this, verification_error]{
             if (verification_error) {
                 // If we are attempting to get a DN from a cert that failed verification, then
@@ -1805,8 +1861,8 @@ class openssl_session : public enable_shared_from_this<openssl_session>, public
         if (!peer_cert) {
             return std::nullopt;
         }
-        auto subject = get_dn_string(X509_get_subject_name(peer_cert.get()));
-        auto issuer = get_dn_string(X509_get_issuer_name(peer_cert.get()));
+        auto subject = get_dn_string(X509_get_subject_name(peer_cert.get()), format);
+        auto issuer = get_dn_string(X509_get_issuer_name(peer_cert.get()), format);
         if (!subject || !issuer) {
             throw make_openssl_error(
               "error while extracting certificate DN strings");
@@ -1992,9 +2048,17 @@ class openssl_session : public enable_shared_from_this<openssl_session>, public
         return ssl_ctx;
     }
 
-    static std::optional<sstring> get_dn_string(X509_NAME* name) {
+    static std::optional<sstring> get_dn_string(X509_NAME* name, dn_format format = dn_format::legacy) {
         auto out = bio_ptr(BIO_new(BIO_s_mem()));
-        unsigned long flags = ASN1_STRFLGS_RFC2253 | XN_FLAG_SEP_COMMA_PLUS | XN_FLAG_FN_SN | XN_FLAG_DUMP_UNKNOWN_FIELDS;
+        unsigned long flags = [](dn_format format) {
+            switch(format) {
+            case dn_format::rfc2253:
+                return XN_FLAG_RFC2253;
+            case dn_format::legacy:
+                return ASN1_STRFLGS_RFC2253 | XN_FLAG_SEP_COMMA_PLUS | XN_FLAG_FN_SN | XN_FLAG_DUMP_UNKNOWN_FIELDS;
+            }
+            __builtin_unreachable();
+        }(format);
         if (-1 == X509_NAME_print_ex(out.get(), name, 0, flags)) {
             return std::nullopt;
         }
@@ -2310,26 +2374,60 @@ std::unique_ptr<tls::dh_params_impl> tls::openssl::make_dh_params(const tls::blo
 }
 
 void tls::openssl::init_error_codes() {
-    tls::ERROR_UNKNOWN_COMPRESSION_ALGORITHM = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNSUPPORTED_COMPRESSION_ALGORITHM);
-    tls::ERROR_UNKNOWN_CIPHER_TYPE = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNKNOWN_CIPHER_TYPE);
-    tls::ERROR_INVALID_SESSION = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_INVALID_SESSION_ID);
-    tls::ERROR_UNEXPECTED_HANDSHAKE_PACKET = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNEXPECTED_RECORD);
-    tls::ERROR_UNKNOWN_CIPHER_SUITE = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNSUPPORTED_PROTOCOL);
-    tls::ERROR_UNKNOWN_ALGORITHM = ERR_PACK(ERR_LIB_RSA, 0, RSA_R_UNKNOWN_ALGORITHM_TYPE);
+#ifdef SEASTAR_TLS_DUAL_BACKEND
+    // In dual-backend builds the globals are mutable, zero at static-init
+    // time, and the active backend fills them in here at smp::configure()
+    // time. In single-backend builds these globals are declared `const` and
+    // statically initialized below; this function is a no-op.
+    tls::ERROR_UNKNOWN_COMPRESSION_ALGORITHM   = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNSUPPORTED_COMPRESSION_ALGORITHM);
+    tls::ERROR_UNKNOWN_CIPHER_TYPE             = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNKNOWN_CIPHER_TYPE);
+    tls::ERROR_INVALID_SESSION                 = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_INVALID_SESSION_ID);
+    tls::ERROR_UNEXPECTED_HANDSHAKE_PACKET     = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNEXPECTED_RECORD);
+    tls::ERROR_UNKNOWN_CIPHER_SUITE            = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNSUPPORTED_PROTOCOL);
+    tls::ERROR_UNKNOWN_ALGORITHM               = ERR_PACK(ERR_LIB_RSA, 0, RSA_R_UNKNOWN_ALGORITHM_TYPE);
     tls::ERROR_UNSUPPORTED_SIGNATURE_ALGORITHM = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_NO_SUITABLE_SIGNATURE_ALGORITHM);
-    tls::ERROR_SAFE_RENEGOTIATION_FAILED = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_RENEGOTIATION_MISMATCH);
-    tls::ERROR_UNSAFE_RENEGOTIATION_DENIED = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNSAFE_LEGACY_RENEGOTIATION_DISABLED);
-    tls::ERROR_UNKNOWN_SRP_USERNAME = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_INVALID_SRP_USERNAME);
-    tls::ERROR_PREMATURE_TERMINATION = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNEXPECTED_EOF_WHILE_READING);
-    tls::ERROR_PUSH = int(ERR_SYSTEM_FLAG | EPIPE);
-    tls::ERROR_PULL = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_READ_BIO_NOT_SET);
-    tls::ERROR_UNEXPECTED_PACKET = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNEXPECTED_MESSAGE);
-    tls::ERROR_UNSUPPORTED_VERSION = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNSUPPORTED_SSL_VERSION);
-    tls::ERROR_NO_CIPHER_SUITES = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_NO_CIPHERS_AVAILABLE);
-    tls::ERROR_DECRYPTION_FAILED = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_DECRYPTION_FAILED);
-    tls::ERROR_MAC_VERIFY_FAILED = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_DECRYPTION_FAILED_OR_BAD_RECORD_MAC);
+    tls::ERROR_SAFE_RENEGOTIATION_FAILED       = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_RENEGOTIATION_MISMATCH);
+    tls::ERROR_UNSAFE_RENEGOTIATION_DENIED     = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNSAFE_LEGACY_RENEGOTIATION_DISABLED);
+    tls::ERROR_UNKNOWN_SRP_USERNAME            = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_INVALID_SRP_USERNAME);
+    tls::ERROR_PREMATURE_TERMINATION           = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNEXPECTED_EOF_WHILE_READING);
+    tls::ERROR_PUSH                            = int(ERR_SYSTEM_FLAG | EPIPE);
+    tls::ERROR_PULL                            = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_READ_BIO_NOT_SET);
+    tls::ERROR_UNEXPECTED_PACKET               = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNEXPECTED_MESSAGE);
+    tls::ERROR_UNSUPPORTED_VERSION             = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNSUPPORTED_SSL_VERSION);
+    tls::ERROR_NO_CIPHER_SUITES                = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_NO_CIPHERS_AVAILABLE);
+    tls::ERROR_DECRYPTION_FAILED               = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_DECRYPTION_FAILED);
+    tls::ERROR_MAC_VERIFY_FAILED               = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_DECRYPTION_FAILED_OR_BAD_RECORD_MAC);
+#endif
 }
 
+#ifndef SEASTAR_TLS_DUAL_BACKEND
+// Single-backend build (OpenSSL only): the legacy ERROR_* globals are
+// declared `const` in <seastar/net/tls.hh> (via SEASTAR_TLS_ERROR_CONST), and
+// defined here with static initializers tied to the OpenSSL constants. As a
+// result they are valid at any time including from static initializers and
+// before reactor startup. In dual-backend builds these globals are mutable,
+// defined in tls-impl.cc, and filled in at reactor startup by
+// init_error_codes().
+const int tls::ERROR_UNKNOWN_COMPRESSION_ALGORITHM   = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNSUPPORTED_COMPRESSION_ALGORITHM);
+const int tls::ERROR_UNKNOWN_CIPHER_TYPE             = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNKNOWN_CIPHER_TYPE);
+const int tls::ERROR_INVALID_SESSION                 = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_INVALID_SESSION_ID);
+const int tls::ERROR_UNEXPECTED_HANDSHAKE_PACKET     = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNEXPECTED_RECORD);
+const int tls::ERROR_UNKNOWN_CIPHER_SUITE            = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNSUPPORTED_PROTOCOL);
+const int tls::ERROR_UNKNOWN_ALGORITHM               = ERR_PACK(ERR_LIB_RSA, 0, RSA_R_UNKNOWN_ALGORITHM_TYPE);
+const int tls::ERROR_UNSUPPORTED_SIGNATURE_ALGORITHM = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_NO_SUITABLE_SIGNATURE_ALGORITHM);
+const int tls::ERROR_SAFE_RENEGOTIATION_FAILED       = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_RENEGOTIATION_MISMATCH);
+const int tls::ERROR_UNSAFE_RENEGOTIATION_DENIED     = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNSAFE_LEGACY_RENEGOTIATION_DISABLED);
+const int tls::ERROR_UNKNOWN_SRP_USERNAME            = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_INVALID_SRP_USERNAME);
+const int tls::ERROR_PREMATURE_TERMINATION           = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNEXPECTED_EOF_WHILE_READING);
+const int tls::ERROR_PUSH                            = int(ERR_SYSTEM_FLAG | EPIPE);
+const int tls::ERROR_PULL                            = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_READ_BIO_NOT_SET);
+const int tls::ERROR_UNEXPECTED_PACKET               = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNEXPECTED_MESSAGE);
+const int tls::ERROR_UNSUPPORTED_VERSION             = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_UNSUPPORTED_SSL_VERSION);
+const int tls::ERROR_NO_CIPHER_SUITES                = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_NO_CIPHERS_AVAILABLE);
+const int tls::ERROR_DECRYPTION_FAILED               = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_DECRYPTION_FAILED);
+const int tls::ERROR_MAC_VERIFY_FAILED               = ERR_PACK(ERR_LIB_SSL, 0, SSL_R_DECRYPTION_FAILED_OR_BAD_RECORD_MAC);
+#endif // !SEASTAR_TLS_DUAL_BACKEND
+
 } // namespace seastar
 
 auto fmt::formatter<seastar::tls::openssl_session>::format(
diff --git a/src/net/tls_openssl.hh b/src/net/tls_openssl.hh
index 765bcee1f94..53b63322e93 100644
--- a/src/net/tls_openssl.hh
+++ b/src/net/tls_openssl.hh
@@ -65,6 +65,12 @@ std::unique_ptr<dh_params_impl> make_dh_params(dh_params::level);
 std::unique_ptr<dh_params_impl> make_dh_params(const blob&, x509_crt_format);
 
 /// Initialize TLS error codes with OpenSSL values.
+///
+/// In dual-backend builds (\c SEASTAR_TLS_DUAL_BACKEND) the legacy
+/// \c seastar::tls::ERROR_* globals are zero at static-init time and this
+/// function fills them in at reactor startup. In single-backend builds the
+/// globals are statically initialized to their OpenSSL values and this is a
+/// no-op.
 void init_error_codes();
 
 } // namespace seastar::tls::openssl
diff --git a/src/net/udp.cc b/src/net/udp.cc
index 121913da02e..5d5eddb8912 100644
--- a/src/net/udp.cc
+++ b/src/net/udp.cc
@@ -100,7 +100,7 @@ class native_channel : public datagram_channel_impl {
     }
 
     virtual future<> send(const socket_address& dst, const char* msg) override {
-        temporary_buffer<char> buf(const_cast<char *>(msg), strlen(msg), deleter());
+        auto buf = temporary_buffer<char>::maybe_unsafe_from_deleter(const_cast<char *>(msg), strlen(msg), deleter());
         return send(dst, std::span(&buf, 1));
     }
 
diff --git a/src/rpc/rpc.cc b/src/rpc/rpc.cc
index dc06e01c567..10f7559ea57 100644
--- a/src/rpc/rpc.cc
+++ b/src/rpc/rpc.cc
@@ -82,14 +82,14 @@ snd_buf make_shard_local_buffer_copy(snd_buf* org, std::function<deleter(snd_buf
     auto* one = std::get_if<temporary_buffer<char>>(&org->bufs);
 
     if (one) {
-        buf.bufs = temporary_buffer<char>(one->get_write(), one->size(), make_deleter(org));
+        buf.bufs = temporary_buffer<char>::maybe_unsafe_from_deleter(one->get_write(), one->size(), make_deleter(org));
     } else {
         auto& orgbufs = std::get<std::vector<temporary_buffer<char>>>(org->bufs);
         std::vector<temporary_buffer<char>> newbufs;
         newbufs.reserve(orgbufs.size());
         auto d = make_deleter(org);
         for (auto&& b : orgbufs) {
-            newbufs.emplace_back(b.get_write(), b.size(), d.share());
+            newbufs.emplace_back(temporary_buffer<char>::maybe_unsafe_from_deleter(b.get_write(), b.size(), d.share()));
         }
         buf.bufs = std::move(newbufs);
     }
@@ -107,14 +107,14 @@ rcv_buf make_shard_local_buffer_copy(foreign_ptr<std::unique_ptr<rcv_buf>> org)
     auto* one = std::get_if<temporary_buffer<char>>(&org->bufs);
 
     if (one) {
-        buf.bufs = temporary_buffer<char>(one->get_write(), one->size(), make_object_deleter(std::move(org)));
+        buf.bufs = temporary_buffer<char>::maybe_unsafe_from_deleter(one->get_write(), one->size(), make_object_deleter(std::move(org)));
     } else {
         auto& orgbufs = std::get<std::vector<temporary_buffer<char>>>(org->bufs);
         std::vector<temporary_buffer<char>> newbufs;
         newbufs.reserve(orgbufs.size());
         deleter d = make_object_deleter(std::move(org));
         for (auto&& b : orgbufs) {
-            newbufs.emplace_back(b.get_write(), b.size(), d.share());
+            newbufs.push_back(temporary_buffer<char>::maybe_unsafe_from_deleter(b.get_write(), b.size(), d.share()));
         }
         buf.bufs = std::move(newbufs);
     }
diff --git a/src/util/backtrace.cc b/src/util/backtrace.cc
index 327c9073d03..701986a4c2a 100644
--- a/src/util/backtrace.cc
+++ b/src/util/backtrace.cc
@@ -88,6 +88,18 @@ frame decorate(uintptr_t addr) noexcept {
     return {&so, addr - so.begin};
 }
 
+#ifndef SEASTAR_BACKTRACE_UNIMPLEMENTED
+int guarded_backtrace(void **array, int size) noexcept {
+    static thread_local internal::signal_mutex mux{};
+    // ::backtrace isn't re-entrant, so a thread-local lock stops a nested call on the same thread from entering it.
+    if (auto guard_opt = mux.try_lock(); guard_opt.has_value()) {
+        return ::backtrace(array, size);
+    }
+    // try_lock() gave no guard, i.e. a call is already in progress on this thread: report zero frames.
+    return 0;
+}
+#endif
+
 simple_backtrace current_backtrace_tasklocal() noexcept {
     simple_backtrace::vector_type v;
     backtrace([&] (frame f) {
diff --git a/src/util/process.cc b/src/util/process.cc
index fab551e61f2..b3c05f48d65 100644
--- a/src/util/process.cc
+++ b/src/util/process.cc
@@ -30,7 +30,7 @@
 
 namespace seastar {
 
-namespace {
+namespace process_internal {
 class pipe_data_source_impl final : public data_source_impl {
     static constexpr std::size_t buffer_size = 8192;
     struct buffer_allocator : public internal::buffer_allocator {
@@ -109,7 +109,7 @@ class pipe_data_sink_impl final : public data_sink_impl {
         return _buffer_size;
     }
 };
-}
+} // namespace process_internal
 
 process::process(create_tag, pid_t pid, file_desc&& cin, file_desc&& cout, file_desc&& cerr)
     : _pid(pid)
@@ -150,15 +150,15 @@ future<process> process::spawn(const std::filesystem::path& pathname) {
 }
 
 output_stream<char> process::cin() {
-    return output_stream<char>(data_sink(pipe_data_sink_impl::from_fd(std::move(_stdin))));
+    return output_stream<char>(data_sink(process_internal::pipe_data_sink_impl::from_fd(std::move(_stdin))));
 }
 
 input_stream<char> process::cout() {
-    return input_stream<char>(data_source(pipe_data_source_impl::from_fd(std::move(_stdout))));
+    return input_stream<char>(data_source(process_internal::pipe_data_source_impl::from_fd(std::move(_stdout))));
 }
 
 input_stream<char> process::cerr() {
-    return input_stream<char>(data_source(pipe_data_source_impl::from_fd(std::move(_stderr))));
+    return input_stream<char>(data_source(process_internal::pipe_data_source_impl::from_fd(std::move(_stderr))));
 }
 
 }
diff --git a/tests/perf/linux_perf_event.cc b/tests/perf/linux_perf_event.cc
index b4c76c0014e..54c38aa64c4 100644
--- a/tests/perf/linux_perf_event.cc
+++ b/tests/perf/linux_perf_event.cc
@@ -62,8 +62,7 @@ linux_perf_event::read() {
         return 0;
     }
     uint64_t ret;
-    auto res = ::read(_fd, &ret, sizeof(ret));
-    SEASTAR_ASSERT(res == sizeof(ret) && "read(2) failed on perf_event fd");
+    if (::read(_fd, &ret, sizeof(ret)) != ssize_t(sizeof(ret))) { ret = 0; } // failed/short read leaves ret unset: report 0, not garbage
     return ret;
 }
 
diff --git a/tests/unit/CMakeLists.txt b/tests/unit/CMakeLists.txt
index 89d14282d16..b44c2b3b667 100644
--- a/tests/unit/CMakeLists.txt
+++ b/tests/unit/CMakeLists.txt
@@ -445,6 +445,9 @@ seastar_add_test (lowres_clock
 seastar_add_test (metrics
   SOURCES metrics_test.cc)
 
+seastar_add_test (metrics_family_replication
+  SOURCES metric_family_replication_test.cc)
+
 seastar_add_test (net_config
   KIND BOOST
   SOURCES net_config_test.cc)
@@ -456,6 +459,10 @@ seastar_add_test (noncopyable_function
 seastar_add_test (input_stream
   SOURCES input_stream_test.cc)
 
+seastar_add_test (cpu_profiler_alloc
+  KIND BOOST
+  SOURCES cpu_profiler_alloc_test.cc)
+
 seastar_add_test (output_stream
   SOURCES
     output_stream_test.cc
@@ -529,6 +536,9 @@ seastar_add_test (sstring
 seastar_add_test (stall_detector
   SOURCES stall_detector_test.cc)
 
+seastar_add_test (cpu_profiler
+  SOURCES cpu_profiler_test.cc)
+
 seastar_add_test (stream_reader
   SOURCES stream_reader_test.cc)
 
diff --git a/tests/unit/alloc_test.cc b/tests/unit/alloc_test.cc
index 87ed601bc03..2686f4a5750 100644
--- a/tests/unit/alloc_test.cc
+++ b/tests/unit/alloc_test.cc
@@ -19,6 +19,7 @@
  * Copyright (C) 2015 Cloudius Systems, Ltd.
  */
 
+#include <seastar/core/future.hh>
 #include <seastar/core/memory.hh>
 #include <seastar/core/shard_id.hh>
 #include <seastar/core/smp.hh>
@@ -29,11 +30,12 @@
 #include <seastar/util/log.hh>
 #include <seastar/util/memory_diagnostics.hh>
 
+#include <boost/test/unit_test.hpp>
+
 #include <memory>
 #include <new>
 #include <vector>
 #include <future>
-#include <iostream>
 
 #include <malloc.h>
 #include <stdlib.h>
@@ -305,6 +307,114 @@ SEASTAR_TEST_CASE(test_enable_abort_on_oom) {
     return make_ready_future<>();
 }
 
+// Exhausts memory with alloc_size-byte allocations, then checks that allocations
+// only succeed again (counted as fallback/foreign allocations) while a
+// scoped_system_alloc_fallback is alive. align == 1 selects the plain new[] path.
+static auto do_test_fallback_alloc(size_t align, size_t alloc_size) {
+    using namespace seastar::memory;
+    auto orig_stats = stats();
+
+    // alignment must be a power of two, and at least 1
+    BOOST_REQUIRE(align > 0 && ((align & (align - 1)) == 0));
+    // NOTE(review): unique_ptr<char[]> releases with plain delete[], also for blocks from the align_val_t new[] below.
+    std::vector<std::unique_ptr<char []>> ptrs;
+
+    // reserve up front so a vector reallocation cannot disturb the counters checked below
+    auto too_many_allocs = orig_stats.free_memory() * 2 / alloc_size;
+    ptrs.reserve(too_many_allocs);
+    // allocates one block, checks its alignment and keeps it alive in ptrs
+    auto alloc_one = [&] {
+        char *p = align != 1 ? new (std::align_val_t(align)) char[alloc_size] : new char[alloc_size];
+        BOOST_REQUIRE(p != nullptr);
+        // check alignment
+        BOOST_REQUIRE((reinterpret_cast<uintptr_t>(p) % align) == 0);
+        ptrs.emplace_back(p);
+    };
+
+    auto alloc_one_expect_fail = [&] {
+        BOOST_REQUIRE_THROW(alloc_one(), std::bad_alloc);
+    };
+
+    // allocate until the first failure, i.e. until alloc_size-byte allocations start throwing
+    for (size_t iters = 0; ; ++iters) {
+        try {
+            alloc_one();
+        } catch (const std::bad_alloc&) {
+            break;
+        }
+        BOOST_REQUIRE(iters < too_many_allocs);
+    }
+    // exactly one allocation has failed so far: the one that ended the loop
+    BOOST_REQUIRE_EQUAL(stats().failed_allocations(),
+            orig_stats.failed_allocations() + 1);
+
+    // check that we will still fail
+    alloc_one_expect_fail();
+
+    BOOST_REQUIRE_EQUAL(stats().failed_allocations(),
+            orig_stats.failed_allocations() + 2);
+
+    BOOST_REQUIRE_EQUAL(stats().fallback_allocations(),
+            orig_stats.fallback_allocations());
+
+    // shouldn't be any foreign allocs yet
+    BOOST_REQUIRE_EQUAL(stats().foreign_mallocs(),
+        orig_stats.foreign_mallocs());
+
+    // open a fallback scope: allocations are expected to succeed again inside it
+    {
+        seastar::memory::scoped_system_alloc_fallback scope0;
+
+        // this should fallback and increment fallback count
+        alloc_one();
+        BOOST_REQUIRE_EQUAL(stats().failed_allocations(),
+                orig_stats.failed_allocations() + 2);
+        BOOST_REQUIRE_EQUAL(stats().fallback_allocations(),
+                orig_stats.fallback_allocations() + 1);
+
+        // nested scope
+        {
+            seastar::memory::scoped_system_alloc_fallback scope1;
+            alloc_one();
+            BOOST_REQUIRE_EQUAL(stats().fallback_allocations(),
+                    orig_stats.fallback_allocations() + 2);
+        }
+
+        // one more outside the inner nested region
+        alloc_one();
+
+        // each of these should be a foreign alloc
+        BOOST_REQUIRE_EQUAL(stats().foreign_mallocs(),
+            orig_stats.foreign_mallocs() + 3);
+    }
+
+    // fallback scope closed, so we should fail again (NOTE(review): abort-on-failure is only switched off here, after earlier expected failures — confirm)
+    set_abort_on_allocation_failure(false);
+    alloc_one_expect_fail();
+
+    // check that we haven't done any foreign frees yet
+    BOOST_REQUIRE_EQUAL(stats().foreign_cross_frees(),
+            orig_stats.foreign_cross_frees());
+
+    // now clear all pointers and we should have three foreign frees
+    // from the three fallbacks above
+    ptrs.clear();
+    BOOST_REQUIRE_EQUAL(stats().foreign_cross_frees(),
+            orig_stats.foreign_cross_frees() + 3);
+
+    return make_ready_future();
+}
+
+SEASTAR_TEST_CASE(test_fallback_alloc_unaligned) {
+    // align == 1 selects the default allocation functions; size must be larger than the small allocation threshold
+    return do_test_fallback_alloc(1, 32 * 1024);
+}
+
+SEASTAR_TEST_CASE(test_fallback_alloc_aligned) {
+    // 1024-byte aligned variant; size must be larger than the small allocation threshold
+    return do_test_fallback_alloc(1024, 32 * 1024);
+}
+
 void * volatile sink;
 
 SEASTAR_TEST_CASE(test_bad_alloc_throws) {
diff --git a/tests/unit/cpu_profiler_alloc_test.cc b/tests/unit/cpu_profiler_alloc_test.cc
new file mode 100644
index 00000000000..2e601ac5cfd
--- /dev/null
+++ b/tests/unit/cpu_profiler_alloc_test.cc
@@ -0,0 +1,66 @@
+/* This file is open source software, licensed to you under the terms
+ * of the Apache License, Version 2.0 (the "License").  See the NOTICE file
+ * distributed with this work for additional information regarding copyright
+ * ownership.  You may not use this file except in compliance with the License.
+ *
+ * You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+/*
+ * Copyright (C) 2023 ScyllaDB Ltd.
+ */
+
+#include <chrono>
+#define BOOST_TEST_MODULE core
+
+#include <boost/test/unit_test.hpp>
+
+#include <string_view>
+#include <concepts>
+#include <seastar/core/internal/cpu_profiler.hh>
+#include <seastar/core/memory.hh>
+#include <seastar/core/smp.hh>
+
+template <typename Func>
+requires std::invocable<Func>
+void check_function_allocation(const char *name, size_t expected_allocs, Func f) {
+  // Runs f and requires that it performed exactly expected_allocs mallocs; name labels a failure.
+  const auto stats_before = seastar::memory::stats();
+  f();
+  const auto stats_after = seastar::memory::stats();
+  BOOST_TEST_INFO("After function: " << name);
+  BOOST_REQUIRE_EQUAL(expected_allocs, stats_after.mallocs() - stats_before.mallocs());
+}
+
+// cpu_profiler whose timer hooks do nothing, so the test itself decides
+// when on_signal() runs.
+class cpu_profiler_test : public seastar::internal::cpu_profiler {
+  using base = seastar::internal::cpu_profiler;
+
+public:
+  cpu_profiler_test(seastar::internal::cpu_profiler_config cfg) : base(cfg) {}
+  ~cpu_profiler_test() override = default;
+
+  // Timer hooks are intentionally empty.
+  void arm_timer(std::chrono::nanoseconds) override {}
+  void disarm_timer() override {}
+};
+
+BOOST_AUTO_TEST_CASE(signal_handler_doesnt_alloc) {
+  // on_signal() is driven directly here and is required to perform zero mallocs.
+  seastar::internal::cpu_profiler_config cfg{true, std::chrono::milliseconds(1)};
+  cpu_profiler_test profiler(cfg);
+  profiler.start();
+  check_function_allocation("cpu_profiler_on_signal", 0, [&profiler] {
+    constexpr int iterations = 1'000'000;
+    for (int i = 0; i < iterations; ++i) { profiler.on_signal(); }
+  });
+}
diff --git a/tests/unit/cpu_profiler_test.cc b/tests/unit/cpu_profiler_test.cc
new file mode 100644
index 00000000000..92734977d8d
--- /dev/null
+++ b/tests/unit/cpu_profiler_test.cc
@@ -0,0 +1,391 @@
+/*
+ * This file is open source software, licensed to you under the terms
+ * of the Apache License, Version 2.0 (the "License").  See the NOTICE file
+ * distributed with this work for additional information regarding copyright
+ * ownership.  You may not use this file except in compliance with the License.
+ *
+ * You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+/*
+ * Copyright (C) 2023 ScyllaDB Ltd.
+ */
+
+#include <atomic>
+#include <chrono>
+#include <cstddef>
+
+#include <seastar/core/internal/cpu_profiler.hh>
+#include <seastar/core/internal/stall_detector.hh>
+#include <seastar/core/loop.hh>
+#include <seastar/core/reactor.hh>
+#include <seastar/core/scheduling.hh>
+#include <seastar/core/thread_cputime_clock.hh>
+#include <seastar/core/with_scheduling_group.hh>
+#include <seastar/testing/test_case.hh>
+#include <seastar/testing/thread_test_case.hh>
+#include <seastar/util/backtrace.hh>
+#include <seastar/util/defer.hh>
+#include <seastar/util/later.hh>
+
+#include "stall_detector_test_utilities.hh"
+
+#include <sys/mman.h>
+
+#include <boost/test/tools/old/interface.hpp>
+
+#ifdef SEASTAR_BACKTRACE_UNIMPLEMENTED
+
+// If backtrace is not implemented, we cannot test the profiler.
+// An empty test case satisfies the requirement that there is at least one test case.
+SEASTAR_THREAD_TEST_CASE(simple_case) {
+}
+
+#else
+
+namespace {
+
+// If true, the "close enough" checks accept a much wider range of values,
+// which reduces flakiness on heavily loaded or otherwise unpredictable
+// systems. If false, the thresholds are much stricter and should be used
+// on more deterministic systems.
+// We default to true to avoid flakes in CI, but when running locally you
+// can consider setting this to false to get a more accurate picture of
+// the profiler's behavior.
+constexpr bool use_loose_thresholds = true;
+
+// Scoped override of the reactor's CPU profiler period/enabled settings;
+// the values found at construction are put back on destruction.
+struct temporary_profiler_settings {
+    std::chrono::nanoseconds prev_ns;
+    bool prev_enabled;
+
+    temporary_profiler_settings(bool enable, std::chrono::nanoseconds ns)
+            : prev_ns(engine().get_cpu_profiler_period())
+            , prev_enabled(engine().get_cpu_profiler_enabled()) {
+        engine().set_cpu_profiler_period(ns);
+        engine().set_cpu_profiler_enabled(enable);
+    }
+    ~temporary_profiler_settings() {
+        engine().set_cpu_profiler_period(prev_ns);
+        engine().set_cpu_profiler_enabled(prev_enabled);
+    }
+};
+
+// If we set a timer to fire in N ms we can expect it to fire between N and (N + E) ms from
+// when it was set, where E is some fixed error that arises from how granular a given timer
+// is. Therefore over a given period of time, M, if the timer is continuously reset every
+// time it fires we can expect the timer to fire between M/(N+E) and M/N times.
+//
+// Returns true when actual_size lies within the tolerated band around expected_size, so the
+// number of samples taken may be somewhat less (or more) than the error-free expectation.
+bool close_to_expected(size_t actual_size, size_t expected_size) {
+    constexpr double allowed_dev = 0.15;
+
+    size_t lower_bound, upper_bound;
+
+    if (use_loose_thresholds) {
+        // Widen the thresholds a lot. Scale expected_size before rounding: rounding the bare
+        // factors gives 1x/2x, i.e. a lower bound stricter than the non-loose branch below.
+        lower_bound = round(pow(1 - allowed_dev, 4) * expected_size);
+        upper_bound = round(pow(1 + allowed_dev, 4) * expected_size);
+    } else {
+        lower_bound = round((1 - allowed_dev) * expected_size);
+        upper_bound = round((1 + allowed_dev) * expected_size);
+    }
+
+    BOOST_TEST_INFO("actual_size: " << actual_size << ", lower_bound " << lower_bound << ", upper_bound " << upper_bound);
+
+    return actual_size <= upper_bound && actual_size >= lower_bound;
+}
+
+// If loose thresholds are enabled, this requires close_to_expected() to hold, otherwise
+// it does an exact equality check. `message` is attached to a failure as test info.
+void maybe_exact(size_t actual, size_t expected, auto message) {
+    BOOST_TEST_INFO(message);
+    if (use_loose_thresholds) {
+        BOOST_REQUIRE(close_to_expected(actual, expected)); // the result used to be discarded, so nothing was checked
+    } else {
+        BOOST_REQUIRE_EQUAL(actual, expected);
+    }
+}
+
+/*
+ * Get the current profile results and dropped count. If sg_is_main is true, also validates that
+ * the sg associated with the profile is always main, as we expect unless some SG have been
+ * created explicitly. Pass false to skip that validation.
+ */
+std::pair<std::vector<cpu_profiler_trace>, size_t> get_profile_and_dropped(bool sg_is_main = true) {
+    std::vector<cpu_profiler_trace> results;
+    auto dropped = engine().profiler_results(results);
+
+    for (const auto& result: results) {
+        BOOST_CHECK(!sg_is_main || result.sg == default_scheduling_group());
+    }
+
+    return {std::move(results), dropped};
+}
+
+
+// Get the profile via get_profile_and_dropped() with its default arguments, discarding the dropped count.
+std::vector<cpu_profiler_trace> get_profile() {
+    return get_profile_and_dropped().first;
+}
+
+}
+
+
+
+SEASTAR_THREAD_TEST_CASE(config_case) {
+    // Ensure that repeatedly configuring the profiler results
+    // in expected behavior.
+    {
+        temporary_profiler_settings cp_0{true, 10ms};
+        temporary_profiler_settings cp_1{true, 20ms};
+        temporary_profiler_settings cp_2{false, 30ms};
+        temporary_profiler_settings cp_3{true, 10ms};
+        temporary_profiler_settings cp_4{true, 100ms};
+        // the last override is in effect: enabled with a 100ms period, so about 12 samples in 1200ms
+        spin_some_cooperatively(120*10ms);
+
+        auto results = get_profile();
+        BOOST_REQUIRE(close_to_expected(results.size(), 12));
+    }
+    // every override has been undone (in reverse order) by now; no samples are expected
+    spin_some_cooperatively(128*10ms);
+    auto results = get_profile();
+    BOOST_REQUIRE_EQUAL(results.size(), 0);
+}
+
+SEASTAR_THREAD_TEST_CASE(simple_case) {
+    temporary_profiler_settings cp{true, 100ms};
+    // 1200ms of cooperative work sampled every 100ms: about 12 samples, none dropped
+    spin_some_cooperatively(120*10ms);
+
+    auto [results, dropped_samples] = get_profile_and_dropped();
+    BOOST_REQUIRE(close_to_expected(results.size(), 12));
+    BOOST_REQUIRE_EQUAL(dropped_samples, 0);
+}
+
+SEASTAR_THREAD_TEST_CASE(overwrite_case) {
+    // Ensure that older samples are being overwritten in
+    // the cases where we can't collect results fast enough.
+    temporary_profiler_settings cp{true, 10ms};
+    // run for 256 sample periods without collecting, i.e. longer than the sample buffer can hold
+    spin_some_cooperatively(256*10ms);
+
+    auto [results, dropped_samples] = get_profile_and_dropped();
+    // 128 is the maximum number of samples the profiler can
+    // retain.
+    BOOST_REQUIRE_EQUAL(results.size(), 128);
+    BOOST_REQUIRE(dropped_samples > 0);
+}
+
+SEASTAR_THREAD_TEST_CASE(mixed_case) {
+    // Ensure that the profiler and cpu_stall_detector don't affect
+    // the functioning of each other.
+    std::atomic<unsigned> reports{};
+    temporary_stall_detector_settings tsds(10ms, [&] { ++reports; });
+    temporary_profiler_settings cp{true, 100ms};
+    // each iteration ends with a 20ms non-yielding spin, above the 10ms stall threshold set above
+    unsigned nr = 10;
+    for (unsigned i = 0; i < nr; ++i) {
+        spin_some_cooperatively(100ms);
+        spin(20ms);
+    }
+    // NOTE(review): 10 stalls are produced but 5 reports are expected — presumably the detector rate-limits reports; confirm
+    maybe_exact(reports, 5, "reports");
+    auto results = get_profile();
+    BOOST_REQUIRE(close_to_expected(results.size(), 12));
+}
+
+SEASTAR_THREAD_TEST_CASE(spin_in_kernel) {
+    // Check that we are correctly sampling the kernel stack.
+    temporary_profiler_settings cp{true, 10ms};
+    // spin with a body that repeatedly calls mmap_populate()
+    spin_some_cooperatively(100ms, [] { mmap_populate(128 * 1024); });
+
+    auto results = get_profile();
+    int count = 0;
+    for(auto& result : results) {
+        if(result.kernel_backtrace.size() > 0){
+            count++;
+        }
+    }
+
+    // There is no way to ensure every result has a kernel callstack.
+    // And if we're using the posix timer then no kernel callstacks will
+    // be sampled. So the count is only logged, not asserted.
+    testlog.info("sampled {} kernel callstacks", count);
+    // only the presence of samples is required
+    BOOST_REQUIRE(results.size() > 0);
+}
+
+SEASTAR_THREAD_TEST_CASE(signal_mutex_basic) {
+    // A very basic test that ensures the signal_mutex
+    // can't be re-locked after it's already been acquired.
+    internal::signal_mutex mutex;
+
+    {
+        auto guard_opt_1 = mutex.try_lock();
+        BOOST_REQUIRE(guard_opt_1.has_value());
+        // a second attempt while the first guard is alive must come back empty
+        auto guard_opt_2 = mutex.try_lock();
+        BOOST_REQUIRE(!guard_opt_2.has_value());
+    }
+    // the guards went out of scope above, so the mutex can be taken again
+    auto guard_opt_3 = mutex.try_lock();
+    BOOST_REQUIRE(guard_opt_3.has_value());
+}
+
+namespace {
+void random_exception_catcher(int p, int a);
+// Decrements the remaining depth 'a'; throws once it reaches zero, otherwise recurses through the catcher with a random p in [1, 100].
+[[gnu::noinline]] void
+random_exception_thrower(int a) {
+  static thread_local std::random_device rd;
+  static thread_local std::mt19937 gen(rd());
+  std::uniform_int_distribution<> d(1, 100);
+
+  a -= 1;
+
+  if (a <= 0) {
+    throw std::invalid_argument("noop");
+  }
+
+  random_exception_catcher(d(gen), a);
+}
+// Calls the thrower and swallows its exception, unless a fresh random draw in [1, 100] exceeds p, in which case it is rethrown.
+[[gnu::noinline]] void random_exception_catcher(int p, int a) {
+  static thread_local std::random_device rd;
+  static thread_local std::mt19937 gen(rd());
+  std::uniform_int_distribution<> d(1, 100);
+
+  try {
+    random_exception_thrower(a);
+  } catch (...) {
+    int r = d(gen);
+    if (r > p) {
+      throw;
+    }
+  }
+}
+
+} // namespace
+
+SEASTAR_THREAD_TEST_CASE(exception_handler_case) {
+  // NOTE: this test currently checks nothing; everything after the early return is unreachable.
+  // disabled for now, CORE-9144
+  return;
+  // Ensure that exception unwinding doesn't cause any issues
+  // while profiling.
+  temporary_profiler_settings cp{true, 1us};
+  // p == 100 means the outermost catcher never rethrows (its draw is at most 100)
+  std::random_device rd;
+  std::mt19937 gen(rd());
+  std::uniform_int_distribution<> d(1, 100);
+  for (int a = 0; a < 10000; a++) {
+    random_exception_catcher(100, d(gen));
+  }
+
+  auto [results, dropped_samples] = get_profile_and_dropped();
+  BOOST_REQUIRE_EQUAL(results.size(), 128);
+  BOOST_REQUIRE(dropped_samples > 0);
+}
+
+SEASTAR_THREAD_TEST_CASE(manually_disable) {
+  // Ensure that manually disabling the profile backtracing works
+  seastar::internal::scoped_disable_profile_temporarily profiling_disabled;
+  temporary_profiler_settings cp{true, 10us};
+
+  spin_some_cooperatively(100ms);
+  // with backtracing disabled for the whole scope, samples are expected to be counted as dropped
+  auto [_, dropped_samples] = get_profile_and_dropped();
+  BOOST_REQUIRE(dropped_samples > 0);
+}
+
+SEASTAR_THREAD_TEST_CASE(config_thrashing) {
+  // NOTE: this test currently checks nothing; everything after the early return is unreachable.
+  // disabled for now, CORE-9144
+  return;
+  // Ensure that fast config changes leave the profiler in a valid
+  // state.
+  temporary_profiler_settings cp{true, 1us};
+
+  std::random_device rd;
+  std::mt19937 gen(rd());
+  std::uniform_int_distribution<> d(1, 100);
+  // each iteration applies a random enabled flag (r even) and period (r microseconds), then restores the previous settings
+  for (int a = 0; a < 100; a++) {
+    int r = d(gen);
+    temporary_profiler_settings cp_0{r % 2 == 0, std::chrono::microseconds(r)};
+    spin_some_cooperatively(1us);
+  }
+
+  auto results = get_profile();
+  BOOST_REQUIRE(results.size() > 0);
+}
+
+SEASTAR_THREAD_TEST_CASE(scheduling_group_test) {
+    // Two groups, created with identical parameters, spin concurrently under the profiler.
+    auto sg_a = create_scheduling_group("sg_a", 200).get();
+    auto sg_b = create_scheduling_group("sg_b", 200).get();
+
+    auto destroy_groups = defer([&]() noexcept {
+        destroy_scheduling_group(sg_b).get();
+        destroy_scheduling_group(sg_a).get();
+    });
+
+    temporary_profiler_settings profiler_on{true, 100ms};
+
+    // sg_a's spin is started first and left running while sg_b's spin is awaited.
+    auto spin_in_a = with_scheduling_group(sg_a, [] {
+        return spin_some_cooperatively_coro(2100ms);
+    });
+    with_scheduling_group(sg_b, [] {
+        return spin_some_cooperatively_coro(2100ms);
+    }).get();
+    std::move(spin_in_a).get();
+
+    std::vector<cpu_profiler_trace> traces;
+    auto dropped_samples = engine().profiler_results(traces);
+
+    // Attribute every sample to the scheduling group it was taken in.
+    size_t count_a = 0, count_b = 0, count_main = 0;
+    for (auto& trace : traces) {
+        if (trace.sg == sg_a) {
+            ++count_a;
+        } else if (trace.sg == sg_b) {
+            ++count_b;
+        } else if (trace.sg == default_scheduling_group()) {
+            // this happens when the profiler triggers during non-task
+            // work, such as in the reactor pollers
+            ++count_main;
+        } else {
+            BOOST_TEST_FAIL("unexpected SG: " << trace.sg.name());
+        }
+    }
+
+    // Both groups do the same work, so a roughly 1:1 split between a and b
+    // is expected. The variance is large, though: this samples two groups
+    // that are scheduled "randomly", so the single-group guarantee of being
+    // within about +/- 1 of the computed sample count does not carry over.
+    // Nominally the split is 10/10/0 for a/b/main; to avoid flakiness only
+    // loose bounds are checked: more than 10 samples across a and b, at
+    // least one in each, and fewer than 10 for main and for dropped samples.
+    BOOST_CHECK_GT(count_a + count_b, 10);
+    BOOST_CHECK_GT(count_a, 0);
+    BOOST_CHECK_GT(count_b, 0);
+    BOOST_CHECK_LT(count_main, 10);
+    BOOST_CHECK_LT(dropped_samples, 10);
+}
+
+#endif
diff --git a/tests/unit/metric_family_replication_test.cc b/tests/unit/metric_family_replication_test.cc
new file mode 100644
index 00000000000..584ba13f479
--- /dev/null
+++ b/tests/unit/metric_family_replication_test.cc
@@ -0,0 +1,96 @@
+#include <seastar/core/metrics.hh>
+#include <seastar/core/metrics_api.hh>
+#include <seastar/core/metrics_registration.hh>
+#include <seastar/testing/test_case.hh>
+#include <seastar/testing/test_runner.hh>
+#include <seastar/testing/thread_test_case.hh>
+
+namespace sm = seastar::metrics;
+namespace smi = seastar::metrics::impl;
+// True when the value map obtained for `handle` contains a family called `name`.
+bool metric_family_exists(int handle, const seastar::sstring& name) {
+    return smi::get_value_map(handle).contains(name);
+}
+// Requires that family `name` exists under both handles and that each source metric has a replica with the same labels, id and value.
+void assert_metric_families_equivalent(int source, int destination,
+                                       const seastar::sstring& name) {
+    const auto& source_value_map = smi::get_value_map(source);
+    const auto& destination_value_map = smi::get_value_map(destination);
+
+    BOOST_REQUIRE(source_value_map.contains(name));
+    BOOST_REQUIRE(destination_value_map.contains(name));
+    // only source -> destination is walked; extra metrics in the destination family are not detected
+    const auto& source_family = source_value_map.at(name);
+    const auto& destination_family = destination_value_map.at(name);
+    for (const auto& [labels, source_metric]: source_family) {
+        auto replica_iter = destination_family.find(labels.labels());
+        BOOST_REQUIRE(replica_iter != destination_family.end());
+
+        const auto& replica_metric = replica_iter->second;
+        BOOST_REQUIRE(source_metric->get_id() == replica_metric->get_id());
+        // compare the values both metric functions currently produce, read through i()
+        auto source_current_value = source_metric->get_function()().i();
+        auto replica_current_value = replica_metric->get_function()().i();
+        BOOST_REQUIRE(source_current_value == replica_current_value);
+    }
+}
+
+SEASTAR_THREAD_TEST_CASE(replicate_metrics_test) {
+    int foo_handle = sm::default_handle();
+    sm::metric_groups foo(foo_handle);
+    foo.add_group("a", {
+        sm::make_gauge(
+            "gauge",
+            [] { return 0; })});
+    // replicate the family looked up as "a_gauge" (group "a", metric "gauge") to two further handles
+    int bar_handle = sm::default_handle() + 1;
+    int baz_handle = sm::default_handle() + 2;
+    sm::replicate_metric_families(foo_handle, {
+            {"a_gauge", bar_handle},
+            {"a_gauge", baz_handle}
+    }).get();
+    // both destinations must now hold a matching copy of the source family
+    assert_metric_families_equivalent(foo_handle, bar_handle, "a_gauge");
+    assert_metric_families_equivalent(foo_handle, baz_handle, "a_gauge");
+}
+
+SEASTAR_THREAD_TEST_CASE(replicate_same_metric_test) {
+    int foo_handle = sm::default_handle();
+    // group "a" registers gauge "x" under two label sets and gauge "y" under one
+    sm::metric_groups foo(foo_handle);
+    foo.add_group("a", {
+        sm::make_gauge(
+            "x",
+            [] { return 0; },
+            sm::description("a_x_description"),
+            {sm::label("id")("1")}),
+        sm::make_gauge(
+            "x",
+            [] { return 0; },
+            sm::description("a_x_description"),
+            {sm::label("id")("2")}),
+        sm::make_gauge(
+            "y",
+            [] { return 0; },
+            sm::description("a_y_description"),
+            {sm::label("id")("1")}),
+    });
+
+    int bar_handle = sm::default_handle() + 1;
+    sm::metric_groups bar(bar_handle);
+
+    // Test that subsequent attempts to replicate the same metric
+    // family are ignored.
+    sm::replicate_metric_families(foo_handle, {{"a_x", bar_handle}}).get();
+    assert_metric_families_equivalent(foo_handle, bar_handle, "a_x");
+    sm::replicate_metric_families(foo_handle, {{"a_x", bar_handle}}).get();
+    assert_metric_families_equivalent(foo_handle, bar_handle, "a_x");
+
+
+    // Ensure that when the set of replicated metric families is changed
+    // the replicas that are not in the new set are removed.
+    sm::replicate_metric_families(foo_handle, {{"a_y", bar_handle}}).get();
+    assert_metric_families_equivalent(foo_handle, bar_handle, "a_y");
+    // NOTE(review): only the presence of "a_y" is asserted; the removal of "a_x" from bar_handle described above is never checked.
+    BOOST_REQUIRE(metric_family_exists(bar_handle, "a_y"));
+}
diff --git a/tests/unit/stall_detector_test.cc b/tests/unit/stall_detector_test.cc
index f28a41ca3cb..8ba07f1c924 100644
--- a/tests/unit/stall_detector_test.cc
+++ b/tests/unit/stall_detector_test.cc
@@ -35,59 +35,7 @@
 #include <sys/mman.h>
 
 #ifndef SEASTAR_DEBUG
-
-using namespace seastar;
-using namespace std::chrono_literals;
-
-static seastar::logger testlog("testlog");
-
-class temporary_stall_detector_settings {
-    std::chrono::milliseconds _old_threshold;
-    std::function<void ()> _old_report;
-public:
-    /**
-     * Temporarily (until destructor) overload the stall detector threshold and reporting function.
-     *
-     * Also resets the reported stalls counter to zero, so the next backtraces will not be supressed.
-     */
-    temporary_stall_detector_settings(std::chrono::duration<double> threshold, std::function<void ()> report = {})
-            : _old_threshold(engine().get_blocked_reactor_notify_ms())
-            , _old_report(reactor::test::get_stall_detector_report_function()) {
-        engine().update_blocked_reactor_notify_ms(std::chrono::duration_cast<std::chrono::milliseconds>(threshold));
-        reactor::test::set_stall_detector_report_function(std::move(report));
-    }
-
-    ~temporary_stall_detector_settings() {
-        engine().update_blocked_reactor_notify_ms(_old_threshold);
-        reactor::test::set_stall_detector_report_function(std::move(_old_report));
-    }
-};
-
-using void_fn = std::function<void()>;
-
-void spin(std::chrono::duration<double> how_much, void_fn body = []{}) {
-    auto end = internal::cpu_stall_detector::clock_type::now() + how_much;
-    while (internal::cpu_stall_detector::clock_type::now() < end) {
-        body(); // spin!
-    }
-}
-
-static void spin_user_hires(std::chrono::duration<double> how_much) {
-    auto end = std::chrono::high_resolution_clock::now() + how_much;
-    while (std::chrono::high_resolution_clock::now() < end) {
-
-    }
-}
-
-void spin_some_cooperatively(std::chrono::duration<double> how_much, void_fn body = []{}) {
-    auto end = std::chrono::steady_clock::now() + how_much;
-    while (std::chrono::steady_clock::now() < end) {
-        spin(200us, body);
-        if (need_preempt()) {
-            thread::yield();
-        }
-    }
-}
+#include "stall_detector_test_utilities.hh"
 
 SEASTAR_THREAD_TEST_CASE(normal_case) {
     std::atomic<unsigned> reports{};
@@ -131,46 +79,11 @@ SEASTAR_THREAD_TEST_CASE(no_poll_no_stall) {
     BOOST_REQUIRE_EQUAL(reports, 0);
 }
 
-// Triggers stalls by spinning with a specify "body" function
-// which takes most of the spin time.
-static void test_spin_with_body(const char* what, void_fn body) {
-    // The !count_stacks mode outputs stall notification to stderr as usual
-    // and do not assert anything, but are intended for diagnosing
-    // stall problems by inspecting the output. We expect the userspace
-    // spin test to show no kernel callstack, and the kernel test to
-    // show kernel backtraces in the mmap or munmap path, but this is
-    // not exact since neither test spends 100% of its time in the
-    // selected mode (of course, kernel stacks only appear if the
-    // perf-based stall detected could be enabled).
-    //
-    // Then the count_stacks mode tests that the right number of stacks
-    // were output.
-    for (auto count_stacks : {false, true}) {
-        testlog.info("Starting spin test: {}", what);
-        std::atomic<unsigned> reports{};
-        std::function<void()> reporter = count_stacks ? std::function<void()>{[&]{ ++reports; }} : nullptr;
-        temporary_stall_detector_settings tsds(10ms, std::move(reporter));
-        constexpr unsigned nr = 5;
-        for (unsigned i = 0; i < nr; ++i) {
-            spin_some_cooperatively(100ms, body);
-            spin(20ms, body);
-        }
-        testlog.info("Ending spin test: {}", what);
-        BOOST_CHECK_EQUAL(reports, count_stacks ? 5 : 0);
-    }
-}
-
 SEASTAR_THREAD_TEST_CASE(spin_in_userspace) {
     // a body which spends almost all of its time in userspace
     test_spin_with_body("userspace", [] { spin_user_hires(1ms); });
 }
 
-static void mmap_populate(size_t len) {
-    void *p = mmap(nullptr, len, PROT_READ | PROT_WRITE, MAP_PRIVATE | MAP_ANONYMOUS | MAP_POPULATE, 0, 0);
-    BOOST_REQUIRE(p != MAP_FAILED);
-    BOOST_REQUIRE(munmap(p, len) == 0);
-}
-
 SEASTAR_THREAD_TEST_CASE(spin_in_kernel) {
     // a body which spends almost all of its time in the kernel
     // doing 128K mmaps
diff --git a/tests/unit/stall_detector_test_utilities.hh b/tests/unit/stall_detector_test_utilities.hh
new file mode 100644
index 00000000000..48fa5055f4a
--- /dev/null
+++ b/tests/unit/stall_detector_test_utilities.hh
@@ -0,0 +1,140 @@
+/*
+ * This file is open source software, licensed to you under the terms
+ * of the Apache License, Version 2.0 (the "License").  See the NOTICE file
+ * distributed with this work for additional information regarding copyright
+ * ownership.  You may not use this file except in compliance with the License.
+ *
+ * You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+/*
+ * Copyright (C) 2023 ScyllaDB Ltd.
+ */
+
+#pragma once
+
+#include <cstddef>
+#include <seastar/core/internal/stall_detector.hh>
+#include <seastar/core/reactor.hh>
+#include "seastar/core/scheduling.hh"
+#include "seastar/core/thread.hh"
+#include "seastar/coroutine/maybe_yield.hh"
+#include <seastar/core/thread_cputime_clock.hh>
+#include <seastar/core/loop.hh>
+#include <seastar/util/later.hh>
+#include <atomic>
+#include <chrono>
+#include <sys/mman.h>
+#include <boost/test/tools/old/interface.hpp>
+
+namespace {
+
+using namespace seastar;
+using namespace std::chrono_literals;
+
+static seastar::logger testlog("testlog");
+
+class temporary_stall_detector_settings {
+    std::chrono::milliseconds _old_threshold; // threshold read at construction, restored by the destructor
+    std::function<void ()> _old_report; // report function read at construction, restored by the destructor
+public:
+    /**
+     * Temporarily (until destructor) override the stall detector threshold and reporting function.
+     *
+     * Also resets the reported stalls counter to zero, so the next backtraces will not be suppressed.
+     */
+    temporary_stall_detector_settings(std::chrono::duration<double> threshold, std::function<void ()> report = {})
+            : _old_threshold(engine().get_blocked_reactor_notify_ms())
+            , _old_report(reactor::test::get_stall_detector_report_function()) {
+        engine().update_blocked_reactor_notify_ms(std::chrono::duration_cast<std::chrono::milliseconds>(threshold)); // duration_cast drops any sub-millisecond part
+        reactor::test::set_stall_detector_report_function(std::move(report));
+    }
+
+    ~temporary_stall_detector_settings() {
+        engine().update_blocked_reactor_notify_ms(_old_threshold); // put back the settings captured by the constructor
+        reactor::test::set_stall_detector_report_function(std::move(_old_report));
+    }
+};
+
+using void_fn = std::function<void()>;
+
+void spin(std::chrono::duration<double> how_much, void_fn body = []{}) { // busy-loops for how_much, invoking body on every iteration
+    auto end = internal::cpu_stall_detector::clock_type::now() + how_much; // deadline is taken on the stall detector's own clock type
+    while (internal::cpu_stall_detector::clock_type::now() < end) {
+        body(); // spin! this loop itself never yields
+    }
+}
+
+// Busy-waits on std::chrono::high_resolution_clock for how_much. Unused in debug mode, hence [[maybe_unused]].
+[[maybe_unused]] void spin_user_hires(std::chrono::duration<double> how_much) {
+    auto end = std::chrono::high_resolution_clock::now() + how_much;
+    while (std::chrono::high_resolution_clock::now() < end) { // intentionally empty body: only the clock is polled
+
+    }
+}
+
+void spin_some_cooperatively(std::chrono::duration<double> how_much, void_fn body = []{}) { // spins for how_much in 200us bursts, yielding in between when asked to
+    auto end = std::chrono::steady_clock::now() + how_much;
+    while (std::chrono::steady_clock::now() < end) {
+        spin(200us, body); // one short uninterrupted burst
+        if (need_preempt()) {
+            thread::yield(); // NOTE(review): presumably requires running inside a seastar::thread - confirm against callers
+        }
+    }
+}
+
+[[maybe_unused]] // coroutine counterpart of spin_some_cooperatively; may be unused by some includers
+future<> spin_some_cooperatively_coro(std::chrono::duration<double> how_much, void_fn body = []{}) {
+    auto end = std::chrono::steady_clock::now() + how_much;
+    while (std::chrono::steady_clock::now() < end) {
+        // fmt::print("GC: {}\n", current_scheduling_group().name());
+        spin(200us, body); // one short uninterrupted burst
+        co_await coroutine::maybe_yield(); // give other tasks a chance to run between bursts
+    }
+}
+
+
+// Triggers stalls by spinning with a specific "body" function
+// which takes most of the spin time.
+inline void test_spin_with_body(const char* what, void_fn body) {
+    // The !count_stacks mode outputs stall notifications to stderr as usual
+    // and does not assert anything, but is intended for diagnosing
+    // stall problems by inspecting the output. We expect the userspace
+    // spin test to show no kernel callstack, and the kernel test to
+    // show kernel backtraces in the mmap or munmap path, but this is
+    // not exact since neither test spends 100% of its time in the
+    // selected mode (of course, kernel stacks only appear if the
+    // perf-based stall detector could be enabled).
+    //
+    // Then the count_stacks mode tests that the right number of stacks
+    // were output.
+    for (auto count_stacks : {false, true}) {
+        testlog.info("Starting spin test: {}", what);
+        std::atomic<unsigned> reports{}; // incremented by the reporter below, only in count_stacks mode
+        std::function<void()> reporter = count_stacks ? std::function<void()>{[&]{ ++reports; }} : nullptr; // null reporter: no counting, see comment above
+        temporary_stall_detector_settings tsds(10ms, std::move(reporter)); // 10ms threshold for the duration of this iteration
+        constexpr unsigned nr = 5; // number of rounds; the expected report count below is hard-coded to the same value
+        for (unsigned i = 0; i < nr; ++i) {
+            spin_some_cooperatively(100ms, body); // cooperative phase, yields between 200us bursts
+            spin(20ms, body); // uninterrupted 20ms spin, longer than the 10ms threshold
+        }
+        testlog.info("Ending spin test: {}", what);
+        BOOST_CHECK_EQUAL(reports, count_stacks ? 5 : 0); // one report expected per round when counting
+    }
+}
+
+inline void mmap_populate(size_t len) { // maps len bytes of private anonymous memory and immediately unmaps it again
+    void *p = mmap(nullptr, len, PROT_READ | PROT_WRITE, MAP_PRIVATE | MAP_ANONYMOUS | MAP_POPULATE, 0, 0); // MAP_POPULATE asks the kernel to prefault the pages during the call
+    BOOST_REQUIRE(p != MAP_FAILED);
+    BOOST_REQUIRE(munmap(p, len) == 0);
+}
+
+} // namespace
diff --git a/tests/unit/tls_test.cc b/tests/unit/tls_test.cc
index e522ba6d036..fc4059fb223 100644
--- a/tests/unit/tls_test.cc
+++ b/tests/unit/tls_test.cc
@@ -1054,6 +1054,65 @@ SEASTAR_THREAD_TEST_CASE(test_reload_certificates) {
     }
 }
 
+SEASTAR_THREAD_TEST_CASE(test_reload_certificates_with_creds) {
+    tmpdir tmp; // scratch directory holding the certificate/key pair under test
+
+    namespace fs = std::filesystem;
+
+    fs::copy_file(certfile("other.crt"), tmp.path() / "test.crt"); // start with the "other" pair installed as test.crt/test.key
+    fs::copy_file(certfile("other.key"), tmp.path() / "test.key");
+
+    auto cert = (tmp.path() / "test.crt").native();
+    auto key = (tmp.path() / "test.key").native();
+    std::unordered_set<sstring> changed; // accumulates the file names passed to the reload callback
+    promise<> p; // resolved once both cert and key have been reported
+
+    tls::credentials_builder b;
+    b.set_x509_key_file(cert, key, tls::x509_crt_format::PEM).get();
+    b.set_dh_level();
+
+    auto certs = b.build_reloadable_server_credentials([&](const std::unordered_set<sstring> &files,
+                                                           const tls::certificate_credentials &creds,
+                                                           std::exception_ptr ep,
+                                                           std::optional<tls::blob> trust_file_contents) {
+        if (ep) { // callbacks that carry an error are ignored
+            return;
+        }
+
+        changed.insert(files.begin(), files.end());
+        if (changed.count(cert) && changed.count(key)) {
+            p.set_value(); // NOTE(review): would run again if another callback fires after both files were seen - confirm this cannot happen
+        }
+
+        auto certs_info = creds.get_cert_info();
+        auto trust_list_info = creds.get_trust_list_info();
+
+        BOOST_CHECK(certs_info.has_value() && !certs_info.value().empty());
+        BOOST_CHECK(trust_list_info.has_value() && trust_list_info.value().empty()); // no trust file was configured on the builder
+        BOOST_CHECK(!trust_file_contents.has_value());
+
+    }).get();
+
+    BOOST_CHECK(certs != nullptr);
+
+    auto certs_info = certs->get_cert_info(); // same checks on the initially built credentials
+    auto trust_list_info = certs->get_trust_list_info();
+
+    BOOST_CHECK(certs_info.has_value() && !certs_info.value().empty());
+    BOOST_CHECK(trust_list_info.has_value());
+    BOOST_CHECK(!b.get_trust_file_blob().has_value());
+
+    fs::copy_file(certfile("test.crt"), tmp.path() / "test0.crt"); // stage the replacement pair next to the files in use
+    fs::copy_file(certfile("test.key"), tmp.path() / "test0.key");
+
+    rename_file((tmp.path() / "test0.crt").native(), (tmp.path() / "test.crt").native()).get(); // swap the staged pair in via rename
+    rename_file((tmp.path() / "test0.key").native(), (tmp.path() / "test.key").native()).get();
+
+    p.get_future().get(); // blocks until the callback has seen both files
+
+    BOOST_CHECK(!changed.empty());
+}
+
 SEASTAR_THREAD_TEST_CASE(test_reload_broken_certificates) {
     tmpdir tmp;