
Commit a131a99

Merge pull request #29538 from andrwng/ct-metastore-flush-loop
ct: add loop for flushing metastore
2 parents df71e82 + 18c48c5 commit a131a99

22 files changed, +372 -33 lines changed

src/v/cloud_topics/BUILD

Lines changed: 13 additions & 0 deletions
@@ -24,6 +24,18 @@ redpanda_cc_library(
     ],
 )

+redpanda_cc_library(
+    name = "test_fixture_cfg",
+    hdrs = [
+        "test_fixture_cfg.h",
+    ],
+    visibility = [
+        "//src/v/cloud_topics/tests:__pkg__",
+        "//src/v/redpanda:__pkg__",
+        "//src/v/redpanda/tests:__pkg__",
+    ],
+)
+
 redpanda_cc_library(
     name = "types",
     srcs = [
@@ -80,6 +92,7 @@ redpanda_cc_library(
         ":cluster_services_interface",
         ":data_plane_impl",
         "//src/v/cloud_topics/housekeeper:manager",
+        "//src/v/cloud_topics/level_one/metastore:flush_loop",
         "//src/v/cloud_topics/level_one/metastore:topic_purger",
         "//src/v/cloud_topics/level_zero/gc:level_zero_gc",
         "//src/v/cloud_topics/manager",

src/v/cloud_topics/app.cc

Lines changed: 30 additions & 1 deletion
@@ -15,6 +15,7 @@
 #include "cloud_topics/data_plane_impl.h"
 #include "cloud_topics/housekeeper/manager.h"
 #include "cloud_topics/level_one/compaction/scheduler.h"
+#include "cloud_topics/level_one/metastore/flush_loop.h"
 #include "cloud_topics/level_one/metastore/topic_purger.h"
 #include "cloud_topics/level_zero/gc/level_zero_gc.h"
 #include "cloud_topics/manager/manager.h"
@@ -45,7 +46,8 @@ ss::future<> app::construct(
   ss::sharded<cluster::metadata_cache>* metadata_cache,
   ss::sharded<rpc::connection_cache>* connection_cache,
   cloud_storage_clients::bucket_name bucket,
-  ss::sharded<storage::api>* storage) {
+  ss::sharded<storage::api>* storage,
+  bool skip_flush_loop) {
     data_plane = co_await make_data_plane(
       ssx::sformat("{}::data_plane", _logger_name),
       remote,
@@ -103,6 +105,13 @@ ss::future<> app::construct(
       &controller->get_topics_state(),
       &controller->get_topics_frontend());

+    if (!skip_flush_loop) {
+        co_await construct_service(
+          flush_loop_manager, ss::sharded_parameter([this] {
+              return &replicated_metastore.local();
+          }));
+    }
+
     co_await construct_service(
       reconciler,
       ss::sharded_parameter([this] { return &l1_io.local(); }),
@@ -153,6 +162,10 @@ ss::future<> app::start() {
     co_await housekeeper_manager.invoke_on_all(&housekeeper_manager::start);
     co_await compaction_scheduler->start();
     co_await l0_gc.invoke_on_all(&level_zero_gc::start);
+    if (flush_loop_manager.local_is_initialized()) {
+        co_await flush_loop_manager.invoke_on_all(
+          &l1::flush_loop_manager::start);
+    }

     // When start is called, we must have registered all the callbacks before
     // this as starting the manager will invoke callbacks for partitions already
@@ -175,6 +188,22 @@ ss::future<> app::wire_up_notifications() {
              purge_mgr.enqueue_loop_reset(needs_loop);
          });
    });
+    if (flush_loop_manager.local_is_initialized()) {
+        co_await flush_loop_manager.invoke_on_all([this](auto& flm) {
+            manager.local().on_l1_domain_leader(
+              [&flm](
+                const model::ntp& ntp,
+                const auto&,
+                const auto& partition) noexcept {
+                  if (ntp.tp.partition != model::partition_id{0}) {
+                      return;
+                  }
+                  auto needs_loop = l1::flush_loop_manager::needs_loop{
+                    bool(partition)};
+                  flm.enqueue_loop_reset(needs_loop);
+              });
+        });
+    }
     co_await housekeeper_manager.invoke_on_all([this](auto& hm) {
         manager.local().on_ctp_partition_leader(
           [&hm](

src/v/cloud_topics/app.h

Lines changed: 4 additions & 1 deletion
@@ -40,6 +40,7 @@ class level_zero_gc;
 class housekeeper_manager;

 namespace l1 {
+class flush_loop_manager;
 class topic_purger_manager;
 } // namespace l1

@@ -63,7 +64,8 @@ class app : public ssx::sharded_service_container {
       ss::sharded<cluster::metadata_cache>*,
       ss::sharded<rpc::connection_cache>*,
       cloud_storage_clients::bucket_name,
-      ss::sharded<storage::api>*);
+      ss::sharded<storage::api>*,
+      bool skip_flush_loop = false);

     ss::future<> start();

@@ -92,6 +94,7 @@ class app : public ssx::sharded_service_container {
     ss::sharded<l1::domain_supervisor> domain_supervisor;
     ss::sharded<l1::leader_router> l1_metastore_router;
     ss::sharded<l1::topic_purger_manager> topic_purge_manager;
+    ss::sharded<l1::flush_loop_manager> flush_loop_manager;
     ss::sharded<cloud_topics_manager> manager;
     ss::sharded<level_zero_gc> l0_gc;
     ss::sharded<housekeeper_manager> housekeeper_manager;

src/v/cloud_topics/level_one/metastore/BUILD

Lines changed: 24 additions & 0 deletions
@@ -349,6 +349,30 @@ redpanda_cc_library(
     ],
 )

+redpanda_cc_library(
+    name = "flush_loop",
+    srcs = [
+        "flush_loop.cc",
+    ],
+    hdrs = [
+        "flush_loop.h",
+    ],
+    implementation_deps = [
+        ":metastore",
+        "//src/v/base",
+        "//src/v/cloud_topics:logger",
+        "//src/v/config",
+        "//src/v/ssx:semaphore",
+        "//src/v/ssx:time",
+    ],
+    visibility = ["//visibility:public"],
+    deps = [
+        "//src/v/base",
+        "//src/v/ssx:actor",
+        "@seastar",
+    ],
+)
+
 redpanda_cc_library(
     name = "extent_metadata_reader",
     srcs = [

src/v/cloud_topics/level_one/metastore/flush_loop.cc

Lines changed: 153 additions & 0 deletions
@@ -0,0 +1,153 @@
+/*
+ * Copyright 2026 Redpanda Data, Inc.
+ *
+ * Licensed as a Redpanda Enterprise file under the Redpanda Community
+ * License (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * https://github.com/redpanda-data/redpanda/blob/master/licenses/rcl.md
+ */
+#include "cloud_topics/level_one/metastore/flush_loop.h"
+
+#include "base/vlog.h"
+#include "cloud_topics/level_one/metastore/metastore.h"
+#include "cloud_topics/logger.h"
+#include "config/configuration.h"
+#include "ssx/semaphore.h"
+#include "ssx/time.h"
+
+namespace cloud_topics::l1 {
+
+// Loop that flushes the metastore periodically until stopped.
+class flush_loop {
+public:
+    explicit flush_loop(
+      metastore* metastore,
+      config::binding<std::chrono::milliseconds> flush_interval)
+      : metastore_(metastore)
+      , flush_interval_(std::move(flush_interval)) {
+        flush_interval_.watch([this] { sem_.signal(); });
+    }
+
+    void start() {
+        ssx::spawn_with_gate(gate_, [this] { return run_loop(); });
+    }
+
+    ss::future<> stop_and_wait() {
+        vlog(cd_log.debug, "Metastore flush loop stopping...");
+        as_.request_abort();
+        sem_.broken();
+        co_await gate_.close();
+        vlog(cd_log.debug, "Metastore flush loop stopped");
+    }
+
+private:
+    ss::future<> run_loop() {
+        const auto retry_interval = ssx::duration::seconds(10);
+        while (!as_.abort_requested()) {
+            auto start = ssx::instant::from_chrono(ss::lowres_clock::now());
+            auto res = co_await metastore_->flush();
+            auto finish = ssx::instant::from_chrono(ss::lowres_clock::now());
+
+            ssx::duration sleep_duration;
+            if (!res.has_value()) {
+                vlog(
+                  cd_log.warn,
+                  "Failed to flush metastore, retrying in {}: {}",
+                  retry_interval,
+                  res.error());
+                sleep_duration = retry_interval;
+            } else {
+                auto flush_interval = ssx::duration::from_chrono(
+                  flush_interval_());
+                auto flush_time = finish - start;
+                sleep_duration = flush_interval - flush_time;
+            }
+
+            if (sleep_duration > ssx::duration::zero()) {
+                try {
+                    co_await sem_.wait(
+                      sleep_duration.to_chrono<std::chrono::milliseconds>(),
+                      std::max(sem_.current(), size_t(1)));
+                } catch (const ss::semaphore_timed_out&) {
+                    // Time to wake up! Continue onto the next iteration.
+                } catch (...) {
+                    auto eptr = std::current_exception();
+                    auto log_lvl = ssx::is_shutdown_exception(eptr)
+                                     ? ss::log_level::debug
+                                     : ss::log_level::warn;
+                    vlogl(
+                      cd_log,
+                      log_lvl,
+                      "Metastore flush loop hit exception while sleeping: {}",
+                      eptr);
+                }
+            }
+        }
+    }
+
+    ss::gate gate_;
+    ss::abort_source as_;
+    metastore* metastore_;
+    config::binding<std::chrono::milliseconds> flush_interval_;
+    ssx::semaphore sem_{0, "flush_loop"};
+};
+
+flush_loop_manager::flush_loop_manager(metastore* metastore)
+  : metastore_(metastore) {}
+
+flush_loop_manager::~flush_loop_manager() = default;
+
+ss::future<> flush_loop_manager::reset_flush_loop(
+  flush_loop_manager::needs_loop needs_loop) {
+    if (!needs_loop) {
+        // We should not have a running loop. Stop it if one exists.
+        if (flush_loop_) {
+            auto loop = std::exchange(flush_loop_, nullptr);
+            auto stop_fut = co_await ss::coroutine::as_future(
+              loop->stop_and_wait());
+            if (stop_fut.failed()) {
+                auto ex = stop_fut.get_exception();
+                vlog(cd_log.error, "Stopping flush loop failed: {}", ex);
+            }
+        }
+        co_return;
+    }
+    if (flush_loop_) {
+        // We need a loop and already have one.
+        co_return;
+    }
+    auto loop = std::make_unique<flush_loop>(
+      metastore_,
+      config::shard_local_cfg().cloud_topics_long_term_flush_interval.bind());
+    loop->start();
+    flush_loop_ = std::move(loop);
+}
+
+void flush_loop_manager::enqueue_loop_reset(
+  flush_loop_manager::needs_loop needs_loop) {
+    tell(needs_loop);
+}
+
+ss::future<>
+flush_loop_manager::process(flush_loop_manager::needs_loop needs_loop) {
+    return reset_flush_loop(needs_loop);
+}
+
+void flush_loop_manager::on_error(std::exception_ptr ex) noexcept {
+    vlog(cd_log.error, "Unexpected flush loop manager error: {}", ex);
+}
+
+ss::future<> flush_loop_manager::stop() {
+    co_await actor::stop();
+    if (flush_loop_) {
+        auto fut = co_await ss::coroutine::as_future(
+          flush_loop_->stop_and_wait());
+        if (fut.failed()) {
+            auto ex = fut.get_exception();
+            vlog(cd_log.error, "Error stopping flush loop manager: {}", ex);
+        }
+    }
+}
+
+} // namespace cloud_topics::l1
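
A note on run_loop() above: the loop is drift-compensated, in that the time a flush took is subtracted from the configured interval before sleeping, and a failed flush falls back to a fixed 10-second retry. A minimal standalone sketch of that cadence arithmetic in plain std::chrono (illustrative only; next_sleep and its parameters are hypothetical names, not part of this commit):

#include <algorithm>
#include <chrono>

// Sketch: decide how long the flush loop sleeps before its next attempt.
// Mirrors run_loop(): a failed flush retries on a fixed backoff; a successful
// flush sleeps for the configured interval minus the time the flush took.
std::chrono::milliseconds next_sleep(
  std::chrono::milliseconds flush_interval,
  std::chrono::milliseconds flush_took,
  bool flush_failed) {
    constexpr auto retry_interval = std::chrono::seconds(10);
    if (flush_failed) {
        return retry_interval;
    }
    // If the flush took longer than the interval, go again immediately
    // (run_loop() skips the sleep entirely when the duration is <= 0).
    return std::max(flush_interval - flush_took, std::chrono::milliseconds{0});
}

// Example: a 60s interval with a 10s flush sleeps 50s, so flushes start
// roughly every flush_interval rather than every interval-plus-flush-time.

The sleep itself is an ssx::semaphore wait with a timeout: sem_.broken() on shutdown and the config watch's sem_.signal() on a cloud_topics_long_term_flush_interval change both wake the loop immediately instead of waiting out the remaining interval.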

src/v/cloud_topics/level_one/metastore/flush_loop.h

Lines changed: 62 additions & 0 deletions
@@ -0,0 +1,62 @@
+/*
+ * Copyright 2026 Redpanda Data, Inc.
+ *
+ * Licensed as a Redpanda Enterprise file under the Redpanda Community
+ * License (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * https://github.com/redpanda-data/redpanda/blob/master/licenses/rcl.md
+ */
+#pragma once
+
+#include "base/seastarx.h"
+#include "ssx/actor.h"
+
+#include <seastar/core/future.hh>
+
+#include <memory>
+
+namespace cloud_topics::l1 {
+
+class metastore;
+class flush_loop;
+
+// Manages a loop to flush the metastore that runs only on leadership of
+// partition 0 of the metastore topic. Under the hood, each flush will request
+// flushes of each partition, so it's sufficient to only run this on one
+// partition.
+//
+// TODO: it may be worth having each domain independently flush (e.g. if
+// there's a lull in traffic), and then have this loop request flushes if there
+// hasn't been a domain flush within some time bound. Giving some control to
+// individual domain could help us avoid potential added latencies that may
+// come from flushing while the domain is serving a high volume of requests.
+class flush_loop_manager
+  : public ssx::actor<
+      ss::bool_class<struct flush_needs_loop_tag>,
+      1,
+      ssx::overflow_policy::drop_oldest> {
+public:
+    using needs_loop = ss::bool_class<struct flush_needs_loop_tag>;
+
+    explicit flush_loop_manager(metastore* metastore);
+    ~flush_loop_manager() override;
+
+    // Enqueues a reset of the loop such that eventually a flush_loop will be
+    // running if needs_loop is true, or not running if false.
+    void enqueue_loop_reset(needs_loop needs);
+
+    ss::future<> stop() override;
+
+protected:
+    ss::future<> process(needs_loop needs) override;
+    void on_error(std::exception_ptr ex) noexcept override;
+
+private:
+    ss::future<> reset_flush_loop(needs_loop needs);
+
+    metastore* metastore_;
+    std::unique_ptr<flush_loop> flush_loop_;
+};
+
+} // namespace cloud_topics::l1
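
As the class comment above says, the loop should run only on the leader of partition 0 of the metastore topic; the actor base with queue depth 1 and drop_oldest presumably keeps just the latest leadership state, so rapid leadership flaps collapse into a single reset. A condensed sketch of the wiring, lifted from the app.cc hunk earlier in this commit (the on_l1_domain_leader callback shape is taken from that hunk, not new API):

// Leadership notification for an L1 domain partition: only partition 0 is
// relevant, and `partition` is presumably non-null only while this node is
// leader, which is what bool(partition) encodes.
manager.local().on_l1_domain_leader(
  [&flm](const model::ntp& ntp, const auto&, const auto& partition) noexcept {
      if (ntp.tp.partition != model::partition_id{0}) {
          return;
      }
      flm.enqueue_loop_reset(
        l1::flush_loop_manager::needs_loop{bool(partition)});
  });

enqueue_loop_reset() only enqueues the request (it calls tell()); the actual start or stop happens later in process() via reset_flush_loop(), so the callback itself stays noexcept and does no asynchronous work.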

src/v/cloud_topics/level_one/metastore/tests/replicated_metastore_test.cc

Lines changed: 9 additions & 2 deletions
@@ -41,9 +41,16 @@ class ReplicatedMetastoreTest

     bool is_lsm_backend() const { return GetParam() == metastore_backend::lsm; }

+    cloud_topics::test_fixture_cfg fixture_cfg() const {
+        return {
+          .use_lsm_metastore = is_lsm_backend(),
+          // Skip flushing since tests may exercise flushing.
+          .skip_flush_loop = true,
+        };
+    }
     void SetUp() override {
         for (size_t i = 0; i < num_brokers; i++) {
-            add_node(is_lsm_backend());
+            add_node(fixture_cfg());
         }
         wait_for_all_members(5s).get();
     }
@@ -1007,7 +1014,7 @@ TEST_P(ReplicatedMetastoreTest, TestBasicFlushAndRestore) {
     // Restart all nodes.
     // NOTE: the added nodes get the same node IDs 0, 1, 2.
     for (size_t i = 0; i < num_brokers; i++) {
-        add_node(is_lsm_backend());
+        add_node(fixture_cfg());
     }
     wait_for_all_members(5s).get();
