Skip to content

Commit f4623c8

Browse files
committed
ct/frontend: allow concurrent requests per producer
Currently, we can only upload a single batch from a producer at a time in order to preserve the ordering of requests into rm_stm for idempotency. That is undesirable for both latency and cost (of S3 uploads). To fix this, mark requests as enqueued before they are uploaded to S3, but record their order. Once a request's upload completes, we re-establish the ordering of batches so that rm_stm still sees requests in the order required for idempotency.
1 parent 06f0d15 commit f4623c8

File tree

1 file changed

+19
-10
lines changed

1 file changed

+19
-10
lines changed

src/v/cloud_topics/frontend/frontend.cc

Lines changed: 19 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -542,11 +542,16 @@ ss::future<> bg_upload_and_replicate(
542542
bool cache_enabled) {
543543
vassert(api != nullptr, "cloud topics api is not initialized");
544544

545+
auto ticket = op->ctp_stm_api->producer_queue().reserve(
546+
op->batch_id.pid.get_id());
547+
// Now that we've acquired our ticket and determined our ordering, we can
548+
// say that the request is enqueued and get more produce requests.
549+
op->request_enqueued.set_value();
550+
545551
auto fallback = ss::defer([op] {
546552
// This guarantees that the promises are set.
547553
// The error code used here does not represent the
548554
// actual error.
549-
op->request_enqueued.set_value();
550555
op->replicate_finished.set_value(raft::errc::timeout);
551556
});
552557

@@ -568,6 +573,7 @@ ss::future<> bg_upload_and_replicate(
568573
if (cache_enabled) {
569574
rb_copy = clone_batches(op->batches);
570575
}
576+
571577
auto timeout = op->timeout == 0ms ? L0_upload_default_timeout : op->timeout;
572578
auto res = co_await api->write_and_debounce(
573579
op->ntp,
@@ -614,26 +620,29 @@ ss::future<> bg_upload_and_replicate(
614620

615621
chunked_vector<model::record_batch_header> headers;
616622
headers.push_back(header);
617-
auto placeholders = co_await convert_to_placeholders(
618-
res.value(), std::move(headers));
623+
auto placeholders = co_await convert_to_placeholders(res.value(), headers);
619624

620625
vassert(
621626
placeholders.batches.size() == 1,
622627
"Expected single batch, got {}",
623628
placeholders.batches.size());
624-
625-
// Replicate
629+
// Wait for all previous requests from this producer to be processed
630+
co_await ticket.redeem();
631+
// Replicate now that our ticket is redeemed
626632
op->opts = update_replicate_options(op->opts, fence.term);
627633
auto replicate_stages = partition->replicate_in_stages(
628634
op->batch_id, std::move(placeholders.batches.front()), op->opts);
629635

630636
fallback.cancel();
631637

632-
// Forward future result to the 'op'. The expectation is that at this point
633-
// the target promises (inside 'op') are used to generate futures and these
634-
// futures are awaited.
635-
replicate_stages.request_enqueued.forward_to(
636-
std::move(op->request_enqueued));
638+
// Once the request is enqueued in raft and our order is guaranteed we can
639+
// release our ticket and further requests can be enqueued into the raft
640+
// layer.
641+
ssx::background = replicate_stages.request_enqueued.then_wrapped(
642+
[t = std::move(ticket)](ss::future<> fut) mutable {
643+
t.release();
644+
fut.ignore_ready_future();
645+
});
637646

638647
auto replicate_fut
639648
= std::move(replicate_stages.replicate_finished)

0 commit comments

Comments
 (0)