Compare commits

..

10 Commits

Author SHA1 Message Date
5dccbbc9d1 v25.11.23
Some checks failed
Default (tags) / security (push) Failing after 1s
Default (tags) / test (push) Failing after 1s
Default (tags) / release (push) Has been skipped
Default (tags) / metadata (push) Has been skipped
2026-03-17 12:22:51 +00:00
92d7113c6c fix(rustproxy-http,rustproxy-metrics): reduce per-frame metrics overhead by batching body byte accounting 2026-03-17 12:22:51 +00:00
8f6bb30367 v25.11.22
Some checks failed
Default (tags) / security (push) Failing after 1s
Default (tags) / test (push) Failing after 1s
Default (tags) / release (push) Has been skipped
Default (tags) / metadata (push) Has been skipped
2026-03-17 12:12:24 +00:00
ef9bac80ff fix(rustproxy-http): reuse healthy HTTP/2 upstream connections after requests with bodies 2026-03-17 12:12:24 +00:00
9c78701038 v25.11.21
Some checks failed
Default (tags) / security (push) Failing after 1s
Default (tags) / test (push) Failing after 1s
Default (tags) / release (push) Has been skipped
Default (tags) / metadata (push) Has been skipped
2026-03-17 11:33:34 +00:00
26fd9409a7 fix(rustproxy-http): reuse pooled HTTP/2 connections for requests with and without bodies 2026-03-17 11:33:34 +00:00
cfff128499 v25.11.20
Some checks failed
Default (tags) / security (push) Failing after 1s
Default (tags) / test (push) Failing after 1s
Default (tags) / release (push) Has been skipped
Default (tags) / metadata (push) Has been skipped
2026-03-17 01:32:35 +00:00
3baff354bd fix(rustproxy-http): avoid downgrading cached backend protocol on H2 stream errors 2026-03-17 01:32:35 +00:00
c2eacd1b30 v25.11.19
Some checks failed
Default (tags) / security (push) Failing after 1s
Default (tags) / test (push) Failing after 2s
Default (tags) / release (push) Has been skipped
Default (tags) / metadata (push) Has been skipped
2026-03-16 20:53:39 +00:00
1fdbfcf0aa fix(rustproxy-http): avoid reusing pooled HTTP/2 connections for requests with bodies to prevent upload flow-control stalls 2026-03-16 20:53:39 +00:00
6 changed files with 128 additions and 67 deletions

View File

@@ -1,5 +1,37 @@
# Changelog # Changelog
## 2026-03-17 - 25.11.23 - fix(rustproxy-http,rustproxy-metrics)
reduce per-frame metrics overhead by batching body byte accounting
- Buffer HTTP body byte counts and flush them every 64 KB, at end of stream, and on drop to keep totals accurate while preserving throughput sampling.
- Skip zero-value counter updates in metrics collection to avoid unnecessary atomic and DashMap operations for the unused direction.
## 2026-03-17 - 25.11.22 - fix(rustproxy-http)
reuse healthy HTTP/2 upstream connections after requests with bodies
- Registers successful HTTP/2 connections in the pool regardless of whether the proxied request included a body
- Continues to avoid pooling upstream connections that returned 502 Bad Gateway responses
## 2026-03-17 - 25.11.21 - fix(rustproxy-http)
reuse pooled HTTP/2 connections for requests with and without bodies
- remove the bodyless-request restriction from HTTP/2 pool checkout
- always return successful HTTP/2 senders to the connection pool after requests
## 2026-03-17 - 25.11.20 - fix(rustproxy-http)
avoid downgrading cached backend protocol on H2 stream errors
- Treat HTTP/2 stream-level failures as retryable request errors instead of evidence that the backend only supports HTTP/1.1
- Keep protocol cache entries unchanged after successful H2 handshakes so future requests continue using HTTP/2
- Lower log severity for this fallback path from warning to debug while still recording backend H2 failure metrics
## 2026-03-16 - 25.11.19 - fix(rustproxy-http)
avoid reusing pooled HTTP/2 connections for requests with bodies to prevent upload flow-control stalls
- Limit HTTP/2 pool checkout to bodyless requests such as GET, HEAD, and DELETE
- Skip re-registering HTTP/2 connections in the pool after requests that send a body
- Prevent stalled uploads caused by depleted connection-level flow control windows on reused HTTP/2 connections
## 2026-03-16 - 25.11.18 - fix(repo) ## 2026-03-16 - 25.11.18 - fix(repo)
no changes to commit no changes to commit

View File

@@ -1,6 +1,6 @@
{ {
"name": "@push.rocks/smartproxy", "name": "@push.rocks/smartproxy",
"version": "25.11.18", "version": "25.11.23",
"private": false, "private": false,
"description": "A powerful proxy package with unified route-based configuration for high traffic management. Features include SSL/TLS support, flexible routing patterns, WebSocket handling, advanced security options, and automatic ACME certificate management.", "description": "A powerful proxy package with unified route-based configuration for high traffic management. Features include SSL/TLS support, flexible routing patterns, WebSocket handling, advanced security options, and automatic ACME certificate management.",
"main": "dist_ts/index.js", "main": "dist_ts/index.js",

View File

@@ -9,10 +9,17 @@ use bytes::Bytes;
use http_body::Frame; use http_body::Frame;
use rustproxy_metrics::MetricsCollector; use rustproxy_metrics::MetricsCollector;
/// Flush accumulated bytes to the metrics collector every 64 KB.
/// This reduces per-frame DashMap shard-locked reads from ~15 to ~1 per 4 frames
/// (assuming typical 16 KB upload frames). The 1 Hz throughput sampler still sees
/// data within one sampling period even at low transfer rates.
const BYTE_FLUSH_THRESHOLD: u64 = 65_536;
/// Wraps any `http_body::Body` and counts data bytes passing through. /// Wraps any `http_body::Body` and counts data bytes passing through.
/// ///
/// Each chunk is reported to the `MetricsCollector` immediately so that /// Bytes are accumulated and flushed to the `MetricsCollector` every
/// the throughput tracker (sampled at 1 Hz) reflects real-time data flow. /// [`BYTE_FLUSH_THRESHOLD`] bytes (and on Drop) so the throughput tracker
/// (sampled at 1 Hz) reflects real-time data flow without per-frame overhead.
/// ///
/// The inner body is pinned on the heap to support `!Unpin` types like `hyper::body::Incoming`. /// The inner body is pinned on the heap to support `!Unpin` types like `hyper::body::Incoming`.
pub struct CountingBody<B> { pub struct CountingBody<B> {
@@ -22,6 +29,8 @@ pub struct CountingBody<B> {
source_ip: Option<String>, source_ip: Option<String>,
/// Whether we count bytes as "in" (request body) or "out" (response body). /// Whether we count bytes as "in" (request body) or "out" (response body).
direction: Direction, direction: Direction,
/// Accumulated bytes not yet flushed to the metrics collector.
pending_bytes: u64,
/// Optional connection-level activity tracker. When set, poll_frame updates this /// Optional connection-level activity tracker. When set, poll_frame updates this
/// to keep the idle watchdog alive during active body streaming (uploads/downloads). /// to keep the idle watchdog alive during active body streaming (uploads/downloads).
connection_activity: Option<Arc<AtomicU64>>, connection_activity: Option<Arc<AtomicU64>>,
@@ -57,6 +66,7 @@ impl<B> CountingBody<B> {
route_id, route_id,
source_ip, source_ip,
direction, direction,
pending_bytes: 0,
connection_activity: None, connection_activity: None,
activity_start: None, activity_start: None,
active_requests: None, active_requests: None,
@@ -81,14 +91,19 @@ impl<B> CountingBody<B> {
self self
} }
/// Report a chunk of bytes immediately to the metrics collector. /// Flush accumulated bytes to the metrics collector.
#[inline] #[inline]
fn report_chunk(&self, len: u64) { fn flush_pending(&mut self) {
if self.pending_bytes == 0 {
return;
}
let bytes = self.pending_bytes;
self.pending_bytes = 0;
let route_id = self.route_id.as_deref(); let route_id = self.route_id.as_deref();
let source_ip = self.source_ip.as_deref(); let source_ip = self.source_ip.as_deref();
match self.direction { match self.direction {
Direction::In => self.metrics.record_bytes(len, 0, route_id, source_ip), Direction::In => self.metrics.record_bytes(bytes, 0, route_id, source_ip),
Direction::Out => self.metrics.record_bytes(0, len, route_id, source_ip), Direction::Out => self.metrics.record_bytes(0, bytes, route_id, source_ip),
} }
} }
} }
@@ -113,9 +128,12 @@ where
Poll::Ready(Some(Ok(frame))) => { Poll::Ready(Some(Ok(frame))) => {
if let Some(data) = frame.data_ref() { if let Some(data) = frame.data_ref() {
let len = data.len() as u64; let len = data.len() as u64;
// Report bytes immediately so the 1 Hz throughput sampler sees them this.pending_bytes += len;
this.report_chunk(len); if this.pending_bytes >= BYTE_FLUSH_THRESHOLD {
// Keep the connection-level idle watchdog alive during body streaming this.flush_pending();
}
// Keep the connection-level idle watchdog alive on every frame
// (this is just one atomic store — cheap enough per-frame)
if let (Some(activity), Some(start)) = (&this.connection_activity, &this.activity_start) { if let (Some(activity), Some(start)) = (&this.connection_activity, &this.activity_start) {
activity.store(start.elapsed().as_millis() as u64, Ordering::Relaxed); activity.store(start.elapsed().as_millis() as u64, Ordering::Relaxed);
} }
@@ -123,7 +141,11 @@ where
Poll::Ready(Some(Ok(frame))) Poll::Ready(Some(Ok(frame)))
} }
Poll::Ready(Some(Err(e))) => Poll::Ready(Some(Err(e))), Poll::Ready(Some(Err(e))) => Poll::Ready(Some(Err(e))),
Poll::Ready(None) => Poll::Ready(None), Poll::Ready(None) => {
// End of stream — flush any remaining bytes
this.flush_pending();
Poll::Ready(None)
}
Poll::Pending => Poll::Pending, Poll::Pending => Poll::Pending,
} }
} }
@@ -139,6 +161,8 @@ where
impl<B> Drop for CountingBody<B> { impl<B> Drop for CountingBody<B> {
fn drop(&mut self) { fn drop(&mut self) {
// Flush any remaining accumulated bytes so totals stay accurate
self.flush_pending();
// Decrement the active-request counter so the HTTP idle watchdog // Decrement the active-request counter so the HTTP idle watchdog
// knows this response body is no longer streaming. // knows this response body is no longer streaming.
if let Some(ref counter) = self.active_requests { if let Some(ref counter) = self.active_requests {

View File

@@ -677,11 +677,9 @@ impl HttpProxyService {
h2: use_h2, h2: use_h2,
}; };
// H2 pool checkout with async readiness validation. // H2 pool checkout — reuse pooled connections for all requests.
// checkout_h2 does synchronous is_closed()/is_ready() checks, but these // The h2 crate properly replenishes connection-level flow control
// reflect cached state — the H2 connection driver (a separate tokio task) // windows via release_capacity() as data is consumed.
// may not have processed a pending GOAWAY/RST yet. The ready().await
// forces the runtime to yield, giving the driver a chance to detect failures.
if use_h2 { if use_h2 {
if let Some((mut sender, age)) = self.connection_pool.checkout_h2(&pool_key) { if let Some((mut sender, age)) = self.connection_pool.checkout_h2(&pool_key) {
match tokio::time::timeout( match tokio::time::timeout(
@@ -1040,7 +1038,6 @@ impl HttpProxyService {
}); });
} }
// Clone sender for potential pool registration; register only after first request succeeds
let sender_for_pool = sender.clone(); let sender_for_pool = sender.clone();
let result = self.forward_h2_with_sender(sender, parts, body, upstream_headers, upstream_path, route, route_id, source_ip, Some(pool_key), domain, conn_activity).await; let result = self.forward_h2_with_sender(sender, parts, body, upstream_headers, upstream_path, route, route_id, source_ip, Some(pool_key), domain, conn_activity).await;
if matches!(&result, Ok(ref resp) if resp.status() != StatusCode::BAD_GATEWAY) { if matches!(&result, Ok(ref resp) if resp.status() != StatusCode::BAD_GATEWAY) {
@@ -1369,29 +1366,24 @@ impl HttpProxyService {
match sender.send_request(upstream_req).await { match sender.send_request(upstream_req).await {
Ok(upstream_response) => { Ok(upstream_response) => {
// H2 works! Register sender in pool for multiplexed reuse
let g = self.connection_pool.register_h2(pool_key.clone(), sender); let g = self.connection_pool.register_h2(pool_key.clone(), sender);
gen_holder.store(g, std::sync::atomic::Ordering::Relaxed); gen_holder.store(g, std::sync::atomic::Ordering::Relaxed);
self.build_streaming_response(upstream_response, route, route_id, source_ip, conn_activity).await self.build_streaming_response(upstream_response, route, route_id, source_ip, conn_activity).await
} }
Err(e) => { Err(e) => {
// H2 request failed — backend advertises h2 via ALPN but doesn't // H2 request failed on a stream level (e.g. RST_STREAM PROTOCOL_ERROR).
// actually speak it. Update cache so future requests use H1. // The H2 handshake succeeded, so the backend genuinely speaks H2 — don't
// poison the protocol cache. Only handshake-level failures (below) should
// downgrade the cache to H1.
let bk = format!("{}:{}", upstream.host, upstream.port); let bk = format!("{}:{}", upstream.host, upstream.port);
warn!( debug!(
backend = %bk, backend = %bk,
domain = %domain, domain = %domain,
error = %e, error = %e,
error_debug = ?e, error_debug = ?e,
"Auto-detect: H2 request failed, falling back to H1" "H2 stream error, retrying this request as H1"
); );
self.metrics.backend_h2_failure(&bk); self.metrics.backend_h2_failure(&bk);
let cache_key = crate::protocol_cache::ProtocolCacheKey {
host: upstream.host.clone(),
port: upstream.port,
requested_host: requested_host.clone(),
};
self.protocol_cache.insert(cache_key, crate::protocol_cache::DetectedProtocol::H1);
// Retry as H1 for bodyless requests; return 502 for requests with bodies // Retry as H1 for bodyless requests; return 502 for requests with bodies
if let Some((method, headers)) = retry_state { if let Some((method, headers)) = retry_state {

View File

@@ -259,40 +259,49 @@ impl MetricsCollector {
/// Called per-chunk in the TCP copy loop. Only touches AtomicU64 counters — /// Called per-chunk in the TCP copy loop. Only touches AtomicU64 counters —
/// no Mutex is taken. The throughput trackers are fed during `sample_all()`. /// no Mutex is taken. The throughput trackers are fed during `sample_all()`.
pub fn record_bytes(&self, bytes_in: u64, bytes_out: u64, route_id: Option<&str>, source_ip: Option<&str>) { pub fn record_bytes(&self, bytes_in: u64, bytes_out: u64, route_id: Option<&str>, source_ip: Option<&str>) {
self.total_bytes_in.fetch_add(bytes_in, Ordering::Relaxed); // Short-circuit: only touch counters for the direction that has data.
self.total_bytes_out.fetch_add(bytes_out, Ordering::Relaxed); // CountingBody always calls with one direction zero — skipping the zero
// direction avoids ~50% of DashMap shard-locked reads per call.
// Accumulate into lock-free pending throughput counters if bytes_in > 0 {
self.global_pending_tp_in.fetch_add(bytes_in, Ordering::Relaxed); self.total_bytes_in.fetch_add(bytes_in, Ordering::Relaxed);
self.global_pending_tp_out.fetch_add(bytes_out, Ordering::Relaxed); self.global_pending_tp_in.fetch_add(bytes_in, Ordering::Relaxed);
}
if bytes_out > 0 {
self.total_bytes_out.fetch_add(bytes_out, Ordering::Relaxed);
self.global_pending_tp_out.fetch_add(bytes_out, Ordering::Relaxed);
}
// Per-route tracking: use get() first (zero-alloc fast path for existing entries), // Per-route tracking: use get() first (zero-alloc fast path for existing entries),
// fall back to entry() with to_string() only on the rare first-chunk miss. // fall back to entry() with to_string() only on the rare first-chunk miss.
if let Some(route_id) = route_id { if let Some(route_id) = route_id {
if let Some(counter) = self.route_bytes_in.get(route_id) { if bytes_in > 0 {
counter.fetch_add(bytes_in, Ordering::Relaxed); if let Some(counter) = self.route_bytes_in.get(route_id) {
} else { counter.fetch_add(bytes_in, Ordering::Relaxed);
self.route_bytes_in.entry(route_id.to_string()) } else {
.or_insert_with(|| AtomicU64::new(0)) self.route_bytes_in.entry(route_id.to_string())
.fetch_add(bytes_in, Ordering::Relaxed); .or_insert_with(|| AtomicU64::new(0))
.fetch_add(bytes_in, Ordering::Relaxed);
}
} }
if let Some(counter) = self.route_bytes_out.get(route_id) { if bytes_out > 0 {
counter.fetch_add(bytes_out, Ordering::Relaxed); if let Some(counter) = self.route_bytes_out.get(route_id) {
} else { counter.fetch_add(bytes_out, Ordering::Relaxed);
self.route_bytes_out.entry(route_id.to_string()) } else {
.or_insert_with(|| AtomicU64::new(0)) self.route_bytes_out.entry(route_id.to_string())
.fetch_add(bytes_out, Ordering::Relaxed); .or_insert_with(|| AtomicU64::new(0))
.fetch_add(bytes_out, Ordering::Relaxed);
}
} }
// Accumulate into per-route pending throughput counters (lock-free) // Accumulate into per-route pending throughput counters (lock-free)
if let Some(entry) = self.route_pending_tp.get(route_id) { if let Some(entry) = self.route_pending_tp.get(route_id) {
entry.0.fetch_add(bytes_in, Ordering::Relaxed); if bytes_in > 0 { entry.0.fetch_add(bytes_in, Ordering::Relaxed); }
entry.1.fetch_add(bytes_out, Ordering::Relaxed); if bytes_out > 0 { entry.1.fetch_add(bytes_out, Ordering::Relaxed); }
} else { } else {
let entry = self.route_pending_tp.entry(route_id.to_string()) let entry = self.route_pending_tp.entry(route_id.to_string())
.or_insert_with(|| (AtomicU64::new(0), AtomicU64::new(0))); .or_insert_with(|| (AtomicU64::new(0), AtomicU64::new(0)));
entry.0.fetch_add(bytes_in, Ordering::Relaxed); if bytes_in > 0 { entry.0.fetch_add(bytes_in, Ordering::Relaxed); }
entry.1.fetch_add(bytes_out, Ordering::Relaxed); if bytes_out > 0 { entry.1.fetch_add(bytes_out, Ordering::Relaxed); }
} }
} }
@@ -302,30 +311,34 @@ impl MetricsCollector {
// This prevents orphaned entries when record_bytes races with // This prevents orphaned entries when record_bytes races with
// connection_closed (which evicts all per-IP data on last close). // connection_closed (which evicts all per-IP data on last close).
if self.ip_connections.contains_key(ip) { if self.ip_connections.contains_key(ip) {
if let Some(counter) = self.ip_bytes_in.get(ip) { if bytes_in > 0 {
counter.fetch_add(bytes_in, Ordering::Relaxed); if let Some(counter) = self.ip_bytes_in.get(ip) {
} else { counter.fetch_add(bytes_in, Ordering::Relaxed);
self.ip_bytes_in.entry(ip.to_string()) } else {
.or_insert_with(|| AtomicU64::new(0)) self.ip_bytes_in.entry(ip.to_string())
.fetch_add(bytes_in, Ordering::Relaxed); .or_insert_with(|| AtomicU64::new(0))
.fetch_add(bytes_in, Ordering::Relaxed);
}
} }
if let Some(counter) = self.ip_bytes_out.get(ip) { if bytes_out > 0 {
counter.fetch_add(bytes_out, Ordering::Relaxed); if let Some(counter) = self.ip_bytes_out.get(ip) {
} else { counter.fetch_add(bytes_out, Ordering::Relaxed);
self.ip_bytes_out.entry(ip.to_string()) } else {
.or_insert_with(|| AtomicU64::new(0)) self.ip_bytes_out.entry(ip.to_string())
.fetch_add(bytes_out, Ordering::Relaxed); .or_insert_with(|| AtomicU64::new(0))
.fetch_add(bytes_out, Ordering::Relaxed);
}
} }
// Accumulate into per-IP pending throughput counters (lock-free) // Accumulate into per-IP pending throughput counters (lock-free)
if let Some(entry) = self.ip_pending_tp.get(ip) { if let Some(entry) = self.ip_pending_tp.get(ip) {
entry.0.fetch_add(bytes_in, Ordering::Relaxed); if bytes_in > 0 { entry.0.fetch_add(bytes_in, Ordering::Relaxed); }
entry.1.fetch_add(bytes_out, Ordering::Relaxed); if bytes_out > 0 { entry.1.fetch_add(bytes_out, Ordering::Relaxed); }
} else { } else {
let entry = self.ip_pending_tp.entry(ip.to_string()) let entry = self.ip_pending_tp.entry(ip.to_string())
.or_insert_with(|| (AtomicU64::new(0), AtomicU64::new(0))); .or_insert_with(|| (AtomicU64::new(0), AtomicU64::new(0)));
entry.0.fetch_add(bytes_in, Ordering::Relaxed); if bytes_in > 0 { entry.0.fetch_add(bytes_in, Ordering::Relaxed); }
entry.1.fetch_add(bytes_out, Ordering::Relaxed); if bytes_out > 0 { entry.1.fetch_add(bytes_out, Ordering::Relaxed); }
} }
} }
} }

View File

@@ -3,6 +3,6 @@
*/ */
export const commitinfo = { export const commitinfo = {
name: '@push.rocks/smartproxy', name: '@push.rocks/smartproxy',
version: '25.11.18', version: '25.11.23',
description: 'A powerful proxy package with unified route-based configuration for high traffic management. Features include SSL/TLS support, flexible routing patterns, WebSocket handling, advanced security options, and automatic ACME certificate management.' description: 'A powerful proxy package with unified route-based configuration for high traffic management. Features include SSL/TLS support, flexible routing patterns, WebSocket handling, advanced security options, and automatic ACME certificate management.'
} }