Per the Workers Platform Limits docs:
> Each Worker invocation can have up to six connections simultaneously waiting for response headers. ... If a seventh connection is attempted while six are already waiting for headers, it is queued until one of the existing connections receives its response headers.
In production this cap is enforced (six in-flight subrequests). In `wrangler dev` / `workerd` locally, it is not: the Worker can have arbitrarily many in-flight fetches.
Code that relies on the production clamp (or simply uses `Promise.all(array.map(fetch))` for convenience) works fine in prod but misbehaves locally. Depending on the fetch target, this can manifest as:
- The dev server becoming unresponsive to unrelated requests (event-loop / IO starvation).
- Host‑level ephemeral port exhaustion.
- Out‑of‑memory errors as response bodies buffer.
The inverse mismatch is also possible: code tuned to run fast locally exceeds the six-connection cap in prod and hits the "cancel LRU subrequest to make room" behaviour documented in workerd#4471.
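To make the local side of the mismatch concrete, here is a minimal sketch in plain Node, with a hypothetical `mockFetch` standing in for real subrequests, showing why `Promise.all(array.map(fetch))` produces unbounded concurrency when nothing clamps it:

```javascript
// Sketch: without a runtime clamp, Promise.all(urls.map(fetch)) opens every
// request at once. mockFetch is an illustrative stand-in that just records
// how many "requests" are in flight at any moment.
let inFlight = 0;
let maxInFlight = 0;

async function mockFetch(url) {
  inFlight++;
  maxInFlight = Math.max(maxInFlight, inFlight);
  await new Promise((resolve) => setTimeout(resolve, 50)); // pretend network delay
  inFlight--;
  return { ok: true, url };
}

const urls = Array.from({ length: 100 }, (_, i) => `https://example.com/${i}`);
const results = await Promise.all(urls.map((u) => mockFetch(u)));
console.log({ n: results.length, maxInFlightObserved: maxInFlight });
// maxInFlightObserved is 100 here; under the documented prod clamp the
// runtime would hold it at 6.
```

All 100 `mockFetch` calls start synchronously during `map`, before any of them completes, which is exactly the shape of the local `/storm` results below.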
```sh
npm install

# Terminal A: local echo server that reports max concurrent in-flight requests
node echo-server.mjs 9192 1000

# Terminal B:
npx wrangler dev   # listens on localhost:9191

# Terminal C:
curl "http://localhost:9191/storm?n=100"
curl "http://localhost:9191/storm?n=500"
curl "http://localhost:9191/storm?n=2000"
```

Output observed on wrangler 4.84.0 / macOS:
```json
{ "n": 100,  "ok": 100,  "maxInFlightObservedByTarget": 100,  "elapsedMs": 1022 }
{ "n": 500,  "ok": 500,  "maxInFlightObservedByTarget": 500,  "elapsedMs": 1108 }
{ "n": 2000, "ok": 2000, "maxInFlightObservedByTarget": 2000, "elapsedMs": 1454 }
```

The `maxInFlightObservedByTarget` field is the maximum number of concurrent in-flight HTTP requests the target server saw. Deployed to Workers production, this value is 6.
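For reference, a minimal sketch of what an `echo-server.mjs` along these lines could look like (illustrative, not necessarily the exact script used here): a plain Node `http` server that delays each response and reports the highest number of simultaneously open requests it has seen:

```javascript
// Minimal echo server sketch: node echo-server.mjs <port> <delayMs>
// Tracks the peak number of concurrently open requests and echoes it back.
import http from "node:http";

const [port = 9192, delayMs = 1000] = process.argv.slice(2).map(Number);

let inFlight = 0;
let maxInFlight = 0;

const server = http.createServer((req, res) => {
  inFlight++;
  maxInFlight = Math.max(maxInFlight, inFlight);
  setTimeout(() => {
    inFlight--;
    res.setHeader("content-type", "application/json");
    res.end(JSON.stringify({ maxInFlight }));
  }, delayMs);
});

server.listen(port, () =>
  console.log(`echo server on :${port}, delay ${delayMs}ms`)
);
```

Because each response is held open for `delayMs`, a storm of n parallel fetches from the Worker shows up here as n concurrently open requests, which is what the `maxInFlightObservedByTarget` numbers above are measuring.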
Start the echo server with a 30s delay and fire a storm against an external HTTPS target:
```sh
node echo-server.mjs 9192 30000 &
# and/or change the target url in /storm to https://example.com

curl "http://localhost:9191/storm?n=5000&target=https://example.com" &

# while the storm is in-flight, from another terminal:
curl --max-time 5 "http://localhost:9191/probe"
```

Probes against `/probe` (a trivial endpoint) time out for tens of seconds because workerd is saturated handling thousands of TCP/TLS connections. On macOS the host itself can also run out of ephemeral ports, breaking all outbound connections system-wide until workerd is killed.
`wrangler dev` / `workerd` should clamp concurrent outgoing subrequests to the same six that prod enforces, so that:
- Code behaviour locally matches production.
- Accidental fan‑outs don't DoS the dev machine.
Ideally exposed as a `limits.simultaneousConnections` field analogous to the `limits.subrequests` that #11803 added, defaulting to 6 to match prod.
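Until something like that exists in workerd, affected code can clamp itself in userland. The sketch below (the names `withSlot` and `limitedFetch` are mine, not Workers APIs) holds six slots and queues further callers until a slot frees up, roughly mirroring the queuing behaviour the docs describe for prod:

```javascript
// Userland six-slot limiter sketch: at most SIMULTANEOUS_CONNECTIONS calls
// run at once; excess callers wait in FIFO order. On completion, a slot is
// handed directly to the next waiter (no decrement/re-increment race).
const SIMULTANEOUS_CONNECTIONS = 6; // matches the documented prod cap
let active = 0;
const waiters = [];

async function withSlot(fn) {
  if (active >= SIMULTANEOUS_CONNECTIONS) {
    // Queue until a finishing call hands its slot to us.
    await new Promise((resolve) => waiters.push(resolve));
  } else {
    active++;
  }
  try {
    return await fn();
  } finally {
    const next = waiters.shift();
    if (next) next(); // transfer the slot without releasing it
    else active--;
  }
}

const limitedFetch = (url, init) => withSlot(() => fetch(url, init));
```

Swapping `fetch` for `limitedFetch` in fan-out code keeps local behaviour close to prod's clamp, though it obviously cannot reproduce prod's LRU-cancellation semantics from workerd#4471.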
- Closed umbrella issue: #11582 — Enforce (subrequest | service) limits during local dev
- Merged sibling work: #11803 — Add a new `subrequests` limit (addresses total subrequest count, not concurrent in-flight)
- Prod-side semantics discussion: workerd#4471 — Response closed due to connection limit
- wrangler 4.84.0
- macOS 25.2.0 (Darwin, arm64)
- Node 24.1.0