Skip to content
Merged
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
131 changes: 108 additions & 23 deletions scripts/ci/benchmark-performance.ts
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,7 @@
* Outputs structured JSON with mean, median, p95, p99 per metric.
*/

import { execSync, ExecSyncOptions } from "child_process";
import { execSync, ExecSyncOptions, spawn, ChildProcess } from "child_process";

// ── Configuration ──────────────────────────────────────────────────

Expand Down Expand Up @@ -159,45 +159,130 @@ function benchmarkHttpsLatency(): BenchmarkResult {
return { metric: "squid_https_latency", unit: "ms", values, ...stats(values) };
}

function benchmarkMemory(): BenchmarkResult {
/**
 * Poll `sudo docker ps` at 500ms intervals until every container in
 * `containerNames` reports status=running, rejecting once `timeoutMs`
 * has elapsed.
 *
 * The docker name filter is anchored (`^name$`) and the returned names
 * are additionally compared for exact equality, so containers with
 * similar names (e.g., "awf-squid-old") never count as a match.
 */
async function waitForContainers(containerNames: string[], timeoutMs: number): Promise<void> {
  const startedAt = Date.now();

  // True when docker reports this exact container name as running.
  const isRunning = (name: string): boolean => {
    const reported = execSync(
      `sudo docker ps --filter name=^${name}$ --filter status=running --format '{{.Names}}' 2>/dev/null`,
      { encoding: "utf-8", timeout: 5_000 }
    )
      .trim()
      .split("\n")
      .map((line) => line.trim())
      .filter(Boolean);
    return reported.includes(name);
  };

  for (;;) {
    if (Date.now() - startedAt > timeoutMs) {
      throw new Error(`Containers not running after ${timeoutMs}ms`);
    }
    try {
      if (containerNames.every(isRunning)) {
        return;
      }
    } catch {
      // docker/container not ready yet -- keep polling
    }
    await new Promise<void>((resolve) => setTimeout(resolve, 500));
  }
}

/**
 * Parse a Docker memory usage string (e.g. "123.4MiB / 7.773GiB" from
 * `docker stats --format '{{.MemUsage}}'`) into megabytes (MiB).
 *
 * Only the first quantity in the string is parsed (the usage, not the
 * limit). Recognizes every binary unit docker emits -- B, KiB, MiB,
 * GiB, TiB -- not just the middle three, so tiny ("992B") and huge
 * readings no longer collapse to 0. Returns 0 when no recognizable
 * quantity is present, so a failed `docker stats` call (mapped to
 * "0MiB" by callers) simply contributes nothing to the total.
 */
function parseMb(s: string): number {
  const match = s.match(/([\d.]+)\s*(TiB|GiB|MiB|KiB|B)/i);
  if (!match) return 0;
  const value = parseFloat(match[1]);
  switch (match[2].toLowerCase()) {
    case "tib":
      return value * 1024 * 1024;
    case "gib":
      return value * 1024;
    case "mib":
      return value;
    case "kib":
      return value / 1024;
    default:
      // plain bytes
      return value / (1024 * 1024);
  }
}

/**
* Kill a spawned background process and its entire process group, best-effort.
* Sends SIGTERM then SIGKILL to the process group so descendant processes
* (e.g., sudo, awf, docker) don't survive.
*/
function killBackground(child: ChildProcess): void {
const pid = child.pid;
if (!pid) return;

try {
// SIGTERM the process group to allow graceful shutdown
process.kill(-pid, "SIGTERM");
} catch {
// Process group may have already exited
}

try {
Comment on lines +223 to +230
Copy link

Copilot AI Apr 7, 2026

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

killBackground() sends SIGTERM to the process group but then only SIGKILLs the direct child PID. If the group spawns additional processes that ignore SIGTERM, they can survive. Consider sending SIGKILL to the process group as well (optionally after a short grace period), instead of only killing the child process.

Suggested change
try {
if (child.pid) {
// Kill the process group (negative PID) to catch child processes
process.kill(-child.pid, "SIGTERM");
}
} catch {
// Process may have already exited
}
try {
const pid = child.pid;
if (!pid) {
return;
}
try {
// Kill the process group (negative PID) to catch child processes
process.kill(-pid, "SIGTERM");
} catch {
// Process group may have already exited
}
try {
// Force-kill the entire process group so descendant processes do not survive
process.kill(-pid, "SIGKILL");
} catch {
// Process group may have already exited
}
try {
// Best-effort fallback for the direct child process

Copilot uses AI. Check for mistakes.
// SIGKILL the entire process group to ensure nothing survives
process.kill(-pid, "SIGKILL");
} catch {
// Process group may have already exited
}
}

async function benchmarkMemory(): Promise<BenchmarkResult> {
console.error(" Benchmarking memory footprint...");
const values: number[] = [];

for (let i = 0; i < ITERATIONS; i++) {
cleanup();
// Start containers, measure memory, then stop
let child: ChildProcess | null = null;
try {
// Run a sleep command so containers stay up, then check memory
const output = exec(
`${AWF_CMD} --allow-domains ${ALLOWED_DOMAIN} --log-level error --keep-containers -- ` +
`echo measuring_memory`
// Start awf with a long-running command in the background so containers stay alive.
// Derive spawn args from AWF_CMD to stay consistent with the rest of the script.
const awfParts = AWF_CMD.split(/\s+/);
child = spawn(
awfParts[0],
[...awfParts.slice(1), "--allow-domains", ALLOWED_DOMAIN, "--log-level", "error", "--", "sleep", "30"],
{
Comment on lines +249 to +252
Copy link

Copilot AI Apr 7, 2026

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

This path hard-codes sudo + awf in spawn(...) even though the script already defines AWF_CMD = "sudo awf" and uses it elsewhere. To avoid future drift (e.g., if AWF_CMD changes), consider deriving the spawned command/args from AWF_CMD or otherwise reusing that constant.

Copilot uses AI. Check for mistakes.
detached: true,
stdio: "ignore",
}
);
Copy link

Copilot AI Apr 7, 2026

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Because the child process is spawned with detached: true and stdio: 'ignore', it’s typically a good idea to call child.unref() after spawning. This prevents the parent benchmark script from being kept alive if cleanup/kill logic fails in an edge case.

Suggested change
);
);
child.unref();

Copilot uses AI. Check for mistakes.
// Get memory stats for both containers
// Unref so the parent process won't be kept alive if cleanup fails
child.unref();

// Wait for both containers to be running (up to 30s)
await waitForContainers(["awf-squid", "awf-agent"], 30_000);

// Give containers a moment to stabilize memory usage
await new Promise((resolve) => setTimeout(resolve, 2000));

Comment on lines +260 to +265
Copy link

Copilot AI Apr 7, 2026

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

The benchmark proceeds once containers are merely status=running. Since Squid has a Docker healthcheck (and the agent depends on it), sampling memory before Squid is healthy can make the metric noisy and can mask startup failures/restarts. Consider waiting for Squid to be healthy (e.g., via docker ps --filter health=healthy or docker inspect health status) before taking the memory sample.

Copilot uses AI. Check for mistakes.
// Get memory stats while containers are alive
const squidMem = exec(
"sudo docker stats awf-squid --no-stream --format '{{.MemUsage}}' 2>/dev/null || echo '0MiB'"
);
const agentMem = exec(
"sudo docker stats awf-agent --no-stream --format '{{.MemUsage}}' 2>/dev/null || echo '0MiB'"
);

// Parse memory values (format: "123.4MiB / 7.773GiB")
const parseMb = (s: string): number => {
const match = s.match(/([\d.]+)\s*(MiB|GiB|KiB)/i);
if (!match) return 0;
const val = parseFloat(match[1]);
const unit = match[2].toLowerCase();
if (unit === "gib") return val * 1024;
if (unit === "kib") return val / 1024;
return val;
};

const totalMb = Math.round(parseMb(squidMem) + parseMb(agentMem));
values.push(totalMb);
console.error(` Iteration ${i + 1}/${ITERATIONS}: ${totalMb}MB (squid: ${squidMem}, agent: ${agentMem})`);
} catch {
console.error(` Iteration ${i + 1}/${ITERATIONS}: failed (skipped)`);
} catch (err) {
console.error(` Iteration ${i + 1}/${ITERATIONS}: failed (skipped) - ${err}`);
} finally {
// Always clean up the background process and containers
if (child) {
killBackground(child);
}
cleanup();
}
cleanup();
}

if (values.length === 0) {
Expand Down Expand Up @@ -248,7 +333,7 @@ async function main(): Promise<void> {
results.push(benchmarkWarmStart());
results.push(benchmarkColdStart());
results.push(benchmarkHttpsLatency());
results.push(benchmarkMemory());
results.push(await benchmarkMemory());

// Final cleanup
cleanup();
Expand Down
Loading