mirror of
https://github.com/openclaw/openclaw.git
synced 2026-03-18 21:40:53 +00:00
154 lines
3.5 KiB
Bash
Executable File
154 lines
3.5 KiB
Bash
Executable File
#!/usr/bin/env bash
|
|
# Scan for orphaned coding agent processes after a gateway restart.
|
|
#
|
|
# Background coding agents (Claude Code, Codex CLI) spawned by the gateway
|
|
# can outlive the session that started them when the gateway restarts.
|
|
# This script finds them and reports their state.
|
|
#
|
|
# Usage:
|
|
# recover-orphaned-processes.sh
|
|
#
|
|
# Output: JSON object with `orphaned` array and `ts` timestamp.
|
|
set -euo pipefail
|
|
|
|
usage() {
|
|
cat <<'USAGE'
|
|
Usage: recover-orphaned-processes.sh
|
|
|
|
Scans for likely orphaned coding agent processes and prints JSON.
|
|
USAGE
|
|
}
|
|
|
|
if [ "${1:-}" = "--help" ] || [ "${1:-}" = "-h" ]; then
|
|
usage
|
|
exit 0
|
|
fi
|
|
|
|
if [ "$#" -gt 0 ]; then
|
|
usage >&2
|
|
exit 2
|
|
fi
|
|
|
|
if ! command -v node &>/dev/null; then
|
|
echo '{"error":"node not found on PATH","orphaned":[],"ts":"'"$(date -u +%Y-%m-%dT%H:%M:%SZ)"'"}'
|
|
exit 0
|
|
fi
|
|
|
|
node <<'NODE'
|
|
const { execFileSync } = require("node:child_process");
|
|
const fs = require("node:fs");
|
|
|
|
let username = process.env.USER || process.env.LOGNAME || "";
|
|
|
|
if (username && !/^[a-zA-Z0-9._-]+$/.test(username)) {
|
|
username = "";
|
|
}
|
|
|
|
function runFile(file, args) {
|
|
try {
|
|
return execFileSync(file, args, {
|
|
encoding: "utf8",
|
|
stdio: ["ignore", "pipe", "ignore"],
|
|
});
|
|
} catch (err) {
|
|
if (err && typeof err.stdout === "string") {
|
|
return err.stdout;
|
|
}
|
|
if (err && err.stdout && Buffer.isBuffer(err.stdout)) {
|
|
return err.stdout.toString("utf8");
|
|
}
|
|
return "";
|
|
}
|
|
}
|
|
|
|
function resolveStarted(pid) {
|
|
const started = runFile("ps", ["-o", "lstart=", "-p", String(pid)]).trim();
|
|
return started.length > 0 ? started : "unknown";
|
|
}
|
|
|
|
function resolveCwd(pid) {
|
|
if (process.platform === "linux") {
|
|
try {
|
|
return fs.readlinkSync(`/proc/${pid}/cwd`);
|
|
} catch {
|
|
return "unknown";
|
|
}
|
|
}
|
|
const lsof = runFile("lsof", ["-a", "-d", "cwd", "-p", String(pid), "-Fn"]);
|
|
const match = lsof.match(/^n(.+)$/m);
|
|
return match ? match[1] : "unknown";
|
|
}
|
|
|
|
// Pre-filter candidate PIDs using pgrep to avoid scanning all processes.
|
|
// Falls back to a user-scoped ps scan if pgrep is unavailable.
|
|
const candidatePids = runFile(
|
|
"pgrep",
|
|
username.length > 0
|
|
? ["-u", username, "-f", "codex|claude"]
|
|
: ["-f", "codex|claude"],
|
|
)
|
|
.split("\n")
|
|
.map((s) => s.trim())
|
|
.filter((s) => s.length > 0 && /^\d+$/.test(s));
|
|
|
|
let lines;
|
|
if (candidatePids.length > 0) {
|
|
// Fetch command info only for candidate PIDs.
|
|
lines = runFile("ps", ["-o", "pid=,command=", "-p", candidatePids.join(",")]).split(
|
|
"\n",
|
|
);
|
|
} else if (username.length > 0) {
|
|
lines = runFile("ps", ["-U", username, "-o", "pid=,command="]).split("\n");
|
|
} else {
|
|
lines = runFile("ps", ["-axo", "pid=,command="]).split("\n");
|
|
}
|
|
|
|
const includePattern = /codex|claude/i;
|
|
|
|
const excludePatterns = [
|
|
/openclaw-gateway/i,
|
|
/signal-cli/i,
|
|
/node_modules\/\.bin\/openclaw/i,
|
|
/recover-orphaned-processes\.sh/i,
|
|
];
|
|
|
|
const orphaned = [];
|
|
|
|
for (const rawLine of lines) {
|
|
const line = rawLine.trim();
|
|
if (!line) {
|
|
continue;
|
|
}
|
|
const match = line.match(/^(\d+)\s+(.+)$/);
|
|
if (!match) {
|
|
continue;
|
|
}
|
|
|
|
const pid = Number(match[1]);
|
|
const cmd = match[2];
|
|
if (!Number.isInteger(pid) || pid <= 0 || pid === process.pid) {
|
|
continue;
|
|
}
|
|
if (!includePattern.test(cmd)) {
|
|
continue;
|
|
}
|
|
if (excludePatterns.some((pattern) => pattern.test(cmd))) {
|
|
continue;
|
|
}
|
|
|
|
orphaned.push({
|
|
pid,
|
|
cmd,
|
|
cwd: resolveCwd(pid),
|
|
started: resolveStarted(pid),
|
|
});
|
|
}
|
|
|
|
process.stdout.write(
|
|
JSON.stringify({
|
|
orphaned,
|
|
ts: new Date().toISOString(),
|
|
}) + "\n",
|
|
);
|
|
NODE
|