Phase 3: scripts/kb-objects-map.py + audit/objects-map.json + projects/_index.md
Авто-генератор реестра: парсит netbird-inventory + frontmatter каждого проекта, выводит JSON для бота и человекочитаемый index с wiki-ссылками. Пока 16 проектов / 38 orphan-пиров без своих карточек — выявленные дыры станут input для Фазы 4 (stub-генератора). Скрипт идемпотентный, без deps (pure stdlib), запуск: cd ~/knowledge-base && python3 scripts/kb-objects-map.py Парсер обрабатывает offline-таблицу netbird (другой порядок колонок), normalize ye→e уравнивает Знаменское/Znamenskoe. Source of truth — frontmatter каждого проекта; добавление aliases/owner/region там сразу подхватится при следующем run. Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
This commit is contained in:
242
scripts/kb-objects-map.py
Normal file
242
scripts/kb-objects-map.py
Normal file
@@ -0,0 +1,242 @@
|
||||
#!/usr/bin/env python3
|
||||
"""kb-objects-map — собирает машиночитаемый реестр объектов и хостов.
|
||||
|
||||
Источники:
|
||||
projects/dttb/netbird-inventory.md — netbird-пиры (источник правды по железу)
|
||||
projects/<dir>/README.md — frontmatter каждого проекта (aliases, tags, status)
|
||||
projects/<file>.md — singleton-проекты
|
||||
|
||||
Output:
|
||||
audit/objects-map.json — структура для бота / structured-поиска
|
||||
projects/_index.md — человеко-читаемый индекс с wiki-ссылками
|
||||
|
||||
Запускать вручную или cron:
|
||||
cd ~/knowledge-base && python3 scripts/kb-objects-map.py
|
||||
"""
|
||||
from datetime import date, datetime
|
||||
from pathlib import Path
|
||||
import json
|
||||
import re
|
||||
|
||||
VAULT = Path(__file__).resolve().parent.parent
|
||||
INV = VAULT / "projects/dttb/netbird-inventory.md"
|
||||
JSON_OUT = VAULT / "audit/objects-map.json"
|
||||
MD_OUT = VAULT / "projects/_index.md"
|
||||
|
||||
|
||||
def parse_frontmatter(text: str) -> dict:
|
||||
m = re.match(r"^---\n(.+?)\n---\n", text, re.S)
|
||||
if not m:
|
||||
return {}
|
||||
fm = {}
|
||||
for line in m.group(1).splitlines():
|
||||
if ":" not in line or line.startswith("#"):
|
||||
continue
|
||||
k, _, v = line.partition(":")
|
||||
k, v = k.strip(), v.strip()
|
||||
if v.startswith("[") and v.endswith("]"):
|
||||
v = [x.strip().strip("\"'") for x in v[1:-1].split(",") if x.strip()]
|
||||
elif v.startswith('"') and v.endswith('"'):
|
||||
v = v[1:-1]
|
||||
fm[k] = v
|
||||
return fm
|
||||
|
||||
|
||||
ROW_RE = re.compile(
|
||||
r"^\|\s*([^|]+?)\s*\|\s*(\d+\.\d+\.\d+\.\d+)\s*\|\s*([^|]*?)\s*\|\s*([^|]*?)\s*\|\s*([^|]*?)\s*\|"
|
||||
)
|
||||
|
||||
|
||||
def parse_netbird(path: Path) -> list[dict]:
|
||||
"""Парсит online + offline-таблицы netbird-inventory.md."""
|
||||
if not path.exists():
|
||||
return []
|
||||
text = path.read_text()
|
||||
parts = re.split(r"^##\s+(?:Оффлайн|Offline)\b.*$", text, maxsplit=1, flags=re.M)
|
||||
online_text, offline_text = parts[0], parts[1] if len(parts) > 1 else ""
|
||||
|
||||
peers = []
|
||||
for line in online_text.splitlines():
|
||||
m = ROW_RE.match(line)
|
||||
if not m:
|
||||
continue
|
||||
name = m.group(1).strip()
|
||||
if name in ("Имя", "---"):
|
||||
continue
|
||||
peers.append({
|
||||
"name": name, "ip": m.group(2).strip(),
|
||||
"os": m.group(3).strip(), "city": m.group(4).strip(),
|
||||
"version": m.group(5).strip(), "online": True,
|
||||
})
|
||||
# offline-таблица: | Имя | IP | ОС | Последний раз онлайн | Город |
|
||||
for line in offline_text.splitlines():
|
||||
m = ROW_RE.match(line)
|
||||
if not m:
|
||||
continue
|
||||
name = m.group(1).strip()
|
||||
if name in ("Имя", "---"):
|
||||
continue
|
||||
peers.append({
|
||||
"name": name, "ip": m.group(2).strip(),
|
||||
"os": m.group(3).strip(),
|
||||
"last_seen": m.group(4).strip(), "city": m.group(5).strip(),
|
||||
"version": "", "online": False,
|
||||
})
|
||||
return peers
|
||||
|
||||
|
||||
def _norm(s: str) -> str:
|
||||
"""Нормализация для нечёткого сравнения. ye→e уравнивает Знаменское/Znamenskoe."""
|
||||
return (s or "").lower().replace("ye", "e").replace(" ", "").replace("_", "").replace("-", "")
|
||||
|
||||
|
||||
def name_match(peer_name: str, candidates: list[str]) -> bool:
|
||||
pn = _norm(peer_name)
|
||||
if not pn:
|
||||
return False
|
||||
for c in candidates:
|
||||
cn = _norm(c)
|
||||
if cn and (cn in pn or pn in cn):
|
||||
return True
|
||||
return False
|
||||
|
||||
|
||||
def main() -> None:
|
||||
peers = parse_netbird(INV)
|
||||
objects = []
|
||||
seen_files = set()
|
||||
|
||||
project_dirs = sorted(p for p in (VAULT / "projects").iterdir() if p.is_dir())
|
||||
for d in project_dirs:
|
||||
readme = d / "README.md"
|
||||
fm = parse_frontmatter(readme.read_text()) if readme.exists() else {}
|
||||
rel_file = f"projects/{d.name}/README.md" if readme.exists() else None
|
||||
aliases = fm.get("aliases", [])
|
||||
if isinstance(aliases, str):
|
||||
aliases = [aliases]
|
||||
names = sorted({d.name, *aliases})
|
||||
nb = [p for p in peers if name_match(p["name"], names)]
|
||||
objects.append({
|
||||
"id": d.name,
|
||||
"type": "project",
|
||||
"names": names,
|
||||
"netbird_peers": nb,
|
||||
"tags": fm.get("tags", []),
|
||||
"owner": fm.get("owner") or fm.get("client"),
|
||||
"region": fm.get("region"),
|
||||
"status": fm.get("status", "unknown"),
|
||||
"file": rel_file,
|
||||
})
|
||||
if rel_file:
|
||||
seen_files.add(rel_file)
|
||||
|
||||
for f in sorted((VAULT / "projects").glob("*.md")):
|
||||
if f.name == "_index.md":
|
||||
continue
|
||||
rel = f"projects/{f.name}"
|
||||
if rel in seen_files:
|
||||
continue
|
||||
fm = parse_frontmatter(f.read_text())
|
||||
objects.append({
|
||||
"id": f.stem,
|
||||
"type": "project-note",
|
||||
"names": [f.stem],
|
||||
"netbird_peers": [],
|
||||
"tags": fm.get("tags", []),
|
||||
"owner": fm.get("owner"),
|
||||
"region": fm.get("region"),
|
||||
"status": fm.get("status", "unknown"),
|
||||
"file": rel,
|
||||
})
|
||||
|
||||
matched_peer_names = {p["name"] for o in objects for p in o["netbird_peers"]}
|
||||
for p in peers:
|
||||
if p["name"] in matched_peer_names:
|
||||
continue
|
||||
objects.append({
|
||||
"id": p["name"].replace(" ", "_"),
|
||||
"type": "netbird-only",
|
||||
"names": [p["name"]],
|
||||
"netbird_peers": [p],
|
||||
"tags": [],
|
||||
"owner": None,
|
||||
"region": p["city"] or None,
|
||||
"status": "no-project-page",
|
||||
"file": None,
|
||||
})
|
||||
|
||||
JSON_OUT.parent.mkdir(parents=True, exist_ok=True)
|
||||
JSON_OUT.write_text(json.dumps(objects, indent=2, ensure_ascii=False) + "\n")
|
||||
|
||||
today = date.today().isoformat()
|
||||
now = datetime.now().isoformat(timespec="minutes")
|
||||
n_proj = sum(1 for o in objects if o["type"] in ("project", "project-note"))
|
||||
n_with_nb = sum(1 for o in objects if o["type"] == "project" and o["netbird_peers"])
|
||||
n_orphan = sum(1 for o in objects if o["type"] == "netbird-only")
|
||||
|
||||
md = [
|
||||
"---",
|
||||
f"date: {today}",
|
||||
"type: index",
|
||||
"source: scripts/kb-objects-map.py",
|
||||
"tags: [index, registry, objects, netbird]",
|
||||
"---",
|
||||
"",
|
||||
"# Реестр объектов и netbird-пиров",
|
||||
"",
|
||||
f"Авто-сгенерировано `{now}` из [[dttb/netbird-inventory]] + frontmatter в `projects/`.",
|
||||
"**Не править вручную** — перепишется. Источник правды — frontmatter в каждом README.",
|
||||
"",
|
||||
f"- Проектов: **{n_proj}**, из них с netbird-привязкой: **{n_with_nb}**",
|
||||
f"- NetBird-пиров без projects-страницы: **{n_orphan}** (TODO — создать стабы)",
|
||||
"",
|
||||
"## Проекты с netbird-привязкой",
|
||||
"",
|
||||
"| ID | Имена | NetBird IP | OS | Город | Файл | Статус |",
|
||||
"|---|---|---|---|---|---|---|",
|
||||
]
|
||||
for o in sorted(objects, key=lambda x: x["id"]):
|
||||
if o["type"] == "project" and o["netbird_peers"]:
|
||||
nb_ip = ", ".join(p["ip"] for p in o["netbird_peers"])
|
||||
nb_os = ", ".join(sorted({p["os"] for p in o["netbird_peers"] if p["os"]}))
|
||||
nb_city = ", ".join(sorted({p["city"] for p in o["netbird_peers"] if p["city"]}))
|
||||
file_link = f"[[{o['file'][:-3]}]]" if o["file"] else "—"
|
||||
names = ", ".join(o["names"][:5])
|
||||
md.append(f"| {o['id']} | {names} | {nb_ip} | {nb_os} | {nb_city} | {file_link} | {o['status']} |")
|
||||
|
||||
md.extend([
|
||||
"",
|
||||
"## Проекты без netbird-привязки",
|
||||
"",
|
||||
"| ID | Тип | Файл | Статус |",
|
||||
"|---|---|---|---|",
|
||||
])
|
||||
for o in sorted(objects, key=lambda x: x["id"]):
|
||||
if o["type"] in ("project", "project-note") and not o["netbird_peers"]:
|
||||
file_link = f"[[{o['file'][:-3]}]]" if o["file"] else "—"
|
||||
md.append(f"| {o['id']} | {o['type']} | {file_link} | {o['status']} |")
|
||||
|
||||
md.extend([
|
||||
"",
|
||||
"## NetBird-пиры без projects-страницы — TODO",
|
||||
"",
|
||||
"Эти пиры есть в инвентаре, но у них нет своей карточки в `projects/`. Бот не сможет ответить на «найди мне X» — нет файла. Нужно создать стабы (Фаза 4 плана).",
|
||||
"",
|
||||
"| Имя в NetBird | IP | OS | Город | Версия |",
|
||||
"|---|---|---|---|---|",
|
||||
])
|
||||
for o in sorted(objects, key=lambda x: x["id"]):
|
||||
if o["type"] == "netbird-only":
|
||||
p = o["netbird_peers"][0]
|
||||
md.append(f"| `{p['name']}` | {p['ip']} | {p['os']} | {p['city']} | {p['version']} |")
|
||||
|
||||
md.append("")
|
||||
MD_OUT.write_text("\n".join(md))
|
||||
|
||||
print(f"Wrote {JSON_OUT.relative_to(VAULT)} ({len(objects)} entries: "
|
||||
f"{n_proj} projects, {n_orphan} netbird-only)")
|
||||
print(f"Wrote {MD_OUT.relative_to(VAULT)}")
|
||||
|
||||
|
||||
if __name__ == "__main__":
|
||||
main()
|
||||
Reference in New Issue
Block a user