From 74aab8a42c479cdeeda9371dbd591a19d070c48e Mon Sep 17 00:00:00 2001 From: Daniele Nicolodi Date: Sat, 11 Jan 2025 17:13:14 +0100 Subject: docs: Add a test to validate URLs in markdown/Users.md Avoid piling up dead URLs. --- docs/validatelinks.py | 42 ++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 42 insertions(+) create mode 100644 docs/validatelinks.py (limited to 'docs/validatelinks.py') diff --git a/docs/validatelinks.py b/docs/validatelinks.py new file mode 100644 index 000000000..69544ab0e --- /dev/null +++ b/docs/validatelinks.py @@ -0,0 +1,42 @@ +#!/usr/bin/env python3 + +# SPDX-License-Identifier: Apache-2.0 +# Copyright 2025 The Meson development team + +import sys +import re +import aiohttp +import asyncio + +LINK = re.compile(r'\[(?P[A-Za-z0-9 ]+)\]\((?P.*?)\)') + + +async def fetch(session, name, url, timeout): + try: + async with session.get(url, timeout=timeout) as r: + if not r.ok: + return (name, url, r.status) + except Exception as e: + return (name, url, str(e)) + + +async def main(filename): + with open(filename) as f: + text = f.read() + timeout = aiohttp.ClientTimeout(total=60) + async with aiohttp.ClientSession() as session: + tasks = [] + for link in LINK.finditer(text): + name, url = link.groups() + task = asyncio.ensure_future(fetch(session, name, url, timeout)) + tasks.append(task) + responses = asyncio.gather(*tasks) + errors = [r for r in await responses if r is not None] + for name, url, result in errors: + print(f'"{name}" {url} {result}') + if errors: + sys.exit(1) + + +if __name__ == '__main__': + asyncio.run(main(sys.argv[1])) -- cgit v1.2.3