From b46eb8b8daca5af7c92a144d27237c897805669e Mon Sep 17 00:00:00 2001 From: Carol Willing Date: Tue, 23 Jun 2026 18:29:26 -0700 Subject: [PATCH 1/4] Adjust max concurrency and user agent in lychee.toml Adjust lychee CI to reduce errors. --- lychee.toml | 8 +++++--- 1 file changed, 5 insertions(+), 3 deletions(-) diff --git a/lychee.toml b/lychee.toml index b35f38cd..0f6c5f97 100644 --- a/lychee.toml +++ b/lychee.toml @@ -27,7 +27,8 @@ cache_exclude_status = "500.." ############################# Runtime ############################## -max_concurrency = 14 +# Reduce concurrency since lychee can check 500+ links in 1 minute with 1 worker +max_concurrency = 1 max_redirects = 10 max_retries = 2 # Wait longer between retries to give slow servers room to recover. @@ -37,8 +38,9 @@ timeout = 45 ############################# Requests ############################# -# Some sites block lychee's default UA. Use a generic browser-ish UA. -user_agent = "Mozilla/5.0 (compatible; lychee-link-checker)" +# Some sites block lychee's default user agent (curl). Use a generic browser. +user_agent = "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36" + # Accept 200–403 as success. 401/403 are common on bot-protected or # auth-walled pages we still want to consider "reachable". From 8cd25546ab26858b8355aa5a69a08f9c0a60bd23 Mon Sep 17 00:00:00 2001 From: Carol Willing Date: Tue, 23 Jun 2026 18:36:18 -0700 Subject: [PATCH 2/4] Add exclusion for neonscience.org in lychee.toml --- lychee.toml | 1 + 1 file changed, 1 insertion(+) diff --git a/lychee.toml b/lychee.toml index 0f6c5f97..ad8f4b4c 100644 --- a/lychee.toml +++ b/lychee.toml @@ -61,6 +61,7 @@ include_verbatim = false # Regex excludes. Plain-domain skips belong in .lycheeignore. exclude = [ + 'https://(www\.)?neonscience\.org/.*', 'zenodo\.org', # Self-references to the deployed site lag the build, producing false # 404s for new pages. 
Internal links are validated via relative paths. From dc756f2ff4460869f9c5f6223ca681a2b902ced5 Mon Sep 17 00:00:00 2001 From: Carol Willing Date: Tue, 23 Jun 2026 18:41:05 -0700 Subject: [PATCH 3/4] Enable link checking for pyopensci.org URLs Comment out the pyopensci.org exclude pattern in lychee.toml so that self-referencing links are checked. --- lychee.toml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/lychee.toml b/lychee.toml index ad8f4b4c..49fa0e12 100644 --- a/lychee.toml +++ b/lychee.toml @@ -65,5 +65,6 @@ exclude = [ 'zenodo\.org', # Self-references to the deployed site lag the build, producing false # 404s for new pages. Internal links are validated via relative paths. - '^https?://(www\.)?pyopensci\.org/', + # Note: testing if we can check internal link now that we are using hugo + #'^https?://(www\.)?pyopensci\.org/', ] From f7e391d4c9087c742d095dea0c07943edf884f19 Mon Sep 17 00:00:00 2001 From: Carol Willing Date: Tue, 23 Jun 2026 18:45:25 -0700 Subject: [PATCH 4/4] Clean up exclude list in lychee.toml Remove commented-out self-reference exclusion for validation. --- lychee.toml | 4 ---- 1 file changed, 4 deletions(-) diff --git a/lychee.toml b/lychee.toml index 49fa0e12..0b66dfef 100644 --- a/lychee.toml +++ b/lychee.toml @@ -63,8 +63,4 @@ include_verbatim = false exclude = [ 'https://(www\.)?neonscience\.org/.*', 'zenodo\.org', - # Self-references to the deployed site lag the build, producing false - # 404s for new pages. Internal links are validated via relative paths. - # Note: testing if we can check internal link now that we are using hugo - #'^https?://(www\.)?pyopensci\.org/', ]