Restructure links extracts to keep original links #1055

Merged Sep 5, 2022 · 5 commits

Changes from 1 commit:
Use spec-mode for annotate-links post processing

As suggested in #1055 (comment)

dontcallmedom committed Sep 5, 2022 · commit 6565feb05144cecae400eff00cd67156f4b88b98
src/lib/specs-crawler.js (2 changes: 1 addition & 1 deletion)

@@ -294,7 +294,7 @@ async function saveSpecResults(spec, settings) {
 async function crawlList(speclist, crawlOptions) {
   // Make a shallow copy of crawl options object since we're going
   // to modify properties in place
-  crawlOptions = Object.assign({}, crawlOptions);
+  crawlOptions = Object.assign({speclist}, crawlOptions);
Member (reviewer) commented:
We've never been very clean on separating inputs and outputs. Unless I missed a copy somewhere, we directly store the results of the crawl within the spec objects in speclist, at least temporarily while the results get saved to disk. This means speclist may also contain a few expanded crawl results (or all of them when useCrawl is set or when the user does not specify an output folder), up to >50MB of data.

Here, we're asking Puppeteer to send the list to a separate Chrome process, so Puppeteer will need to serialize/deserialize the list each time. That works, but it seems like a waste of processing time and memory.

I think we should rather make a deeper copy here and create a new list of spec objects that only contain core metadata about each spec (and that won't be touched by the crawl). That would still send >500KB of data, but that should be fine.
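
Concretely, the suggested copy could look something like this — a sketch only, since the exact set of properties to keep is an assumption based on the link-matching code in the diff further down:

```js
// Sketch of the suggested "core metadata" copy — an assumption about which
// properties the link-matching logic needs (shortname, series, release and
// nightly URLs and page lists). The copy is never touched by the crawl, so
// it stays small when Puppeteer serializes it for the Chrome process.
const lightList = speclist.map(s => ({
  shortname: s.shortname,
  series: s.series,
  release: s.release ? { url: s.release.url, pages: s.release.pages } : null,
  nightly: s.nightly ? { url: s.nightly.url, pages: s.nightly.pages } : null
}));
crawlOptions = Object.assign({speclist: lightList}, crawlOptions);
```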

I can live with it, but it could perhaps be argued that the extraction code should remain atomic, in the sense that its results should only depend on information about the spec and on the spec's contents (extraction code is not the easiest bit to debug since it runs in a headless Chrome instance, so better to keep the logic simple). An alternative would be to split the extraction of links into two parts (see the sketch after the list):

  1. The extraction of the raw links in Chrome through extract-links.mjs without attempting to link them back to specs.
  2. A post-processing module that associates extracted links with specs and runs in the Node.js process. Post-processing is a good place to run logic that needs to look at other specs.
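
A minimal sketch of what step 1 might look like — illustrative only, since the real extract-links.mjs is not shown in this PR excerpt; step 2 corresponds to the reworked annotate-links.js module in the diff further down:

```js
// extract-links.mjs — hypothetical sketch of step 1. Runs in the page
// context under Puppeteer and only gathers raw links, keyed by
// fragment-less URL; matching links to specs is deferred to the Node.js
// post-processing step, which can see the full spec list.
export default function extractLinks() {
  const links = {};
  for (const a of document.querySelectorAll('a[href]')) {
    const url = new URL(a.href);
    url.hash = '';   // drop the fragment so per-anchor links collapse
    links[url.toString()] = links[url.toString()] || {};
  }
  return links;
}
```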

Member Author (dontcallmedom) replied:
That approach makes more sense indeed; I've updated the PR to that effect.


   // Expand list of processing modules to use if not already done
   crawlOptions.modules = expandBrowserModules(crawlOptions.modules);
src/postprocessing/annotate-links.js (43 changes: 14 additions & 29 deletions)

@@ -22,37 +22,22 @@ const needsSaving = {};

 module.exports = {
   dependsOn: ['links'],
-  input: 'crawl',
+  input: 'spec',
   property: 'links',
 
-  run: function(crawl, options) {
-    crawl.results.forEach(s => {
-      for (let link of Object.keys(s.links || {})) {
-        // Annotate with the spec to which the page belong if we can find one
-        const specUrl = canonicalizeUrl(link);
-        let matchingSpec = crawl.results.find(s => s?.release?.url === specUrl || s?.nightly?.url === specUrl || (s?.series?.currentSpecification === s?.shortname && (s?.series?.nightlyUrl === specUrl || s?.series?.releaseUrl === specUrl)) || s?.nightly?.pages?.includes(specUrl) || s?.release?.pages?.includes(specUrl));
-        if (matchingSpec) {
-          needsSaving[s.shortname] = true;
-          s.links[link].specShortname = matchingSpec.shortname;
-        }
-      }
-    });
-    return crawl;
-  },
-
-  save: async function({results}, options) {
-    return Promise.all(Object.values(results).map(async spec => {
-      const contents = {
-        spec: {
-          title: spec.title,
-          url: spec.crawled
-        },
-        links: spec.links
-      };
-      const json = JSON.stringify(contents, null, 2);
-      const folder = path.join(options.output, "links");
-      const filename = path.join(folder, `${spec.shortname}.json`);
-      return await fs.promises.writeFile(filename, json);
-    }));
+  run: function(spec, {speclist}) {
+    if (!speclist || !speclist.length) {
+      console.error("No spec list passed as input, cannot annotate links in post-processing");
+      return spec;
+    }
+    for (let link of Object.keys(spec.links || {})) {
+      // Annotate with the spec to which the page belong if we can find one
+      const specUrl = canonicalizeUrl(link);
+      let matchingSpec = speclist.find(s => s?.release?.url === specUrl || s?.nightly?.url === specUrl || (s?.series?.currentSpecification === s?.shortname && (s?.series?.nightlyUrl === specUrl || s?.series?.releaseUrl === specUrl)) || s?.nightly?.pages?.includes(specUrl) || s?.release?.pages?.includes(specUrl));
+      if (matchingSpec) {
+        spec.links[link].specShortname = matchingSpec.shortname;
+      }
+    }
+    return spec;
   }
 };
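
For context, a hedged sketch of how the two post-processing modes differ from the caller's side — the actual runner API is not part of this diff, so the function and variable names below are assumptions:

```js
// Illustrative only — not reffy's actual runner. With input: 'spec', the
// post-processor runs once per crawled spec; with input: 'crawl' (the old
// behavior), it runs once over the whole crawl result.
const annotateLinks = require('./postprocessing/annotate-links');

function runPostProcessing(crawlResults, crawlOptions) {
  if (annotateLinks.input === 'spec') {
    // crawlOptions now carries the speclist set in specs-crawler.js above
    for (const spec of crawlResults) {
      annotateLinks.run(spec, crawlOptions);
    }
  }
  else {
    annotateLinks.run({ results: crawlResults }, crawlOptions);
  }
  return crawlResults;
}
```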