From 2065cef4c41a83af39020e9015f5e87d34d9572c Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Fran=C3=A7ois=20Daoust?= Date: Wed, 9 Nov 2022 12:12:39 +0100 Subject: [PATCH] Prevent duplicates in dfns extracts (#1110) This makes the dfns extraction code skip over a re-defined term (same linking text, same type, same namespace), and report a warning when a duplicate dfn is encountered and skipped. Warnings are easily glossed over but we don't really have a better mechanism in place right now to report issues found during extractions. Apart from making the whole extraction fail that is, which seems overkill. Fixes https://github.com/w3c/webref/issues/783 --- src/browserlib/extract-dfns.mjs | 24 +++++++++++++++++++++++- tests/extract-dfns.js | 4 ++++ 2 files changed, 27 insertions(+), 1 deletion(-) diff --git a/src/browserlib/extract-dfns.mjs b/src/browserlib/extract-dfns.mjs index dcb20f44..167690c4 100644 --- a/src/browserlib/extract-dfns.mjs +++ b/src/browserlib/extract-dfns.mjs @@ -24,6 +24,13 @@ import {parse} from "../../node_modules/webidl2/index.js"; * "prose" (last one indicates that definition appears in the main body of * the spec) * + * The extraction ignores definitions with an unknown type. A warning is issued + * to the console when that happens. + * + * The extraction uses the first definition it finds when it bumps into a term + * that is defined more than once (same "linkingText", same "type", same "for"). + * A warning is issued to the console when that happens. + * * @function * @public * @return {Array(Object)} An Array of definitions @@ -99,6 +106,20 @@ function hasValidType(el) { return isValid; } +// Return true when definition is not already defined in the list, +// Return false and issue a warning when it is already defined. +function isNotAlreadyDefined(dfn, idx, list) { + const first = list.find(d => d === dfn || + (d.type === dfn.type && + d.linkingText.length === dfn.linkingText.length && + d.linkingText.every(lt => dfn.linkingText.find(t => t == lt)) && + d.for.length === dfn.for.length && + d.for.every(lt => dfn.for.find(t => t === lt)))); + if (first !== dfn) { + console.warn('[reffy]', `Duplicate dfn found for "${dfn.linkingText[0]}", type="${dfn.type}", for="${dfn.for[0]}"`); + } + return first === dfn; +} function definitionMapper(el, idToHeading) { let definedIn = 'prose'; @@ -237,7 +258,8 @@ export default function (spec, idToHeading = {}) { const link = node.querySelector('a[href^="http"]'); return !link || (node.textContent.trim() !== link.textContent.trim()); }) - .map(node => definitionMapper(node, idToHeading)); + .map(node => definitionMapper(node, idToHeading)) + .filter(isNotAlreadyDefined); } function preProcessEcmascript() { diff --git a/tests/extract-dfns.js b/tests/extract-dfns.js index 62eee508..062c9f1d 100644 --- a/tests/extract-dfns.js +++ b/tests/extract-dfns.js @@ -152,6 +152,10 @@ const tests = [ html: "Foo", changesToBaseDfn: [] }, + {title: "ignores dfns already defined", + html: "Foo. Foo is already defined.", + changesToBaseDfn: [{}] + }, {title: "automatically fixes internal slots dfns with an invalid 'idl' data-dfn-type", html: "Foo", changesToBaseDfn: [{type: "attribute", access: "public"}]