From 1771bb9874dbbb2ca79c3b3fd0cf23dab80661ca Mon Sep 17 00:00:00 2001 From: Francois Daoust Date: Fri, 17 Jan 2025 11:13:27 +0100 Subject: [PATCH] Move dupl detection logic to CDDL marker That's a more natural place to put the logic and it simplifies things a bit as well (no need to deal with additional linking texts). --- bikeshed/cddl.py | 194 ++++++++++++++++++++------------------ tests/cddl003.console.txt | 2 +- tests/cddl005.html | 4 +- 3 files changed, 105 insertions(+), 95 deletions(-) diff --git a/bikeshed/cddl.py b/bikeshed/cddl.py index 9286387e67..a702856462 100644 --- a/bikeshed/cddl.py +++ b/bikeshed/cddl.py @@ -14,9 +14,39 @@ class CDDLMarker(cddlparser.ast.Marker): so that cross-referencing logic may take place. """ - currentRule: cddlparser.ast.Rule + # Keep pointers on the current rule context to track generic parameters + # that are scoped to it + currentRule: cddlparser.ast.Rule | None currentParameters: list[str] + # List of all CDDL terms defined so far to track and report duplicates + defined: list + + def __init__(self) -> None: + self.currentRule = None + self.currentParameters = [] + self.defined = [] + + def _recordDefinition(self, type: str, name: str, dfnFor: str | None = None) -> bool: + for term in self.defined: + if term["type"] == type and term["name"] == name and term["dfnFor"] == dfnFor: + forText = "" if dfnFor is None else f' defined in type "{dfnFor}"' + m.die( + f"CDDL {type} {name}{forText} creates a duplicate and cannot be referenced.\nPlease create additional CDDL types to disambiguate.", + ) + return False + if type != "parameter": + for term in self.defined: + if term["type"] != "parameter" and term["name"] == name and term["dfnFor"] == dfnFor: + forText = "" if dfnFor is None else f' defined in type "{dfnFor}"' + m.warn( + f"CDDL {type} {name}{forText} creates a duplicate with a CDDL {term['type']}.\nLink type needs to be specified to reference the term.\nConsider creating additional CDDL types to disambiguate.", + ) + break + term = {"type": type, "name": name, "dfnFor": dfnFor} + self.defined.append(term) + return True + def serializeValue(self, prefix: str, value: str, suffix: str, node: cddlparser.ast.Value) -> str: name = prefix + value + suffix if node.type not in {"text", "bytes"}: @@ -32,7 +62,7 @@ def serializeValue(self, prefix: str, value: str, suffix: str, node: cddlparser. if forName is None: # Cannot easily link member key back to a definition return name - else: + elif self._recordDefinition("key", value, forName): # Create a key with and without quotes as linking text lts = [value, name] return '{}'.format( @@ -40,6 +70,9 @@ def serializeValue(self, prefix: str, value: str, suffix: str, node: cddlparser. h.escapeAttr("|".join(lts)), name, ) + else: + # Duplicate found, don't create a dfn + return name elif isinstance(parent, cddlparser.ast.Operator) and parent.controller == node: # Probably a ".default" value. It may be possible to link the value # back to an enumeration but it's equally possible that this is just @@ -49,13 +82,16 @@ def serializeValue(self, prefix: str, value: str, suffix: str, node: cddlparser. forName = self._getFor(node) if forName is None: return name - else: + elif self._recordDefinition("value", value, forName): lts = [value, name] return '{}'.format( h.escapeAttr(forName), h.escapeAttr("|".join(lts)), name, ) + else: + # Duplicate found, don't create a dfn + return name def serializeName(self, name: str, node: cddlparser.ast.CDDLNode) -> str: # The node is a Typename. Such a node may appear in a Rule, a Type, @@ -73,8 +109,11 @@ def serializeName(self, name: str, node: cddlparser.ast.CDDLNode) -> str: if parent.assign.type in {cddlparser.Tokens.TCHOICEALT, cddlparser.Tokens.GCHOICEALT}: # The definition extends a base definition return '{}'.format(name) - else: + elif self._recordDefinition("type", name): return '{}'.format(h.escapeAttr(name), name) + else: + # Duplicate found, don't create a dfn + return name elif isinstance(parent, cddlparser.ast.Memberkey): # Member definition if not parent.hasColon: @@ -95,25 +134,34 @@ def serializeName(self, name: str, node: cddlparser.ast.CDDLNode) -> str: lts = [name[1:-1], name] else: lts = [name, '"' + name + '"'] - return '{}'.format( - h.escapeAttr(forName), - h.escapeAttr("|".join(lts)), - name, - ) + if self._recordDefinition("key", lts[0], forName): + return '{}'.format( + h.escapeAttr(forName), + h.escapeAttr("|".join(lts)), + name, + ) + else: + # Duplicate found, don't create a dfn + return name elif isinstance(parent, cddlparser.ast.GenericParameters): typename = parent.parentNode assert isinstance(typename, cddlparser.ast.Typename) - return '{}'.format( - h.escapeAttr(typename.name), - h.escapeAttr(name), - name, - ) + if self._recordDefinition("parameter", name, typename.name): + return '{}'.format( + h.escapeAttr(typename.name), + h.escapeAttr(name), + name, + ) + else: + # Duplicate found, don't create a dfn + return name elif name in get_args(cddlparser.ast.PreludeType): # Do not link types that come from the CDDL prelude # defined in RFC 8610 return name elif name in self.currentParameters: # Name is a reference to a generic parameter + assert self.currentRule is not None return '{}'.format( h.escapeAttr(self.currentRule.name.name), name, @@ -170,39 +218,6 @@ def markupCDDLBlock(pre: t.ElementT, doc: t.SpecT) -> set[t.ElementT]: """ localDfns = set() - # A CDDL definition may create duplicates, e.g. argh = [ "dupl", "dupl" ] - # To detect these duplicates, let's maintain a list of actual definitions - # contained in CDDL blocks. - cddlDfns = set() - - def recordDfns(el: t.ElementT) -> bool: - cddlType = "cddl-" + (el.get("data-cddl-type") or "") - for cddlText in (el.get("data-lt") or "").split("|"): - linkFors = t.cast("list[str|None]", config.splitForValues(el.get("data-cddl-for", ""))) or [None] - for linkFor in linkFors: - dfnText = cddlType + ">" + (linkFor or "") + "/" + cddlText - if dfnText in cddlDfns: - forText = "" if linkFor is None else f' defined in type "{linkFor}"' - m.die( - f"CDDL {cddlType[5:]} {cddlText}{forText} creates a duplicate and cannot be referenced.\nPlease create additional CDDL types to disambiguate.", - ) - return False - cddlDfns.add(dfnText) - if cddlType != "cddl-parameter": - warned = False - for cddlText in (el.get("data-lt") or "").split("|"): - linkFors = t.cast("list[str|None]", config.splitForValues(el.get("data-cddl-for", ""))) or [None] - for linkFor in linkFors: - dfnText = (linkFor or "") + "/" + cddlText - if dfnText in cddlDfns and not warned: - warned = True - forText = "" if linkFor is None else f' defined in type "{linkFor}"' - m.warn( - f"CDDL {cddlType[5:]} {cddlText}{forText} creates a duplicate with another CDDL definition.\nLink type needs to be specified to reference the term.\nConsider creating additional CDDL types to disambiguate.", - ) - cddlDfns.add(dfnText) - return True - for el in h.findAll("cddl", pre): # Prefix CDDL types with "cddl-" to avoid confusion with other # types (notably CSS ones such as "value") @@ -211,54 +226,49 @@ def recordDfns(el: t.ElementT) -> bool: url = None ref = None cddlText = None - # Record the dfns that the term would create and check whether - # it creates a duplicate. If it does, let's not link the term. - if not recordDfns(el): - el.tag = "span" - else: - for cddlText in (el.get("data-lt") or "").split("|"): - linkFors = t.cast("list[str|None]", config.splitForValues(el.get("data-cddl-for", ""))) or [None] - for linkFor in linkFors: - ref = doc.refs.getRef( - cddlType, - cddlText, - linkFor=linkFor, - status="local", - el=el, - error=True, - ) - if ref: - url = ref.url - break + for cddlText in (el.get("data-lt") or "").split("|"): + linkFors = t.cast("list[str|None]", config.splitForValues(el.get("data-cddl-for", ""))) or [None] + for linkFor in linkFors: + ref = doc.refs.getRef( + cddlType, + cddlText, + linkFor=linkFor, + status="local", + el=el, + error=True, + ) if ref: + url = ref.url break - if url is None: - el.tag = "dfn" - el.set("data-dfn-type", cddlType) - del el.attrib["data-cddl-type"] - if el.get("data-cddl-for"): - el.set("data-dfn-for", el.get("data-cddl-for") or "") - del el.attrib["data-cddl-for"] - else: - # Copy over the auto-generated linking text to the manual dfn. - dfn = h.find(url, doc) - # How in the hell does this work, the url is not a selector??? - assert dfn is not None - lts = combineCDDLLinkingTexts(el.get("data-lt"), dfn.get("data-lt")) - dfn.set("data-lt", lts) - localDfns.add(dfn) + if ref: + break + if url is None: + el.tag = "dfn" + el.set("data-dfn-type", cddlType) + del el.attrib["data-cddl-type"] + if el.get("data-cddl-for"): + el.set("data-dfn-for", el.get("data-cddl-for") or "") + del el.attrib["data-cddl-for"] + else: + # Copy over the auto-generated linking text to the manual dfn. + dfn = h.find(url, doc) + # How in the hell does this work, the url is not a selector??? + assert dfn is not None + lts = combineCDDLLinkingTexts(el.get("data-lt"), dfn.get("data-lt")) + dfn.set("data-lt", lts) + localDfns.add(dfn) - # Reset the element to be a link to the manual dfn. - el.tag = "a" - el.set("data-link-type", cddlType) - el.set("data-lt", cddlText) - del el.attrib["data-cddl-type"] - if el.get("data-cddl-for"): - el.set("data-link-for", el.get("data-cddl-for") or "") - del el.attrib["data-cddl-for"] - if el.get("id"): - # ID was defensively added by the Marker. - del el.attrib["id"] + # Reset the element to be a link to the manual dfn. + el.tag = "a" + el.set("data-link-type", cddlType) + el.set("data-lt", cddlText) + del el.attrib["data-cddl-type"] + if el.get("data-cddl-for"): + el.set("data-link-for", el.get("data-cddl-for") or "") + del el.attrib["data-cddl-for"] + if el.get("id"): + # ID was defensively added by the Marker. + del el.attrib["id"] return localDfns diff --git a/tests/cddl003.console.txt b/tests/cddl003.console.txt index e3dbb21d4f..264ea70a02 100644 --- a/tests/cddl003.console.txt +++ b/tests/cddl003.console.txt @@ -1,4 +1,4 @@ -WARNING: CDDL value dupl defined in type "warn" creates a duplicate with another CDDL definition. +WARNING: CDDL value dupl defined in type "warn" creates a duplicate with a CDDL key. Link type needs to be specified to reference the term. Consider creating additional CDDL types to disambiguate. LINE 94: No 'cddl' refs found for '"unique"'. diff --git a/tests/cddl005.html b/tests/cddl005.html index 44e4d8aa60..6e5c31091b 100644 --- a/tests/cddl005.html +++ b/tests/cddl005.html @@ -602,7 +602,7 @@

Table of Contents

1. The CDDL

-
error = [ "dupl", "dupl" ]
+
error = [ "dupl", "dupl" ]
 

The error type defines the "dupl" value twice. Bikeshed dies with an error message, because there is no way to disambiguate the values. If user forces generation, no dfn is created for the second value.

@@ -615,7 +615,7 @@

error, in § 1

CDDL Index

-
error = [ "dupl", "dupl" ]
+
error = [ "dupl", "dupl" ]