Commit 1f146a9

Refactor the Linker and ParsedTypeDocstring (#874)
* Make the linker always output link tags only, never <code> tags. The <code> tags
  are now added by the HTML translator when the document is a docstring; otherwise
  it does not add the enclosing <code> tags, because we're already in the middle of
  a code tag or a similar <span class="rst-literal">.
* Fix #723 and #581.
* Fix a duplicate warning issue in the Attributes section's references.
Parent: 8e4c9bd

26 files changed (+696, -480 lines)

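To make the first point concrete: after this commit the linker produces only the link itself, and the HTML translator decides whether to wrap it in <code>. A minimal sketch of that division of labour, with hypothetical names standing in for pydoctor's actual linker and translator classes:

    from __future__ import annotations
    from xml.sax.saxutils import escape

    def link_xref(label: str, url: str | None) -> str:
        # The linker emits only the link, never an enclosing <code> tag.
        if url is None:
            return escape(label)
        return f'<a href="{url}">{escape(label)}</a>'

    def render_xref(label: str, url: str | None, source: str) -> str:
        # The HTML translator wraps the link in <code> only when the document
        # is a docstring; inside colorized code or a <span class="rst-literal">
        # we are already in a code context, so wrapping again would nest tags.
        link = link_xref(label, url)
        return f'<code>{link}</code>' if source == 'docstring' else link
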
README.rst

Lines changed: 3 additions & 0 deletions
@@ -73,6 +73,9 @@ What's New?
 in development
 ^^^^^^^^^^^^^^
 
+* Fix bug that would result in duplicated "Cannot find link target" warnings when the
+  types under a docstring *Attributes* section failed to resolve.
+
 pydoctor 25.4.0
 ^^^^^^^^^^^^^^^
 

docs/google_demo/__init__.py

Lines changed: 1 addition & 1 deletion
@@ -55,7 +55,7 @@ def function_with_types_in_docstring(param1, param2):
 
     Args:
         param1 (int): The first parameter.
-        param2 (str): The second parameter.
+        param2 (str, {"html", "json", "xml"}, optional): The second parameter.
 
     Returns:
         bool: The return value. True for success, False otherwise.

docs/numpy_demo/__init__.py

Lines changed: 1 addition & 1 deletion
@@ -73,7 +73,7 @@ def function_with_types_in_docstring(param1, param2):
     ----------
     param1 : int
         The first parameter.
-    param2 : str
+    param2 : str : {"html", "json", "xml"}, optional
        The second parameter.
 
     Returns

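Both demo tweaks exercise richer type syntax: a literal choice set plus the optional keyword. Roughly, pydoctor's type parser splits such a spec into tokens and renders each kind differently (literals like string constants, control words in italics, names as candidate links). The sketch below is a simplified classification written for this page, not the real tokenizer from pydoctor.napoleon.docstring:

    import re

    # Simplified tokenizer in the spirit of pydoctor's type parser;
    # the real Tokenizer handles many more edge cases.
    TOKEN_RE = re.compile(r'(\{[^}]*\}|"[^"]*"|,\s*|\s+|[^,\s]+)')

    def classify(token: str) -> str:
        if token in ('optional', 'default'):
            return 'CONTROL'    # rendered in italics
        if token.startswith(('{', '"')):
            return 'LITERAL'    # rendered like a string constant
        if not token.strip() or token.strip() in (',', ':'):
            return 'DELIMITER'  # kept as plain text
        return 'OBJ'            # candidate for a cross-reference link

    spec = 'str : {"html", "json", "xml"}, optional'
    print([(tok, classify(tok)) for tok in TOKEN_RE.findall(spec)])
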
docs/tests/test.py

Lines changed: 0 additions & 1 deletion
@@ -195,7 +195,6 @@ def test_search(query:str, expected:List[str], order_is_important:bool=True) ->
 to_stan_results = [
     'pydoctor.epydoc.markup.ParsedDocstring.to_stan',
     'pydoctor.epydoc.markup.plaintext.ParsedPlaintextDocstring.to_stan',
-    'pydoctor.epydoc.markup._types.ParsedTypeDocstring.to_stan',
     'pydoctor.epydoc.markup._pyval_repr.ColorizedPyvalRepr.to_stan',
 ]
 test_search('to_stan*', to_stan_results, order_is_important=False)

pydoctor/epydoc/docutils.py

Lines changed: 11 additions & 4 deletions
@@ -3,7 +3,10 @@
 """
 from __future__ import annotations
 
-from typing import Iterable, Iterator, Optional, TypeVar, cast
+from typing import Iterable, Iterator, Optional, TypeVar, cast, TYPE_CHECKING
+
+if TYPE_CHECKING:
+    from typing import Literal
 
 import optparse
 
@@ -14,11 +17,11 @@
 
 _DEFAULT_DOCUTILS_SETTINGS: Optional[optparse.Values] = None
 
-def new_document(source_path: str, settings: Optional[optparse.Values] = None) -> nodes.document:
+def new_document(source: Literal['docstring', 'code'], settings: Optional[optparse.Values] = None) -> nodes.document:
     """
     Create a new L{nodes.document} using the provided settings or cached default settings.
 
-    @returns: L{nodes.document}
+    @returns: L{nodes.document} with a C{source} attribute that matches the provided source.
     """
     global _DEFAULT_DOCUTILS_SETTINGS
     # If we have docutils >= 0.19 we use get_default_settings to calculate and cache
@@ -29,7 +32,7 @@ def new_document(source_path: str, settings: Optional[optparse.Values] = None) -> nodes.document:
 
         settings = _DEFAULT_DOCUTILS_SETTINGS
 
-    return utils.new_document(source_path, settings)
+    return utils.new_document(source, settings)
 
 def _set_nodes_parent(nodes: Iterable[nodes.Node], parent: nodes.Element) -> Iterator[nodes.Node]:
     """
@@ -145,7 +148,11 @@ def get_first_parent_lineno(_node: nodes.Element | None) -> int:
        return line
 
    if node.line:
+        # If the line is explicitly set, assume it's zero-based.
        line = node.line
+        # If docutils suddenly starts populating the line attribute for
+        # title_reference nodes, all RST xref warnings will be off by 1 :/
+
    else:
        line = get_first_parent_lineno(node.parent)
 

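A short usage sketch of the new signature; the assertions rely on docutils storing the first argument as the document's source attribute, which is what the updated @returns docstring promises:

    from pydoctor.epydoc.docutils import new_document

    # A document built from docstring markup:
    docstring_doc = new_document('docstring')
    # A document built from colorized source values or annotations:
    code_doc = new_document('code')

    # Downstream renderers can branch on the origin of the tree, e.g. to
    # decide whether a link still needs an enclosing <code> tag.
    assert docstring_doc['source'] == 'docstring'
    assert code_doc['source'] == 'code'
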
pydoctor/epydoc/markup/__init__.py

Lines changed: 7 additions & 7 deletions
@@ -88,7 +88,7 @@ def get_supported_docformats() -> Iterator[str]:
 
 def get_parser_by_name(docformat: str, objclass: ObjClass | None = None) -> ParserFunction:
     """
-    Get the C{parse_docstring(str, List[ParseError], bool) -> ParsedDocstring} function based on a parser name.
+    Get the C{parse_docstring(str, List[ParseError]) -> ParsedDocstring} function based on a parser name.
 
     @raises ImportError: If the parser could not be imported, probably meaning that your are missing a dependency
         or it could be that the docformat name do not match any know L{pydoctor.epydoc.markup} submodules.
@@ -113,7 +113,7 @@ def _processtypes(doc: 'ParsedDocstring', errs: List['ParseError']) -> None:
     for field in doc.fields:
         if field.tag() in ParsedTypeDocstring.FIELDS:
             body = ParsedTypeDocstring(field.body().to_node(), lineno=field.lineno)
-            append_warnings(body.warnings, errs, lineno=field.lineno+1)
+            append_warnings(body.warnings, errs, lineno=field.lineno)
             field.replace_body(body)
 
 def parse_and_processtypes(doc:str, errs:List['ParseError']) -> 'ParsedDocstring':
@@ -149,8 +149,8 @@ def __init__(self, fields: Sequence['Field']):
         """
         self._stan: Optional[Tag] = None
 
-    @property
-    @abc.abstractmethod
+    @property
+    @abc.abstractmethod
     def has_body(self) -> bool:
         """
         Does this docstring have a non-empty body?
@@ -168,7 +168,7 @@ def get_toc(self, depth: int) -> Optional['ParsedDocstring']:
         except NotImplementedError:
             return None
         contents = build_table_of_content(document, depth=depth)
-        docstring_toc = new_document('toc')
+        docstring_toc = new_document('docstring')
         if contents:
             docstring_toc.extend(contents)
         return ParsedRstDocstring(docstring_toc, ())
@@ -228,7 +228,7 @@ def get_summary(self) -> 'ParsedDocstring':
 
 def parsed_text(text: str,
                 klass: str | None = None,
-                source: str = 'docstring') -> ParsedDocstring:
+                source: Literal['docstring', 'code'] = 'docstring') -> ParsedDocstring:
     """
     Create a parsed representation of a simple text
     with a given class (or no class at all).
@@ -455,7 +455,7 @@ def visit_paragraph(self, node: nodes.paragraph) -> None:
             self.other_docs = True
             raise nodes.StopTraversal()
 
-        summary_doc = new_document('summary')
+        summary_doc = new_document('docstring')
         summary_pieces: list[nodes.Node] = []
 
         # Extract the first sentences from the first paragraph until maximum number

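The append_warnings change is the line-number half of the fix: Field.lineno is 0-based while docutils lines are 1-based, and the +1 shift now happens in exactly one place, when ParsedTypeDocstring attaches the tokens to the docutils tree (see _types.py below). A tiny illustration of the convention, under that reading of the diff:

    # Hypothetical type field on the 42nd line of a docstring:
    field_lineno = 41                    # Field.lineno is 0-based
    docutils_lineno = field_lineno + 1   # node.line in the docutils tree is 1-based

    # Warnings are now reported against the unshifted value, because the
    # tree itself carries the +1; shifting in both places skewed the
    # reported line numbers.
    # append_warnings(body.warnings, errs, lineno=field.lineno)
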
pydoctor/epydoc/markup/_pyval_repr.py

Lines changed: 1 addition & 1 deletion
@@ -339,7 +339,7 @@ def colorize(self, pyval: Any) -> ColorizedPyvalRepr:
             is_complete = True
 
         # Put it all together.
-        document = new_document('pyval_repr')
+        document = new_document('code')
         # This ensure the .parent and .document attributes of the child nodes are set correcly.
         set_node_attributes(document, children=[set_node_attributes(node, document=document) for node in state.result])
         return ColorizedPyvalRepr(document, is_complete, state.warnings)

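Colorized value representations are themselves code, so their document is now created as new_document('code') and the HTML translator will not wrap their cross-references in another <code> tag. A hedged usage sketch (the constructor arguments mirror how pydoctor's test suite builds a PyvalColorizer; treat the exact signature as an assumption):

    from pydoctor.epydoc.markup._pyval_repr import PyvalColorizer

    colorizer = PyvalColorizer(linelen=80, maxlines=5)
    parsed = colorizer.colorize(['html', 'json', 'xml'])
    # The underlying docutils document is tagged as code:
    print(parsed.to_node()['source'])   # expected: 'code'
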
pydoctor/epydoc/markup/_types.py

Lines changed: 84 additions & 126 deletions
@@ -5,66 +5,35 @@
 """
 from __future__ import annotations
 
-from typing import Any, Callable, Dict, List, Tuple, Union, cast
+from typing import Callable, Dict
 
-from pydoctor.epydoc.markup import DocstringLinker, ParseError, ParsedDocstring, get_parser_by_name
-from pydoctor.node2stan import node2stan
-from pydoctor.napoleon.docstring import TokenType, TypeDocstring
+from pydoctor.epydoc.markup import ParsedDocstring
+from pydoctor.epydoc.markup._pyval_repr import PyvalColorizer
+from pydoctor.napoleon.docstring import TokenType, ITokenizer, Tokenizer
+from pydoctor.epydoc.docutils import new_document, set_node_attributes, code
 
 from docutils import nodes
-from twisted.web.template import Tag, tags
 
-class ParsedTypeDocstring(TypeDocstring, ParsedDocstring):
+class NodeTokenizer(ITokenizer[nodes.document]):
     """
-    Add L{ParsedDocstring} interface on top of L{TypeDocstring} and
-    allow to parse types from L{nodes.Node} objects, providing the C{--process-types} option.
+    A type tokenizer for annotation as docutils L{document <nodes.document>}.
     """
 
-    FIELDS = ('type', 'rtype', 'ytype', 'returntype', 'yieldtype')
+    def __init__(self, annotation: nodes.document, *,
+                 warns_on_unknown_tokens: bool) -> None:
+        # build tokens and warnings
+        self.warnings = warnings = []  # type: list[str]
+        raw_tokens = Tokenizer.recombine_sets(self.tokenize_document(annotation, warnings))
+        self.tokens = Tokenizer.build(raw_tokens, warnings, warns_on_unknown_tokens)
 
-    # yes this overrides the superclass type!
-    _tokens: list[tuple[str | nodes.Node, TokenType]]  # type: ignore
-
-    def __init__(self, annotation: Union[nodes.document, str],
-                 warns_on_unknown_tokens: bool = False, lineno: int = 0) -> None:
-        ParsedDocstring.__init__(self, ())
-        if isinstance(annotation, nodes.document):
-            TypeDocstring.__init__(self, '', warns_on_unknown_tokens)
-
-            _tokens = self._tokenize_node_type_spec(annotation)
-            self._tokens = cast('list[tuple[str | nodes.Node, TokenType]]',
-                                self._build_tokens(_tokens))
-            self._trigger_warnings()
-        else:
-            TypeDocstring.__init__(self, annotation, warns_on_unknown_tokens)
-
-
-        # We need to store the line number because we need to pass it to DocstringLinker.link_xref
-        self._lineno = lineno
-
-    @property
-    def has_body(self) -> bool:
-        return len(self._tokens)>0
-
-    def to_node(self) -> nodes.document:
-        """
-        Not implemented at this time :/
-        """
-        #TODO: Fix this soon - PR https://github.com/twisted/pydoctor/pull/874
-        raise NotImplementedError()
-
-    def to_stan(self, docstring_linker: DocstringLinker) -> Tag:
-        """
-        Present the type as a stan tree.
-        """
-        return self._convert_type_spec_to_stan(docstring_linker)
-
-    def _tokenize_node_type_spec(self, spec: nodes.document) -> List[Union[str, nodes.Node]]:
+    @staticmethod
+    def tokenize_document(spec: nodes.document, warnings: list[str]) -> list[str | nodes.Node]:
        def _warn_not_supported(n:nodes.Node) -> None:
-            self.warnings.append(f"Unexpected element in type specification field: element '{n.__class__.__name__}'. "
-                                 "This value should only contain text or inline markup.")
+            warnings.append("Unexpected element in type specification field: "
+                            f"element '{n.__class__.__name__}'. This value should "
+                            "only contain text or inline markup.")
 
-        tokens: List[Union[str, nodes.Node]] = []
+        tokens: list[str | nodes.Node] = []
         # Determine if the content is nested inside a paragraph
         # this is generally the case, except for consolidated fields generate documents.
         if spec.children and isinstance(spec.children[0], nodes.paragraph):
@@ -77,99 +46,88 @@ def _warn_not_supported(n:nodes.Node) -> None:
         for child in children:
             if isinstance(child, nodes.Text):
                 # Tokenize the Text node with the same method TypeDocstring uses.
-                tokens.extend(TypeDocstring._tokenize_type_spec(child.astext()))
+                tokens.extend(Tokenizer.tokenize_str(child.astext()))
             elif isinstance(child, nodes.Inline):
                 tokens.append(child)
             else:
                 _warn_not_supported(child)
 
         return tokens
 
-    def _convert_obj_tokens_to_stan(self, tokens: List[Tuple[Any, TokenType]],
-                                    docstring_linker: DocstringLinker) -> list[tuple[Any, TokenType]]:
-        """
-        Convert L{TokenType.OBJ} and PEP 484 like L{TokenType.DELIMITER} type to stan, merge them together. Leave the rest untouched.
 
-        @param tokens: List of tuples: C{(token, type)}
-        """
+class ParsedTypeDocstring(ParsedDocstring):
+    """
+    Add L{ParsedDocstring} interface on top of L{TypeDocstring} and
+    allow to parse types from L{nodes.Node} objects,
+    providing the C{--process-types} option.
+    """
 
-        combined_tokens: list[tuple[Any, TokenType]] = []
-
-        open_parenthesis = 0
-        open_square_braces = 0
-
-        for _token, _type in tokens:
-            # The actual type of_token is str | Tag | Node.
-
-            if (_type is TokenType.DELIMITER and _token in ('[', '(', ')', ']')) \
-               or _type is TokenType.OBJ:
-                if _token == "[": open_square_braces += 1
-                elif _token == "(": open_parenthesis += 1
-
-                if _type is TokenType.OBJ:
-                    _token = docstring_linker.link_xref(
-                        _token, _token, self._lineno)
-
-                if open_square_braces + open_parenthesis > 0:
-                    try: last_processed_token = combined_tokens[-1]
-                    except IndexError:
-                        combined_tokens.append((_token, _type))
-                    else:
-                        if last_processed_token[1] is TokenType.OBJ \
-                           and isinstance(last_processed_token[0], Tag):
-                            # Merge with last Tag
-                            if _type is TokenType.OBJ:
-                                assert isinstance(_token, Tag)
-                                last_processed_token[0](*_token.children)
-                            else:
-                                last_processed_token[0](_token)
-                        else:
-                            combined_tokens.append((_token, _type))
-                else:
-                    combined_tokens.append((_token, _type))
-
-                if _token == "]": open_square_braces -= 1
-                elif _token == ")": open_parenthesis -= 1
+    FIELDS = ('type', 'rtype', 'ytype', 'returntype', 'yieldtype')
 
-            else:
-                # the token will be processed in _convert_type_spec_to_stan() method.
-                combined_tokens.append((_token, _type))
+    def __init__(self, annotation: nodes.document,
+                 warns_on_unknown_tokens: bool = False,
+                 lineno: int = 0) -> None:
+        super().__init__(fields=())
+
+        tokenizer = NodeTokenizer(annotation,
+                                  warns_on_unknown_tokens=warns_on_unknown_tokens)
+        self._tokens = tokenizer.tokens
+        self.warnings = tokenizer.warnings
+        self._lineno = lineno
+        self._document = self._parse_tokens()
+
+    @property
+    def has_body(self) -> bool:
+        return len(self._tokens)>0
 
-        return combined_tokens
+    def to_node(self) -> nodes.document:
+        return self._document
+
+    _converters: Dict[TokenType, Callable[[str, int], nodes.Node]] = {
+        TokenType.LITERAL: lambda _token, _: nodes.inline(
+            # we're re-using the STRING_TAG css
+            # class for the whole literal token, it's the
+            # best approximation we have for now.
+            _token, _token, classes=[PyvalColorizer.STRING_TAG]),
+        TokenType.CONTROL: lambda _token, _: nodes.emphasis(_token, _token),
+        TokenType.OBJ: lambda _token, lineno: set_node_attributes(
+            nodes.title_reference(_token, _token), lineno=lineno),
+    }
 
-    def _convert_type_spec_to_stan(self, docstring_linker: DocstringLinker) -> Tag:
+    def _parse_tokens(self) -> nodes.document:
         """
-        Convert type to L{Tag} object.
+        Convert type to docutils document object.
         """
 
-        tokens = self._convert_obj_tokens_to_stan(self._tokens, docstring_linker)
-
-        warnings: List[ParseError] = []
-
-        converters: Dict[TokenType, Callable[[Union[str, Tag]], Union[str, Tag]]] = {
-            TokenType.LITERAL: lambda _token: tags.span(_token, class_="literal"),
-            TokenType.CONTROL: lambda _token: tags.em(_token),
-            # We don't use safe_to_stan() here, if these converter functions raise an exception,
-            # the whole type docstring will be rendered as plaintext.
-            # it does not crash on invalid xml entities
-            TokenType.REFERENCE: lambda _token: get_parser_by_name('restructuredtext')(_token, warnings).to_stan(docstring_linker) if isinstance(_token, str) else _token,
-            TokenType.UNKNOWN: lambda _token: get_parser_by_name('restructuredtext')(_token, warnings).to_stan(docstring_linker) if isinstance(_token, str) else _token,
-            TokenType.OBJ: lambda _token: _token,  # These convertions (OBJ and DELIMITER) are done in _convert_obj_tokens_to_stan().
-            TokenType.DELIMITER: lambda _token: _token,
-            TokenType.ANY: lambda _token: _token,
-        }
+        document = new_document('code')
 
-        for w in warnings:
-            self.warnings.append(w.descr())
+        converters = self._converters
+        lineno = self._lineno
 
-        converted = Tag('')
+        elements: list[nodes.Node] = []
+        default = lambda _token, _: nodes.Text(_token)
 
-        for token, type_ in tokens:
+        for _tok in self._tokens:
+            token, type_ = _tok.value, _tok.type
             assert token is not None
-            if isinstance(token, nodes.Node):
-                token = node2stan(token, docstring_linker)
-            assert isinstance(token, (str, Tag))
-            converted_token = converters[type_](token)
-            converted(converted_token)
+            converted_token: nodes.Node
+
+            if type_ is TokenType.ANY:
+                assert isinstance(token, nodes.Node)
+                converted_token = token
+            else:
+                assert isinstance(token, str)
+                converted_token = converters.get(type_, default)(token, lineno)
+
+            elements.append(set_node_attributes(converted_token,
+                                                document=document))
+
+        return set_node_attributes(document, children=[
+            set_node_attributes(code('', ''),
+                                children=elements,
+                                document=document,
+                                lineno=lineno+1)])
+            # the +1 here is coping with the fact that
+            # Field.lineno is 0-based but the docutils tree
            # is supposed to be 1-based
 
-        return converted

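Putting the refactored pieces together, here is a sketch of how a type field flows through the new code path, mirroring what _processtypes() does for the fields listed in FIELDS (the sample type string is made up for illustration):

    from pydoctor.epydoc.markup import get_parser_by_name
    from pydoctor.epydoc.markup._types import ParsedTypeDocstring

    errors = []  # collects ParseError instances
    # Parse the raw field body first, as the docstring parser would:
    parse = get_parser_by_name('restructuredtext')
    parsed = parse('list of `Stream`, optional', errors)

    # Re-interpret the resulting docutils tree as a type expression:
    typ = ParsedTypeDocstring(parsed.to_node(), lineno=7)
    print(typ.has_body)   # True
    print(typ.warnings)   # tokenizer warnings, reported once by the caller
    doc = typ.to_node()   # a document wrapping a single code element whose
                          # children are inline/emphasis/title_reference nodes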