Miscellaneous fixes for documentation
Including renaming some functions for clarity.
melissawm committed Dec 17, 2023
1 parent c19ee22 commit 6e9269f
Showing 5 changed files with 71 additions and 44 deletions.
17 changes: 9 additions & 8 deletions Readme.md
Original file line number Diff line number Diff line change
@@ -284,12 +284,12 @@ collection of many papyrus scrolls.
## Legacy (MISC/OLD) documentation (Inaccurate):
#### generation (papyri gen ),
#### Generation (`papyri gen`)
Which collect the documentation of a project into a doc-bundle; a number of
doc-blobs (currently json file), with a defined semantic structure, and
Collects the documentation of a project into a DocBundle -- a number of
DocBlobs (currently json files), with a defined semantic structure, and
some metadata (version of the project this documentation refers to, and
potentially some other blobs)
potentially some other blobs).
During the generation a number of normalisation and inference steps can and
should happen, for example
@@ -312,11 +312,12 @@ pandas as pd`, for example,)
#### Ingestion (papyri ingest)
The ingestion step take doc-bundle and/or doc-blobs and add them into a graph of
known items; the ingestion is critical to efficiently build the collection graph
metadata and understand which items refers to which; this allow the following:
The ingestion step takes a DocBundle and/or DocBlobs and adds them into a graph
of known items; the ingestion is critical to efficiently build the collection
graph metadata and understand which items refer to which. This allows the
following:
- Update the list of backreferences to a docbundle
- Update the list of backreferences to a DocBundle
- Update forward references metadata to know whether links are valid.
Currently the ingestion loads everything in memory and updates all the bundles in place
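The back/forward-reference bookkeeping described above can be sketched as a toy model (not papyri's actual data structures; all names here are hypothetical):

```python
from collections import defaultdict

def ingest(known_items, bundle):
    """Toy ingestion: register a bundle's blobs, then rebuild link metadata."""
    # Register every item this bundle documents.
    for name, blob in bundle["blobs"].items():
        known_items[name] = blob

    # Backreferences: if A links to B, record A as a backreference of B.
    backrefs = defaultdict(set)
    for name, blob in bundle["blobs"].items():
        for target in blob.get("links", []):
            backrefs[target].add(name)

    # Forward references: a link is valid only if its target is a known item.
    link_valid = {
        name: {t: t in known_items for t in blob.get("links", [])}
        for name, blob in bundle["blobs"].items()
    }
    return backrefs, link_valid

known = {}
bundle = {"blobs": {
    "numpy.mean": {"links": ["numpy.average"]},
    "numpy.average": {"links": ["numpy.mean", "numpy.does_not_exist"]},
}}
backrefs, link_valid = ingest(known, bundle)
```

A link to an item outside the known graph simply shows up as invalid forward-reference metadata, mirroring the "know whether links are valid" bullet above.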
1 change: 1 addition & 0 deletions examples/numpy.toml
@@ -35,6 +35,7 @@ execute_exclude_patterns = [
'numpy.lib.npyio._read',
'numpy.polynomial._polybase:ABCPolyBase',
'numpy.distutils.misc_util:Configuration.__init__',
'numpy.ma.core:MaskedArray.resize', # First line of docstring is a directive; breaks parsing
]

submodules = [
8 changes: 4 additions & 4 deletions papyri/__init__.py
@@ -246,7 +246,7 @@ def ingest(
dummy_progress: bool = typer.Option(False, help="Disable rich progress bar"),
):
"""
Given paths to a docbundle folder, ingest it into the known libraries.
Given paths to a DocBundle folder, ingest it into the known libraries.
Parameters
----------
@@ -280,7 +280,7 @@ def install(
relink: bool = False,
):
"""
WIP, download and install a remote docbundle
WIP. Download and install a remote DocBundle
"""

from io import BytesIO
@@ -296,7 +296,7 @@ def install(

async def get(name, version, results, progress):
"""
Utility to download a single docbundle and
Utility to download a single DocBundle and
put it into result.
"""
@@ -333,7 +333,7 @@ async def get(name, version, results, progress):

async def trio_main():
"""
Main trio routine to download docbundles concurently.
Main trio routine to download DocBundles concurrently.
"""
results = {}
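papyri uses trio for this concurrent download; the same pattern can be sketched with stdlib asyncio (a stand-in download coroutine, all names hypothetical):

```python
import asyncio

async def get(name, version, results):
    # Stand-in for the real network download of one DocBundle.
    await asyncio.sleep(0)
    results[(name, version)] = f"bundle:{name}-{version}"

async def main():
    results = {}
    wanted = [("numpy", "1.26"), ("scipy", "1.11")]
    # Download all bundles concurrently, each task writing into results.
    await asyncio.gather(*(get(n, v, results) for n, v in wanted))
    return results

results = asyncio.run(main())
```

The shared `results` dict mirrors the `results` mapping that `trio_main` hands to each `get` task.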
85 changes: 55 additions & 30 deletions papyri/gen.py
@@ -457,7 +457,7 @@ def load_configuration(
root = info.pop("module")
return root, info, conf.get("meta", {})
else:
sys.exit(f"{conffile!r} does not exists.")
sys.exit(f"{conffile!r} does not exist.")


def gen_main(
@@ -477,9 +477,9 @@ def gen_main(
limit_to: List[str],
) -> None:
"""
Main entry point to generate docbundle files,
Main entry point to generate DocBundle files.
This will take care of reading single configuration file with the option
This will take care of reading a single configuration file with the options
for the library you want to build the docs for, scrape API, narrative and
examples, and put it into a doc bundle for later consumption.
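The configuration handling visible in `load_configuration` above (`info.pop("module")`, `conf.get("meta", {})`) can be sketched on an already-parsed config dict; the keys below are borrowed from examples/numpy.toml, the rest is hypothetical:

```python
# Hypothetical, already-parsed configuration (the real files are TOML;
# see examples/numpy.toml for the actual set of options).
conf = {
    "numpy": {
        "module": "numpy",
        "execute_exclude_patterns": ["numpy.ma.core:MaskedArray.resize"],
        "submodules": ["fft", "linalg"],
    },
    "meta": {"origin": "hypothetical"},
}

info = dict(conf["numpy"])
root = info.pop("module")      # the library whose docs we generate
meta = conf.get("meta", {})    # optional extra project metadata
```

Everything left in `info` after popping `module` is per-library options for the scrape.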
@@ -779,11 +779,14 @@ def values(self):

class DocBlob(Node):
"""
An object containing information about the documentation of an arbitrary object.
An object containing information about the documentation of an arbitrary
object.
Instead of DocBlob being a NumpyDocString, I'm thinking of them having a
NumpyDocString. This helps with arbitrary documents (module, examples files)
that cannot be parsed by Numpydoc, as well as links to external references,
like images generated.
Instead of docblob begin a NumpyDocString, I'm thinking of them having a numpydocstring.
This helps with arbitraty documents (module, examples files) that cannot be parsed by Numpydoc,
as well as link to external references, like images generated.
"""

__slots__ = (
@@ -918,12 +921,10 @@ def _numpy_data_to_section(data: List[Tuple[str, str, List[str]]], title: str, q

class APIObjectInfo:
"""
Info about an API object
This object can be many things:
Describes the object's type and other relevant information
Module, Class, method, function.
This object can be many things, such as a Module, Class, method, function.
I'll see how I handle that later.
"""

kind: str
@@ -1063,7 +1064,7 @@ def _normalize_see_also(see_also: Section, qa: str):

class Gen:
"""
Core class to generate docbundles for a given library.
Core class to generate a DocBundle for a given library.
This is responsible for finding all objects, extracting the doc, parsing it,
and saving that into the right folder.
@@ -1142,9 +1143,9 @@ def get_example_data(
"""Extract example section data from a NumpyDocString
One of the sections in numpydoc is "examples", which usually consists of a number
if paragraph, interleaved with examples starting with >>> and ...,
of paragraphs, interleaved with examples starting with >>> and ...,
This attempt to parse this into structured data, with text, input and output
This attempts to parse this into structured data, with text, input and output
as well as to infer the types of each token in the input examples.
This is currently relatively limited as the inference does not work across
@@ -1385,7 +1386,6 @@ def collect_narrative_docs(self):
blbs = {}
with self.progress() as p2:
task = p2.add_task("Parsing narative", total=len(files))

for p in files:
p2.update(task, description=compress_user(str(p)).ljust(7))
p2.advance(task)
@@ -1455,7 +1455,7 @@ def write_examples(self, where: Path) -> None:

def write_api(self, where: Path):
"""
write the API section of the docbundles.
Write the API section of the DocBundle.
"""
(where / "module").mkdir(exist_ok=True)
for k, v in self.data.items():
@@ -1466,7 +1466,7 @@ def partial_write(self, where):

def write(self, where: Path):
"""
Write a docbundle folder.
Write a DocBundle folder.
"""
self.write_api(where)
self.write_narrative(where)
@@ -1495,14 +1495,21 @@ def put_raw(self, path: str, data: bytes):
self.bdata[path] = data

def _transform_1(self, blob: DocBlob, ndoc) -> DocBlob:
"""
Populates DocBlob content field from numpydoc parsed docstring.
"""
for k, v in ndoc._parsed_data.items():
blob.content[k] = v
for k, v in blob.content.items():
assert isinstance(v, (str, list, dict)), type(v)
return blob

def _transform_2(self, blob: DocBlob, target_item, qa: str) -> DocBlob:
# try to find relative path WRT site package.
"""
Try to find relative path WRT site package and populate item_file field
for DocBlob.
"""
# will not work for dev install. Maybe an option to set the root location ?
item_file: Optional[str] = find_file(target_item)
if item_file is not None and item_file.endswith("<string>"):
@@ -1546,6 +1553,10 @@ def _transform_2(self, blob: DocBlob, target_item, qa: str) -> DocBlob:
return blob

def _transform_3(self, blob, target_item):
"""
Try to find source line number for target object and populate item_line
field for DocBlob.
"""
item_line = None
try:
item_line = inspect.getsourcelines(target_item)[1]
@@ -1595,13 +1606,13 @@ def prepare_doc_for_one_object(
aliases : sequence
other aliases for the current object.
api_object : APIObjectInfo
<Multiline Description Here>
Describes the object's type and other relevant information
Returns
-------
Tuple of two items,
ndoc:
DocBundle with info for current object.
blob:
DocBlob with info for current object.
figs:
dict mapping figure names to figure data.
@@ -1908,17 +1919,32 @@ def collect_examples_out(self):
for name, data in figs:
self.put_raw(name, data)

def helper_1(
def extract_docstring(
self, *, qa: str, target_item: Any
) -> Tuple[Optional[str], List[Section], APIObjectInfo]:
"""
Extract docstring from an object.
Detects whether an object includes a docstring and parses the object's
type.
Parameters
----------
qa : str
fully qualified name of the object we are extracting the
documentation from .
Fully qualified name of the object we are extracting the
documentation from.
target_item : Any
Can be any kind of object
Object we wish to inspect. Can be any kind of object.
Returns
-------
item_docstring : str
The unprocessed object's docstring
sections : list of Section
A list of serialized sections of the docstring
api_object : APIObjectInfo
Describes the object's type and other relevant information
"""
item_docstring: str = target_item.__doc__
if item_docstring is not None:
@@ -1999,12 +2025,12 @@ def collect_package_metadata(self, root, relative_dir, meta):

def collect_api_docs(self, root: str, limit_to: List[str]) -> None:
"""
Crawl one module and stores resulting docbundle in self.store.
Crawl one module and store the resulting DocBundle in json files.
Parameters
----------
root : str
module name to generate docbundle for.
Module name to generate DocBundle for.
limit_to : list of string
For partial documentation building and testing purposes
we may want to generate documentation for only a single item.
@@ -2072,7 +2098,7 @@ def collect_api_docs(self, root: str, limit_to: List[str]) -> None:
self.log.debug("treating %r", qa)

with error_collector(qa=qa) as ecollector:
item_docstring, arbitrary, api_object = self.helper_1(
item_docstring, arbitrary, api_object = self.extract_docstring(
qa=qa,
target_item=target_item,
)
@@ -2097,7 +2123,7 @@ def collect_api_docs(self, root: str, limit_to: List[str]) -> None:
ndoc = NumpyDocString(dedent_but_first("No Docstrings"))
else:
ndoc = NumpyDocString(dedent_but_first(item_docstring))
# note currentlu in ndoc we use:
# note currently in ndoc we use:
# _parsed_data
# direct access to ["See Also"], and [""]
# and :
@@ -2228,7 +2254,6 @@ def collect_api_docs(self, root: str, limit_to: List[str]) -> None:
"The following parsing failed \n%s",
json.dumps(failure_collection, indent=2, sort_keys=True),
)

self._meta.update(
{
"aliases": aliases,
4 changes: 2 additions & 2 deletions papyri/tree.py
@@ -549,8 +549,8 @@ def _autosummary_handler(self, argument, options: dict, content):
def _math_handler(self, argument, options, content):
if argument and content:
log.info(
"For consistency please use the math directive"
" with all the equation in the content of the directive in %r",
"For consistency, please use the math directive"
" with all the equations in the content of the directive in %r",
self.qa,
)
content = argument + content
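The warning above is about the two ways of writing the reST `math` directive; a sketch of the form it discourages versus the one it asks for (illustrative equations only):

```rst
Discouraged: equation split between the directive argument and its body

.. math:: a^2 +

   b^2 = c^2

Preferred: all equations in the directive body

.. math::

   a^2 + b^2 = c^2
```

When both argument and content are present, the handler simply concatenates them before parsing, which is why the consistent form is preferred.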