# Copyright 2023 The Bazel Authors. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Render a serialized Stardoc `ModuleInfo` proto as MyST markdown."""

import argparse
import io
import itertools
import pathlib
import sys
import textwrap
from typing import Callable, Iterator, TextIO, TypeVar

from stardoc.proto import stardoc_output_pb2

_AttributeType = stardoc_output_pb2.AttributeType

_T = TypeVar("_T")

# Display strings for the attribute types that have a dedicated rendering.
# Types missing from this table fall back to the proto enum's own name.
_ATTR_TYPE_NAMES = {
    _AttributeType.NAME: "Name",
    _AttributeType.INT: "int",
    _AttributeType.LABEL: "label",
    _AttributeType.STRING: "str",
    _AttributeType.STRING_LIST: "list[str]",
    _AttributeType.INT_LIST: "list[int]",
    _AttributeType.LABEL_LIST: "list[label]",
    _AttributeType.BOOLEAN: "bool",
    _AttributeType.LABEL_STRING_DICT: "dict[label, str]",
    _AttributeType.STRING_DICT: "dict[str, str]",
    _AttributeType.STRING_LIST_DICT: "dict[str, list[str]]",
    _AttributeType.OUTPUT: "label",
    _AttributeType.OUTPUT_LIST: "list[label]",
}


def _anchor_id(text: str) -> str:
    """Return `text` as a lower-cased `#anchor` with dots replaced by `_`."""
    # MyST/Sphinx's markdown processing doesn't like dots in anchor ids.
    return "#" + text.replace(".", "_").lower()


# Create block attribute line.
# See https://myst-parser.readthedocs.io/en/latest/syntax/optional.html#block-attributes
def _block_attrs(*attrs: str) -> str:
    """Return `attrs` space-joined inside braces, followed by a newline."""
    return "{" + " ".join(attrs) + "}\n"


def _link(display: str, link: str = "", *, ref: str = "", classes: str = "") -> str:
    """Build a markdown link: `[display][ref](link){classes}`.

    Each of `ref`, `link` and `classes` is omitted (brackets included) when
    it is empty.
    """
    if ref:
        ref = f"[{ref}]"
    if link:
        link = f"({link})"
    if classes:
        classes = "{" + classes + "}"
    return f"[{display}]{ref}{link}{classes}"


def _span(display: str, classes: str = ".span") -> str:
    """Return `[display]{classes}`."""
    return f"[{display}]{{" + classes + "}"


def _link_here_icon(anchor: str) -> str:
    """Return a pilcrow link to `anchor` carrying the `.headerlink` class."""
    # The headerlink class activates some special logic to show/hide
    # text upon mouse-over; it's how headings show a clickable link.
    # The pilcrow is spelled by name so the source stays ASCII-only and
    # cannot be corrupted by a mis-decoded file.
    return _link("\N{PILCROW SIGN}", anchor, classes=".headerlink")


def _inline_anchor(anchor: str) -> str:
    """Return an empty span whose attribute block is `anchor`."""
    return _span("", anchor)


def _indent_block_text(text: str) -> str:
    """Strip `text` and indent every line after the first.

    The first line is left unindented; callers write the leading indent
    themselves.
    """
    return text.strip().replace("\n", "\n ")


def _join_csv_and(values: list[str]) -> str:
    """Join `values` with commas, prefixing the final item with "and ".

    An empty list yields "" and a single item is returned unchanged. The
    input list is not modified.
    """
    if not values:
        return ""
    if len(values) == 1:
        return values[0]
    values = list(values)
    values[-1] = "and " + values[-1]
    return ", ".join(values)


def _position_iter(values: list[_T]) -> Iterator[tuple[bool, bool, _T]]:
    """Yield `(is_first, is_last, value)` for each element of `values`."""
    last_index = len(values) - 1
    for i, value in enumerate(values):
        yield i == 0, i == last_index, value


def _sort_attributes_inplace(attributes):
    """Sort `attributes` in place into signature order."""
    # Sort attributes so the iteration order results in a Python-syntax
    # valid signature. Keep name first because that's convention.
    attributes.sort(key=lambda a: (a.name != "name", bool(a.default_value), a.name))


class _MySTRenderer:
    """Writes a Stardoc module as MyST markdown using `bzl:` directives."""

    def __init__(
        self,
        module: stardoc_output_pb2.ModuleInfo,
        out_stream: TextIO,
        public_load_path: str,
    ):
        """Store the render inputs.

        Args:
            module: The module to render.
            out_stream: Text stream that receives the markdown.
            public_load_path: Label to show for the file; when empty, the
                label is derived from `module.file`.
        """
        self._module = module
        self._out_stream = out_stream
        self._public_load_path = public_load_path

    def render(self):
        """Render the module given at construction to the output stream."""
        self._render_module(self._module)

    def _render_module(self, module: stardoc_output_pb2.ModuleInfo):
        """Write the file header, then every documented object sorted by name."""
        if self._public_load_path:
            bzl_path = self._public_load_path
        else:
            # Keep only the part after the first "//" (drops any prefix
            # that precedes it in the recorded file label).
            bzl_path = "//" + module.file.split("//")[1]

        self._write(":::{default-domain} bzl\n:::\n")
        self._write(":::{bzl:currentfile} ", bzl_path, "\n:::\n\n")
        self._write(
            f"# {bzl_path}\n",
            "\n",
            module.module_docstring.strip(),
            "\n\n",
        )

        # Pair every object with its name and renderer so all kinds can be
        # sorted together.
        objects = itertools.chain(
            ((r.rule_name, r, self._render_rule) for r in module.rule_info),
            ((p.provider_name, p, self._render_provider) for p in module.provider_info),
            ((f.function_name, f, self._render_func) for f in module.func_info),
            ((a.aspect_name, a, self._render_aspect) for a in module.aspect_info),
            (
                (m.extension_name, m, self._render_module_extension)
                for m in module.module_extension_info
            ),
            (
                (r.rule_name, r, self._render_repository_rule)
                for r in module.repository_rule_info
            ),
        )
        # Sort the objects by name (case-insensitively).
        objects = sorted(objects, key=lambda v: v[0].lower())

        for _, obj, func in objects:
            func(obj)
            self._write("\n")

    def _render_aspect(self, aspect: stardoc_output_pb2.AspectInfo):
        """Write a `bzl:aspect` directive for `aspect`."""
        _sort_attributes_inplace(aspect.attribute)
        self._write("::::::{bzl:aspect} ", aspect.aspect_name, "\n\n")
        edges = ", ".join(sorted(f"`{attr}`" for attr in aspect.aspect_attribute))
        self._write(":aspect-attributes: ", edges, "\n\n")
        self._write(aspect.doc_string.strip(), "\n\n")

        if aspect.attribute:
            self._render_attributes(aspect.attribute)
            self._write("\n")
        self._write("::::::\n")

    def _render_module_extension(self, mod_ext: stardoc_output_pb2.ModuleExtensionInfo):
        """Write a `bzl:module-extension` directive with nested tag classes."""
        self._write("::::::{bzl:module-extension} ", mod_ext.extension_name, "\n\n")
        self._write(mod_ext.doc_string.strip(), "\n\n")

        for tag in mod_ext.tag_class:
            # Tag classes are rendered under their bare name, without the
            # extension name as a prefix.
            tag_name = tag.tag_name
            self._write(":::::{bzl:tag-class} ", tag_name, "\n\n")

            _sort_attributes_inplace(tag.attribute)
            self._render_signature(
                tag_name,
                tag.attribute,
                get_name=lambda a: a.name,
                get_default=lambda a: a.default_value,
            )

            self._write(tag.doc_string.strip(), "\n\n")
            self._render_attributes(tag.attribute)
            self._write(":::::\n")
        self._write("::::::\n")

    def _render_repository_rule(self, repo_rule: stardoc_output_pb2.RepositoryRuleInfo):
        """Write a `bzl:repo-rule` directive for `repo_rule`."""
        self._write("::::::{bzl:repo-rule} ")
        _sort_attributes_inplace(repo_rule.attribute)
        self._render_signature(
            repo_rule.rule_name,
            repo_rule.attribute,
            get_name=lambda a: a.name,
            get_default=lambda a: a.default_value,
        )
        self._write(repo_rule.doc_string.strip(), "\n\n")
        if repo_rule.attribute:
            self._render_attributes(repo_rule.attribute)
        if repo_rule.environ:
            self._write(":envvars: ", ", ".join(sorted(repo_rule.environ)))
        self._write("\n")
        # Close the fence like every other renderer does; left open, the
        # directive would absorb whatever is rendered after it.
        self._write("::::::\n")

    def _render_rule(self, rule: stardoc_output_pb2.RuleInfo):
        """Write a `bzl:rule` directive for `rule`."""
        _sort_attributes_inplace(rule.attribute)
        self._write("::::{bzl:rule} ")
        self._render_signature(
            rule.rule_name,
            rule.attribute,
            get_name=lambda r: r.name,
            get_default=lambda r: r.default_value,
        )
        self._write(rule.doc_string.strip(), "\n\n")

        if rule.advertised_providers.provider_name:
            self._write(":provides: ")
            self._write(" | ".join(rule.advertised_providers.provider_name))
            self._write("\n")
        self._write("\n")

        if rule.attribute:
            self._render_attributes(rule.attribute)
            self._write("\n")
        self._write("::::\n")

    def _rule_attr_type_string(self, attr: stardoc_output_pb2.AttributeInfo) -> str:
        """Return the display string for the type of `attr`."""
        type_name = _ATTR_TYPE_NAMES.get(attr.type)
        if type_name is not None:
            return type_name
        # If we get here, it means the value was unknown for some reason.
        # Rather than error, give some somewhat understandable value.
        return _AttributeType.Name(attr.type)

    def _render_func(self, func: stardoc_output_pb2.StarlarkFunctionInfo):
        """Write a `bzl:function` directive for `func`.

        Emits the signature, the docstring, one `:arg:` field per rendered
        parameter, and the return/deprecation docs when they are non-empty.
        """
        self._write("::::::{bzl:function} ")

        parameters = self._render_func_signature(func)

        self._write(func.doc_string.strip(), "\n\n")

        for param in parameters:
            self._write(f":arg {param.name}:\n")
            if param.default_value:
                default_value = self._format_default_value(param.default_value)
                self._write(" {default-value}`", default_value, "`\n")
            if param.doc_string:
                self._write(" ", _indent_block_text(param.doc_string), "\n")
            else:
                self._write(" _undocumented_\n")
            self._write("\n")

        # `return` is a Python keyword, so the field needs getattr().
        if return_doc := getattr(func, "return").doc_string:
            self._write(":returns:\n")
            self._write(" ", _indent_block_text(return_doc), "\n")
        if func.deprecated.doc_string:
            self._write(":::::{deprecated}: unknown\n")
            self._write(" ", _indent_block_text(func.deprecated.doc_string), "\n")
            self._write(":::::\n")
        self._write("::::::\n")

    def _render_func_signature(self, func):
        """Write `name(params...)` for `func` and return the parameters.

        Returns:
            The parameters in the order they were written, with any `self`
            parameter removed.
        """
        self._write(f"{func.function_name}(")
        # TODO: Have an "is method" directive in the docstring to decide if
        # the self parameter should be removed.
        parameters = [param for param in func.parameter if param.name != "self"]

        # Unfortunately, the stardoc info is incomplete and inaccurate:
        #  * The position of the `*args` param is wrong; it'll always
        #    be last (or second to last, if kwargs is present).
        #  * Stardoc doesn't explicitly tell us if an arg is `*args` or
        #    `**kwargs`. Hence f(*args) or f(**kwargs) is ambiguous.
        # See these issues:
        #   https://github.com/bazelbuild/stardoc/issues/226
        #   https://github.com/bazelbuild/stardoc/issues/225
        #
        # Below, we try to take what info we have and infer what the original
        # signature was. In short:
        #  * A default=empty, mandatory=false arg is either *args or **kwargs
        #  * If two of those are seen, the first is *args and the second is
        #    **kwargs. Recall, however, the position of *args is mis-represented.
        #  * If a single default=empty, mandatory=false arg is found, then
        #    it's ambiguous as to whether it's *args or **kwargs. To figure
        #    that out, we:
        #    * If it's not the last arg, then it must be *args. In practice,
        #      this never occurs due to #226 above.
        #    * If we saw a mandatory arg after an optional arg, then *args
        #      was supposed to be between them (otherwise it wouldn't be
        #      valid syntax).
        #    * Otherwise, it's ambiguous. We just guess by looking at the
        #      parameter name.
        var_args = None  # (index, param) of the *args candidate
        var_kwargs = None  # param of the **kwargs candidate
        saw_mandatory_after_optional = False
        first_mandatory_after_optional_index = None
        optionals_started = False
        for i, p in enumerate(parameters):
            optionals_started = optionals_started or not p.mandatory
            if p.mandatory and optionals_started:
                saw_mandatory_after_optional = True
                if first_mandatory_after_optional_index is None:
                    first_mandatory_after_optional_index = i

            if not p.default_value and not p.mandatory:
                if var_args is None:
                    var_args = (i, p)
                else:
                    var_kwargs = p

        if var_args and not var_kwargs:
            # A lone candidate that isn't last stays *args. A lone candidate
            # in last position is reclassified as **kwargs when a mandatory
            # arg followed an optional one, or when its name suggests it.
            is_last_param = var_args[0] == len(parameters) - 1
            if is_last_param and (
                saw_mandatory_after_optional
                or var_args[1].name in ("kwargs", "attrs")
            ):
                var_kwargs = var_args[1]
                var_args = None

        # Partial workaround for
        # https://github.com/bazelbuild/stardoc/issues/226: `*args` renders last
        if var_args and var_kwargs and first_mandatory_after_optional_index is not None:
            parameters.pop(var_args[0])
            parameters.insert(first_mandatory_after_optional_index, var_args[1])

        # The only way a mandatory-after-optional can occur is
        # if there was `*args` before it. But if we didn't see it,
        # it must have been the unbound `*` symbol, which stardoc doesn't
        # tell us exists.
        if saw_mandatory_after_optional and not var_args:
            self._write("*, ")
        for _, is_last, p in _position_iter(parameters):
            if var_args and p.name == var_args[1].name:
                self._write("*")
            elif var_kwargs and p.name == var_kwargs.name:
                self._write("**")
            self._write(p.name)
            if p.default_value:
                self._write("=", self._format_default_value(p.default_value))
            if not is_last:
                self._write(", ")
        self._write(")\n")
        return parameters

    def _render_provider(self, provider: stardoc_output_pb2.ProviderInfo):
        """Write a `bzl:provider` directive, its signature and its fields."""
        self._write("::::::{bzl:provider} ", provider.provider_name, "\n")
        if provider.origin_key:
            self._render_origin_key_option(provider.origin_key)
        self._write("\n")

        self._write(provider.doc_string.strip(), "\n\n")

        self._write(":::::{bzl:function} ")
        provider.field_info.sort(key=lambda f: f.name)
        self._render_signature(
            "",
            provider.field_info,
            get_name=lambda f: f.name,
        )
        # TODO: Add support for provider.init once our Bazel version supports
        # that field
        self._write(":::::\n")

        for field in provider.field_info:
            self._write(":::::{bzl:provider-field} ", field.name, "\n")
            self._write(field.doc_string.strip())
            self._write("\n")
            self._write(":::::\n")
        self._write("::::::\n")

    def _render_attributes(self, attributes: list[stardoc_output_pb2.AttributeInfo]):
        """Write one `:attr name:` field per attribute.

        Each field carries the default value (when set), the type, the
        docstring, a `bzl:attr-info` block and, when present, the required
        provider groups.
        """
        for attr in attributes:
            attr_type = self._rule_attr_type_string(attr)
            self._write(f":attr {attr.name}:\n")
            if attr.default_value:
                self._write(" {bzl:default-value}`%s`\n" % attr.default_value)
            self._write(" {type}`%s`\n" % attr_type)
            self._write(" ", _indent_block_text(attr.doc_string), "\n")
            self._write(" :::{bzl:attr-info} Info\n")
            if attr.mandatory:
                self._write(" :mandatory:\n")
            self._write(" :::\n")
            self._write("\n")

            if attr.provider_name_group:
                self._write(" {required-providers}`")
                for _, outer_is_last, provider_group in _position_iter(
                    attr.provider_name_group
                ):
                    pairs = list(
                        zip(
                            provider_group.origin_key,
                            provider_group.provider_name,
                            strict=True,
                        )
                    )
                    # Groups with several providers are wrapped in brackets.
                    if len(pairs) > 1:
                        self._write("[")
                    for _, inner_is_last, (origin_key, name) in _position_iter(pairs):
                        # NOTE(review): the Stardoc proto documents
                        # "<native>" as the file of natively-defined
                        # entities; an empty file is treated the same way.
                        # Confirm against the Stardoc version in use.
                        if origin_key.file in ("", "<native>"):
                            origin = origin_key.name
                        else:
                            origin = f"{origin_key.file}%{origin_key.name}"
                        # We have to use "title <ref>" syntax because the same
                        # name might map to different origins. Stardoc gives us
                        # the provider's actual name, not the name of the symbol
                        # used in the source.
                        self._write(f"'{name} <{origin}>'")
                        if not inner_is_last:
                            self._write(", ")

                    if len(pairs) > 1:
                        self._write("]")

                    if not outer_is_last:
                        self._write(" | ")
                self._write("`\n")

            self._write("\n")

    def _render_signature(
        self,
        name: str,
        parameters: list[_T],
        *,
        get_name: Callable[[_T], str],
        get_default: Callable[[_T], "str | None"] = lambda v: None,
    ):
        """Write `name(p1, p2=default, ...)` followed by a blank line.

        Args:
            name: Text written before the opening parenthesis.
            parameters: Objects to render, in signature order.
            get_name: Returns the display name of a parameter.
            get_default: Returns the default value of a parameter; a falsy
                result means no `=default` is written.
        """
        self._write(name, "(")
        for _, is_last, param in _position_iter(parameters):
            self._write(f"{get_name(param)}")
            default_value = get_default(param)
            if default_value:
                default_value = self._format_default_value(default_value)
                self._write(f"={default_value}")
            if not is_last:
                self._write(", ")
        self._write(")\n\n")

    def _render_origin_key_option(self, origin_key, indent=""):
        """Write an `:origin-key: file%name` option line for `origin_key`."""
        self._write(
            indent,
            ":origin-key: ",
            self._format_option_value(f"{origin_key.file}%{origin_key.name}"),
            "\n",
        )

    def _format_default_value(self, default_value):
        """Return `default_value` adjusted for display in a signature."""
        # Handle values starting with "<" (presumably object reprs such as
        # `<function foo>` -- verify against Stardoc output).
        # For now, just use quotes for lack of a better option
        if default_value.startswith("<"):
            return f"'{default_value}'"
        elif default_value.startswith("Label("):
            # Handle Label(*, "@some//label:target"): keep only the quoted
            # string, quotes included.
            start_quote = default_value.find('"')
            end_quote = default_value.rfind('"')
            if start_quote == end_quote:
                # No quoted string to extract (zero or one quote); show the
                # value as-is rather than dropping it.
                return default_value
            return default_value[start_quote : end_quote + 1]
        else:
            return default_value

    def _format_option_value(self, value):
        """Return `value` with a leading `@` backslash-escaped."""
        # Leading @ symbols are special markup; escape them.
        if value.startswith("@"):
            return "\\" + value
        else:
            return value

    def _write(self, *lines: str):
        """Write each string in `lines` to the output stream, in order."""
        self._out_stream.writelines(lines)


def _convert(
    *,
    proto: pathlib.Path,
    output: pathlib.Path,
    public_load_path: str,
):
    """Parse the `ModuleInfo` at `proto` and write its markdown to `output`."""
    module = stardoc_output_pb2.ModuleInfo.FromString(proto.read_bytes())
    with output.open("wt", encoding="utf8") as out_stream:
        _MySTRenderer(module, out_stream, public_load_path).render()


def _create_parser():
    """Build the command-line parser; `@file` arguments are expanded."""
    parser = argparse.ArgumentParser(fromfile_prefix_chars="@")
    # Both paths are dereferenced unconditionally by _convert(), so report
    # a missing flag as a usage error instead of failing later on None.
    parser.add_argument("--proto", dest="proto", type=pathlib.Path, required=True)
    parser.add_argument("--output", dest="output", type=pathlib.Path, required=True)
    parser.add_argument("--public-load-path", dest="public_load_path")
    return parser


def main(args):
    """Run the conversion for the command-line `args`; returns exit code 0."""
    options = _create_parser().parse_args(args)
    _convert(
        proto=options.proto,
        output=options.output,
        public_load_path=options.public_load_path,
    )
    return 0


if __name__ == "__main__":
    sys.exit(main(sys.argv[1:]))