//===- OpDocGen.cpp - MLIR operation documentation generator --------------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // // OpDocGen uses the description of operations to generate documentation for the // operations. // //===----------------------------------------------------------------------===// #include "DialectGenUtilities.h" #include "DocGenUtilities.h" #include "OpGenHelpers.h" #include "mlir/Support/IndentedOstream.h" #include "mlir/TableGen/AttrOrTypeDef.h" #include "mlir/TableGen/GenInfo.h" #include "mlir/TableGen/Operator.h" #include "llvm/ADT/DenseMap.h" #include "llvm/ADT/SetVector.h" #include "llvm/ADT/StringExtras.h" #include "llvm/ADT/StringRef.h" #include "llvm/Support/CommandLine.h" #include "llvm/Support/FormatVariadic.h" #include "llvm/Support/Regex.h" #include "llvm/Support/Signals.h" #include "llvm/TableGen/Error.h" #include "llvm/TableGen/Record.h" #include "llvm/TableGen/TableGenBackend.h" #include #include //===----------------------------------------------------------------------===// // Commandline Options //===----------------------------------------------------------------------===// static llvm::cl::OptionCategory docCat("Options for -gen-(attrdef|typedef|op|dialect)-doc"); llvm::cl::opt stripPrefix("strip-prefix", llvm::cl::desc("Strip prefix of the fully qualified names"), llvm::cl::init("::mlir::"), llvm::cl::cat(docCat)); llvm::cl::opt allowHugoSpecificFeatures( "allow-hugo-specific-features", llvm::cl::desc("Allows using features specific to Hugo"), llvm::cl::init(false), llvm::cl::cat(docCat)); using namespace llvm; using namespace mlir; using namespace mlir::tblgen; using mlir::tblgen::Operator; void mlir::tblgen::emitSummary(StringRef summary, raw_ostream &os) { if (!summary.empty()) { llvm::StringRef trimmed = summary.trim(); char first = std::toupper(trimmed.front()); llvm::StringRef rest = trimmed.drop_front(); os << "\n_" << first << rest << "_\n\n"; } } // Emit the description by aligning the text to the left per line (e.g., // removing the minimum indentation across the block). // // This expects that the description in the tablegen file is already formatted // in a way the user wanted but has some additional indenting due to being // nested in the op definition. void mlir::tblgen::emitDescription(StringRef description, raw_ostream &os) { raw_indented_ostream ros(os); ros.printReindented(description.rtrim(" \t")); } void mlir::tblgen::emitDescriptionComment(StringRef description, raw_ostream &os, StringRef prefix) { if (description.empty()) return; raw_indented_ostream ros(os); StringRef trimmed = description.rtrim(" \t"); ros.printReindented(trimmed, (Twine(prefix) + "/// ").str()); if (!trimmed.ends_with("\n")) ros << "\n"; } // Emits `str` with trailing newline if not empty. static void emitIfNotEmpty(StringRef str, raw_ostream &os) { if (!str.empty()) { emitDescription(str, os); os << "\n"; } } /// Emit the given named constraint. template static void emitNamedConstraint(const T &it, raw_ostream &os) { if (!it.name.empty()) os << "| `" << it.name << "`"; else os << "«unnamed»"; os << " | " << it.constraint.getSummary() << "\n"; } //===----------------------------------------------------------------------===// // Operation Documentation //===----------------------------------------------------------------------===// /// Emit the assembly format of an operation. static void emitAssemblyFormat(StringRef opName, StringRef format, raw_ostream &os) { os << "\nSyntax:\n\n```\noperation ::= `" << opName << "` "; // Print the assembly format aligned. unsigned indent = strlen("operation ::= "); std::pair split = format.split('\n'); os << split.first.trim() << "\n"; do { split = split.second.split('\n'); StringRef formatChunk = split.first.trim(); if (!formatChunk.empty()) os.indent(indent) << formatChunk << "\n"; } while (!split.second.empty()); os << "```\n\n"; } /// Place `text` between backticks so that the Markdown processor renders it as /// inline code. static std::string backticks(const std::string &text) { return '`' + text + '`'; } static void emitOpTraitsDoc(const Operator &op, raw_ostream &os) { // TODO: We should link to the trait/documentation of it. That also means we // should add descriptions to traits that can be queried. // Collect using set to sort effects, interfaces & traits. std::set effects, interfaces, traits; for (auto &trait : op.getTraits()) { if (isa(&trait)) continue; std::string name = trait.getDef().getName().str(); StringRef ref = name; StringRef traitName = trait.getDef().getValueAsString("trait"); traitName.consume_back("::Trait"); traitName.consume_back("::Impl"); if (ref.starts_with("anonymous_")) name = traitName.str(); if (isa(&trait)) { if (trait.getDef().isSubClassOf("SideEffectsTraitBase")) { auto effectName = trait.getDef().getValueAsString("baseEffectName"); effectName.consume_front("::"); effectName.consume_front("mlir::"); std::string effectStr; llvm::raw_string_ostream os(effectStr); os << effectName << "{"; auto list = trait.getDef().getValueAsListOfDefs("effects"); llvm::interleaveComma(list, os, [&](Record *rec) { StringRef effect = rec->getValueAsString("effect"); effect.consume_front("::"); effect.consume_front("mlir::"); os << effect << " on " << rec->getValueAsString("resource"); }); os << "}"; effects.insert(backticks(os.str())); name.append(llvm::formatv(" ({0})", traitName).str()); } interfaces.insert(backticks(name)); continue; } traits.insert(backticks(name)); } if (!traits.empty()) { llvm::interleaveComma(traits, os << "\nTraits: "); os << "\n"; } if (!interfaces.empty()) { llvm::interleaveComma(interfaces, os << "\nInterfaces: "); os << "\n"; } if (!effects.empty()) { llvm::interleaveComma(effects, os << "\nEffects: "); os << "\n"; } } static StringRef resolveAttrDescription(const Attribute &attr) { StringRef description = attr.getDescription(); if (description.empty()) return attr.getBaseAttr().getDescription(); return description; } static void emitOpDoc(const Operator &op, raw_ostream &os) { std::string classNameStr = op.getQualCppClassName(); StringRef className = classNameStr; (void)className.consume_front(stripPrefix); os << llvm::formatv("### `{0}` ({1})\n", op.getOperationName(), className); // Emit the summary, syntax, and description if present. if (op.hasSummary()) emitSummary(op.getSummary(), os); if (op.hasAssemblyFormat()) emitAssemblyFormat(op.getOperationName(), op.getAssemblyFormat().trim(), os); if (op.hasDescription()) mlir::tblgen::emitDescription(op.getDescription(), os); emitOpTraitsDoc(op, os); // Emit attributes. if (op.getNumAttributes() != 0) { os << "\n#### Attributes:\n\n"; // Note: This table is HTML rather than markdown so the attribute's // description can appear in an expandable region. The description may be // multiple lines, which is not supported in a markdown table cell. os << "\n"; // Header. os << "\n"; for (const auto &it : op.getAttributes()) { StringRef storageType = it.attr.getStorageType(); // Name and storage type. os << ""; os << "\n"; } os << "
AttributeMLIR TypeDescription
" << it.name << "" << storageType << ""; StringRef description = resolveAttrDescription(it.attr); if (allowHugoSpecificFeatures && !description.empty()) { // Expandable description. // This appears as just the summary, but when clicked shows the full // description. os << "
" << "" << it.attr.getSummary() << "" << "{{% markdown %}}" << description << "{{% /markdown %}}" << "
"; } else { // Fallback: Single-line summary. os << it.attr.getSummary(); } os << "
\n"; } // Emit each of the operands. if (op.getNumOperands() != 0) { os << "\n#### Operands:\n\n"; os << "| Operand | Description |\n" << "| :-----: | ----------- |\n"; for (const auto &it : op.getOperands()) emitNamedConstraint(it, os); } // Emit results. if (op.getNumResults() != 0) { os << "\n#### Results:\n\n"; os << "| Result | Description |\n" << "| :----: | ----------- |\n"; for (const auto &it : op.getResults()) emitNamedConstraint(it, os); } // Emit successors. if (op.getNumSuccessors() != 0) { os << "\n#### Successors:\n\n"; os << "| Successor | Description |\n" << "| :-------: | ----------- |\n"; for (const auto &it : op.getSuccessors()) emitNamedConstraint(it, os); } os << "\n"; } static void emitSourceLink(StringRef inputFilename, raw_ostream &os) { size_t pathBegin = inputFilename.find("mlir/include/mlir/"); if (pathBegin == StringRef::npos) return; StringRef inputFromMlirInclude = inputFilename.substr(pathBegin); os << "[source](https://github.com/llvm/llvm-project/blob/main/" << inputFromMlirInclude << ")\n\n"; } static void emitOpDoc(const RecordKeeper &recordKeeper, raw_ostream &os) { auto opDefs = getRequestedOpDefinitions(recordKeeper); os << "\n"; emitSourceLink(recordKeeper.getInputFilename(), os); for (const llvm::Record *opDef : opDefs) emitOpDoc(Operator(opDef), os); } //===----------------------------------------------------------------------===// // Attribute Documentation //===----------------------------------------------------------------------===// static void emitAttrDoc(const Attribute &attr, raw_ostream &os) { os << "### " << attr.getSummary() << "\n\n"; emitDescription(attr.getDescription(), os); os << "\n\n"; } //===----------------------------------------------------------------------===// // Type Documentation //===----------------------------------------------------------------------===// static void emitTypeDoc(const Type &type, raw_ostream &os) { os << "### " << type.getSummary() << "\n\n"; emitDescription(type.getDescription(), os); os << "\n\n"; } //===----------------------------------------------------------------------===// // TypeDef Documentation //===----------------------------------------------------------------------===// static void emitAttrOrTypeDefAssemblyFormat(const AttrOrTypeDef &def, raw_ostream &os) { ArrayRef parameters = def.getParameters(); char prefix = isa(def) ? '#' : '!'; if (parameters.empty()) { os << "\nSyntax: `" << prefix << def.getDialect().getName() << "." << def.getMnemonic() << "`\n"; return; } os << "\nSyntax:\n\n```\n" << prefix << def.getDialect().getName() << "." << def.getMnemonic() << "<\n"; for (const auto &it : llvm::enumerate(parameters)) { const AttrOrTypeParameter ¶m = it.value(); os << " " << param.getSyntax(); if (it.index() < (parameters.size() - 1)) os << ","; os << " # " << param.getName() << "\n"; } os << ">\n```\n"; } static void emitAttrOrTypeDefDoc(const AttrOrTypeDef &def, raw_ostream &os) { os << llvm::formatv("### {0}\n", def.getCppClassName()); // Emit the summary if present. if (def.hasSummary()) os << "\n" << def.getSummary() << "\n"; // Emit the syntax if present. if (def.getMnemonic() && !def.hasCustomAssemblyFormat()) emitAttrOrTypeDefAssemblyFormat(def, os); // Emit the description if present. if (def.hasDescription()) { os << "\n"; mlir::tblgen::emitDescription(def.getDescription(), os); } // Emit parameter documentation. ArrayRef parameters = def.getParameters(); if (!parameters.empty()) { os << "\n#### Parameters:\n\n"; os << "| Parameter | C++ type | Description |\n" << "| :-------: | :-------: | ----------- |\n"; for (const auto &it : parameters) { auto desc = it.getSummary(); os << "| " << it.getName() << " | `" << it.getCppType() << "` | " << (desc ? *desc : "") << " |\n"; } } os << "\n"; } static void emitAttrOrTypeDefDoc(const RecordKeeper &recordKeeper, raw_ostream &os, StringRef recordTypeName) { std::vector defs = recordKeeper.getAllDerivedDefinitions(recordTypeName); os << "\n"; for (const llvm::Record *def : defs) emitAttrOrTypeDefDoc(AttrOrTypeDef(def), os); } //===----------------------------------------------------------------------===// // Dialect Documentation //===----------------------------------------------------------------------===// struct OpDocGroup { const Dialect &getDialect() const { return ops.front().getDialect(); } // Returns the summary description of the section. std::string summary = ""; // Returns the description of the section. StringRef description = ""; // Instances inside the section. std::vector ops; }; static void maybeNest(bool nest, llvm::function_ref fn, raw_ostream &os) { std::string str; llvm::raw_string_ostream ss(str); fn(ss); for (StringRef x : llvm::split(ss.str(), "\n")) { if (nest && x.starts_with("#")) os << "#"; os << x << "\n"; } } static void emitBlock(ArrayRef attributes, StringRef inputFilename, ArrayRef attrDefs, ArrayRef ops, ArrayRef types, ArrayRef typeDefs, raw_ostream &os) { if (!ops.empty()) { os << "## Operations\n\n"; emitSourceLink(inputFilename, os); for (const OpDocGroup &grouping : ops) { bool nested = !grouping.summary.empty(); maybeNest( nested, [&](raw_ostream &os) { if (nested) { os << "## " << StringRef(grouping.summary).trim() << "\n\n"; emitDescription(grouping.description, os); os << "\n\n"; } for (const Operator &op : grouping.ops) { emitOpDoc(op, os); } }, os); } } if (!attributes.empty()) { os << "## Attribute constraints\n\n"; for (const Attribute &attr : attributes) emitAttrDoc(attr, os); } if (!attrDefs.empty()) { os << "## Attributes\n\n"; for (const AttrDef &def : attrDefs) emitAttrOrTypeDefDoc(def, os); } // TODO: Add link between use and def for types if (!types.empty()) { os << "## Type constraints\n\n"; for (const Type &type : types) emitTypeDoc(type, os); } if (!typeDefs.empty()) { os << "## Types\n\n"; for (const TypeDef &def : typeDefs) emitAttrOrTypeDefDoc(def, os); } } static void emitDialectDoc(const Dialect &dialect, StringRef inputFilename, ArrayRef attributes, ArrayRef attrDefs, ArrayRef ops, ArrayRef types, ArrayRef typeDefs, raw_ostream &os) { os << "# '" << dialect.getName() << "' Dialect\n\n"; emitIfNotEmpty(dialect.getSummary(), os); emitIfNotEmpty(dialect.getDescription(), os); // Generate a TOC marker except if description already contains one. llvm::Regex r("^[[:space:]]*\\[TOC\\]$", llvm::Regex::RegexFlags::Newline); if (!r.match(dialect.getDescription())) os << "[TOC]\n\n"; emitBlock(attributes, inputFilename, attrDefs, ops, types, typeDefs, os); } static bool emitDialectDoc(const RecordKeeper &recordKeeper, raw_ostream &os) { std::vector dialectDefs = recordKeeper.getAllDerivedDefinitionsIfDefined("Dialect"); SmallVector dialects(dialectDefs.begin(), dialectDefs.end()); std::optional dialect = findDialectToGenerate(dialects); if (!dialect) return true; std::vector opDefs = getRequestedOpDefinitions(recordKeeper); std::vector attrDefs = recordKeeper.getAllDerivedDefinitionsIfDefined("DialectAttr"); std::vector typeDefs = recordKeeper.getAllDerivedDefinitionsIfDefined("DialectType"); std::vector typeDefDefs = recordKeeper.getAllDerivedDefinitionsIfDefined("TypeDef"); std::vector attrDefDefs = recordKeeper.getAllDerivedDefinitionsIfDefined("AttrDef"); std::vector dialectAttrs; std::vector dialectAttrDefs; std::vector dialectOps; std::vector dialectTypes; std::vector dialectTypeDefs; llvm::SmallDenseSet seen; auto addIfInDialect = [&](llvm::Record *record, const auto &def, auto &vec) { if (seen.insert(record).second && def.getDialect() == *dialect) { vec.push_back(def); return true; } return false; }; SmallDenseMap opDocGroup; for (Record *def : attrDefDefs) addIfInDialect(def, AttrDef(def), dialectAttrDefs); for (Record *def : attrDefs) addIfInDialect(def, Attribute(def), dialectAttrs); for (Record *def : opDefs) { if (Record *group = def->getValueAsOptionalDef("opDocGroup")) { OpDocGroup &op = opDocGroup[group]; addIfInDialect(def, Operator(def), op.ops); } else { OpDocGroup op; op.ops.emplace_back(def); addIfInDialect(def, op, dialectOps); } } for (Record *rec : recordKeeper.getAllDerivedDefinitionsIfDefined("OpDocGroup")) { if (opDocGroup[rec].ops.empty()) continue; opDocGroup[rec].summary = rec->getValueAsString("summary"); opDocGroup[rec].description = rec->getValueAsString("description"); dialectOps.push_back(opDocGroup[rec]); } for (Record *def : typeDefDefs) addIfInDialect(def, TypeDef(def), dialectTypeDefs); for (Record *def : typeDefs) addIfInDialect(def, Type(def), dialectTypes); // Sort alphabetically ignorning dialect for ops and section name for // sections. // TODO: The sorting order could be revised, currently attempting to sort of // keep in alphabetical order. std::sort(dialectOps.begin(), dialectOps.end(), [](const OpDocGroup &lhs, const OpDocGroup &rhs) { auto getDesc = [](const OpDocGroup &arg) -> StringRef { if (!arg.summary.empty()) return arg.summary; return arg.ops.front().getDef().getValueAsString("opName"); }; return getDesc(lhs).compare_insensitive(getDesc(rhs)) < 0; }); os << "\n"; emitDialectDoc(*dialect, recordKeeper.getInputFilename(), dialectAttrs, dialectAttrDefs, dialectOps, dialectTypes, dialectTypeDefs, os); return false; } //===----------------------------------------------------------------------===// // Gen Registration //===----------------------------------------------------------------------===// static mlir::GenRegistration genAttrRegister("gen-attrdef-doc", "Generate dialect attribute documentation", [](const RecordKeeper &records, raw_ostream &os) { emitAttrOrTypeDefDoc(records, os, "AttrDef"); return false; }); static mlir::GenRegistration genOpRegister("gen-op-doc", "Generate dialect documentation", [](const RecordKeeper &records, raw_ostream &os) { emitOpDoc(records, os); return false; }); static mlir::GenRegistration genTypeRegister("gen-typedef-doc", "Generate dialect type documentation", [](const RecordKeeper &records, raw_ostream &os) { emitAttrOrTypeDefDoc(records, os, "TypeDef"); return false; }); static mlir::GenRegistration genRegister("gen-dialect-doc", "Generate dialect documentation", [](const RecordKeeper &records, raw_ostream &os) { return emitDialectDoc(records, os); });