| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275 |
- #!/usr/bin/env python3
- """Generates C++ header to support LLVM-style RTTI for a class hierarchy.
- # Background
- A C++ class hierarchy supported by this script consists of *abstract* classes,
- which can be inherited from but can't be instantiated, and *concrete* classes,
- which can be instantiated but can't be inherited from. Classes can inherit from
- at most one other class in the hierarchy; a class that doesn't inherit from
- any other class is called a *root* class, and it cannot be concrete.
- # Input format
- This script's input file declares every class in the hierarchy, and specifies
- the parent of each non-root class. The input file consists of comment lines
- starting with `#`, whitespace lines, and one `;`-terminated line for each class.
- The core of a line is `class` followed by the class name. `class` can be
- prefixed with `root` or `abstract` to specify the corresponding kind of class;
- if there is no prefix, the class is concrete. If the class is not a root class,
- the name is followed by `:` and then the name of the class it inherits from. A
- class cannot inherit from a class defined later in the file.
- For example:
- root class R;
- abstract class A : R;
- abstract class B : R;
- class C : A;
- class D : B;
- class E : A;
- # Output
- For each abstract class `Foo`, the generated header file will contain
- `enum class FooKind`, which has an enumerator for each concrete class derived
- from `Foo`, with a name that matches the concrete class name.
- For each non-root class `Foo` whose root class is `Root`, the generated header
- file will also contain a function `bool InheritsFromFoo(RootKind kind)`, which
- returns true if the value of `kind` corresponds to a class that is derived from
- `Foo`. This function can be used to implement `Foo::classof`.
- All enumerators that represent the same concrete class will have the same
- numeric value, so you can use `static_cast` to convert between the enum types
- for different classes that have a common root, so long as the enumerator value
- is present in both types. As a result, `InheritsFromFoo` can be used to
- determine whether casting to `FooKind` is safe.
- """
- __copyright__ = """
- Part of the Carbon Language project, under the Apache License v2.0 with LLVM
- Exceptions. See /LICENSE for license information.
- SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- """
- import enum
- import re
- import sys
- class Class:
- """Metadata about a class from the input file.
- This consists of information
- Attributes set at construction:
- name: The class name.
- kind: The class kind (root, abstract, or concrete)
- ancestors: A list of Class objects representing the class's ancestors,
- starting with the root and ending with the current class's parent.
- _children: A list of Class objects representing the classes that are
- derived directly from this one.
- Attributes set by Finalize():
- id (CONCRETE only): The class's numeric ID, which will become its
- enumerator value in the generated C++ code.
- id_range (ROOT and ABSTRACT only): A pair such that a Class
- object `c` represents a concrete class derived from `self` if and only
- if c.id >= self.id_range[0] and c.id < self.id_range[1].
- leaves (ROOT only): A list of all concrete classes derived from this one,
- indexed by their IDs.
- """
- Kind = enum.Enum("Kind", "ROOT ABSTRACT CONCRETE")
- def __init__(self, name, kind, parent):
- self.name = name
- self.kind = kind
- assert (parent is None) == (kind == Class.Kind.ROOT)
- if parent is None:
- self.ancestors = []
- else:
- self.ancestors = parent.ancestors + [parent]
- if self.kind == Class.Kind.ROOT:
- self.leaves = []
- self.id_range = None
- elif self.kind == Class.Kind.ABSTRACT:
- self.id_range = None
- else:
- self.id = None
- if self.kind != Class.Kind.CONCRETE:
- self._children = []
- if parent:
- parent._children.append(self)
- def Parent(self):
- """Returns this Class's parent."""
- return self.ancestors[-1]
- def Root(self):
- """Returns the root Class of this hierarchy."""
- if self.kind == Class.Kind.ROOT:
- return self
- else:
- return self.ancestors[0]
- def _RegisterLeaf(self, leaf):
- """Records that `leaf` is derived from self.
- Also recursively updates the parent of self. leaf.id must already be
- populated, and leaves must be registered in order of ID. This operation
- is idempotent."""
- already_visited = False
- if self.kind == Class.Kind.ROOT:
- if leaf.id == len(self.leaves):
- self.leaves.append(leaf)
- else:
- assert leaf.id + 1 == len(self.leaves)
- assert self.leaves[leaf.id] == leaf
- already_visited = True
- if self.kind in [Class.Kind.ROOT, Class.Kind.ABSTRACT]:
- if self not in leaf.ancestors:
- sys.exit(
- f"{leaf.name} derived from {self.name}, but has a"
- + " different root"
- )
- if not self.id_range:
- self.id_range = (leaf.id, leaf.id + 1)
- elif self.id_range[1] == leaf.id:
- self.id_range = (self.id_range[0], self.id_range[1] + 1)
- else:
- assert self.id_range[1] == leaf.id + 1
- already_visited = True
- if not already_visited:
- if self.kind != Class.Kind.ROOT:
- self.Parent()._RegisterLeaf(leaf)
- def Finalize(self):
- """Populates additional attributes for `self` and derived Classes.
- Each Class can only be finalized once, after which no additional Classes
- can be derived from it.
- """
- if self.kind == Class.Kind.CONCRETE:
- self.id = len(self.Root().leaves)
- self._RegisterLeaf(self)
- else:
- for child in self._children:
- child.Finalize()
- _LINE_PATTERN = r"""(?P<prefix> \w*) \s*
- class \s+
- (?P<name> \w+)
- (?: \s*:\s* (?P<parent> \w+)
- )?
- ;$"""
- def main():
- input_filename = sys.argv[1]
- with open(input_filename) as file:
- lines = file.readlines()
- classes = dict()
- for line_num, line in enumerate(lines, 1):
- if line.startswith("#") or line.strip() == "":
- continue
- match_result = re.match(_LINE_PATTERN, line.strip(), re.VERBOSE)
- if not match_result:
- sys.exit(f"Invalid format on line {line_num}")
- prefix = match_result.group("prefix")
- if prefix == "":
- kind = Class.Kind.CONCRETE
- elif prefix == "root":
- kind = Class.Kind.ROOT
- elif prefix == "abstract":
- kind = Class.Kind.ABSTRACT
- else:
- sys.exit(f"Unrecognized class prefix '{prefix}' on line {line_num}")
- parent = None
- if match_result.group("parent"):
- if kind == Class.Kind.ROOT:
- sys.exit(f"Root class cannot have parent on line {line_num}")
- parent_name = match_result.group("parent")
- parent = classes[parent_name]
- if not parent:
- sys.exit(f"Unknown class '{parent_name}' on line {line_num}")
- if parent.kind == Class.Kind.CONCRETE:
- sys.exit(f"{parent.name} cannot be a parent on line {line_num}")
- else:
- if kind != Class.Kind.ROOT:
- sys.exit(
- f"Non-root class must have a parent on line {line_num}"
- )
- classes[match_result.group("name")] = Class(
- match_result.group("name"), kind, parent
- )
- for node in classes.values():
- if node.kind == Class.Kind.ROOT:
- node.Finalize()
- print(
- f"// Generated from {input_filename} by"
- + " executable_semantics/gen_rtti.py\n"
- )
- guard_macro = (
- input_filename.upper().translate(str.maketrans({"/": "_", ".": "_"}))
- + "_"
- )
- print(f"#ifndef {guard_macro}")
- print(f"#define {guard_macro}")
- print("\nnamespace Carbon {\n")
- for node in classes.values():
- if node.kind != Class.Kind.CONCRETE:
- ids = range(node.id_range[0], node.id_range[1])
- print(f"enum class {node.name}Kind {{")
- for id in ids:
- print(f" {node.Root().leaves[id].name} = {id},")
- print("};\n")
- if node.kind in [Class.Kind.ABSTRACT, Class.Kind.CONCRETE]:
- print(
- f"inline bool InheritsFrom{node.name}({node.Root().name}Kind"
- + " kind) {"
- )
- if node.kind == Class.Kind.ABSTRACT:
- if node.id_range[0] == node.id_range[1]:
- print(" return false;")
- else:
- range_begin = node.Root().leaves[node.id_range[0]].name
- print(
- f" return kind >= {node.Root().name}Kind"
- + f"::{range_begin}"
- )
- if node.id_range[1] < len(node.Root().leaves):
- range_end = node.Root().leaves[node.id_range[1]].name
- print(
- f" && kind < {node.Root().name}Kind"
- + f"::{range_end}"
- )
- print(" ;")
- elif node.kind == Class.Kind.CONCRETE:
- print(
- f" return kind == {node.Root().name}Kind::{node.name};"
- )
- print("}\n")
- print("} // namespace Carbon\n")
- print(f"#endif // {guard_macro}")
- if __name__ == "__main__":
- main()
|