// Part of the Carbon Language project, under the Apache License v2.0 with LLVM
// Exceptions. See /LICENSE for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
#ifndef CARBON_TESTING_FILE_TEST_AUTOUPDATE_H_
#define CARBON_TESTING_FILE_TEST_AUTOUPDATE_H_

#include <filesystem>
#include <functional>
#include <memory>
#include <optional>
#include <string>
#include <utility>

#include "common/check.h"
#include "llvm/ADT/DenseMap.h"
#include "llvm/ADT/STLExtras.h"
#include "llvm/ADT/SmallVector.h"
#include "llvm/ADT/StringRef.h"
#include "llvm/Support/raw_ostream.h"
#include "re2/re2.h"
#include "testing/file_test/line.h"

  14. namespace Carbon::Testing {
  15. class FileTestAutoupdater {
  16. public:
  17. struct LineNumberReplacement {
  18. bool has_file;
  19. // The line replacement. The pattern should match lines. If has_file,
  20. // pattern should have a file and line group; otherwise, only a line group,
  21. // but default_file_re should be provided.
  22. //
  23. // Uses shared_ptr for storage in SmallVector.
  24. std::shared_ptr<RE2> re;
  25. // line_formatv should provide {0} to substitute with [[@LINE...]] deltas.
  26. std::string line_formatv;
  27. };
  28. explicit FileTestAutoupdater(
  29. const std::filesystem::path& file_test_path, std::string test_command,
  30. std::string dump_command, llvm::StringRef input_content,
  31. const llvm::SmallVector<llvm::StringRef>& filenames,
  32. int autoupdate_line_number, bool autoupdate_split,
  33. const llvm::SmallVector<FileTestLine>& non_check_lines,
  34. llvm::StringRef actual_stdout, llvm::StringRef actual_stderr,
  35. const std::optional<RE2>& default_file_re,
  36. const llvm::SmallVector<LineNumberReplacement>& line_number_replacements,
  37. std::function<auto(std::string&)->void> do_extra_check_replacements)
  38. : file_test_path_(file_test_path),
  39. test_command_(std::move(test_command)),
  40. dump_command_(std::move(dump_command)),
  41. input_content_(input_content),
  42. autoupdate_line_number_(autoupdate_line_number),
  43. non_check_lines_(non_check_lines),
  44. default_file_re_(default_file_re),
  45. line_number_replacements_(line_number_replacements),
  46. do_extra_check_replacements_(std::move(do_extra_check_replacements)),
  47. autoupdate_split_file_(
  48. autoupdate_split ? std::optional(filenames.size()) : std::nullopt),
  49. file_to_number_map_(BuildFileToNumberMap(filenames)),
  50. // BuildCheckLines should only be called after other member
  51. // initialization.
  52. stdout_(BuildCheckLines(actual_stdout, "STDOUT")),
  53. stderr_(BuildCheckLines(actual_stderr, "STDERR")),
  54. any_attached_stdout_lines_(llvm::any_of(
  55. stdout_.lines,
  56. [&](const CheckLine& line) { return line.line_number() != -1; })),
  57. non_check_line_(non_check_lines_.begin()) {
  58. for (const auto& replacement : line_number_replacements_) {
  59. CARBON_CHECK(replacement.has_file || default_file_re_,
  60. "For replacement with pattern `{0}` to have has_file=false, "
  61. "override GetDefaultFileRE.",
  62. replacement.re->pattern());
  63. CARBON_CHECK(replacement.re->ok(), "Invalid line replacement RE2: {0}",
  64. replacement.re->error());
  65. }
  66. }
  67. // Automatically updates CHECKs in the provided file when dry_run=false.
  68. // Returns true if generated file content differs from actual file content.
  69. auto Run(bool dry_run) -> bool;
  70. private:
  71. // The file and line number that a CHECK line refers to, and the
  72. // replacement from which they were determined, if any.
  73. struct FileAndLineNumber {
  74. explicit FileAndLineNumber(int file_number) : file_number(file_number) {}
  75. explicit FileAndLineNumber(const LineNumberReplacement* replacement,
  76. int file_number, absl::string_view line_number);
  77. const LineNumberReplacement* replacement = nullptr;
  78. int file_number;
  79. int line_number = -1;
  80. };
  81. // A TIP line added by autoupdate. Not associated with any line in output.
  82. class TipLine : public FileTestLineBase {
  83. public:
  84. explicit TipLine(std::string line)
  85. : FileTestLineBase(-1, -1), line_(std::move(line)) {}
  86. auto Print(llvm::raw_ostream& out) const -> void override { out << line_; }
  87. auto is_blank() const -> bool override { return line_.empty(); }
  88. private:
  89. std::string line_;
  90. };
  91. // A CHECK line which is integrated into autoupdate output.
  92. //
  93. // `final` because we use pointer arithmetic on this type.
  94. class CheckLine final : public FileTestLineBase {
  95. public:
  96. // RE2 is passed by a pointer because it doesn't support std::optional.
  97. explicit CheckLine(FileAndLineNumber file_and_line_number, std::string line)
  98. : FileTestLineBase(file_and_line_number.file_number,
  99. file_and_line_number.line_number),
  100. replacement_(file_and_line_number.replacement),
  101. line_(std::move(line)) {}
  102. auto Print(llvm::raw_ostream& out) const -> void override {
  103. out << indent_ << line_;
  104. }
  105. // When the location of the CHECK in output is known, we can set the indent
  106. // and its line.
  107. auto SetOutputLine(llvm::StringRef indent, int output_file_number,
  108. int output_line_number) -> void {
  109. indent_ = indent;
  110. output_file_number_ = output_file_number;
  111. output_line_number_ = output_line_number;
  112. }
  113. // When the location of all lines in a file are known, we can set the line
  114. // offset based on the target line.
  115. auto RemapLineNumbers(
  116. const llvm::DenseMap<llvm::StringRef, int>& file_to_number_map,
  117. const llvm::DenseMap<std::pair<int, int>, int>& output_line_remap,
  118. const llvm::SmallVector<int>& new_last_line_numbers) -> void;
  119. auto is_blank() const -> bool override { return false; }
  120. private:
  121. const LineNumberReplacement* replacement_;
  122. std::string line_;
  123. llvm::StringRef indent_;
  124. int output_file_number_ = -1;
  125. int output_line_number_ = -1;
  126. };
  127. // Clusters information for stdout and stderr.
  128. struct CheckLines {
  129. explicit CheckLines(llvm::SmallVector<CheckLine> lines)
  130. : lines(std::move(lines)), cursor(this->lines.begin()) {}
  131. // The full list of check lines.
  132. llvm::SmallVector<CheckLine> lines;
  133. // An iterator into check_lines.
  134. CheckLine* cursor;
  135. };
  136. // Looks for the patterns in the line. Returns the first match, or defaulted
  137. // information if not found.
  138. auto GetFileAndLineNumber(
  139. const llvm::DenseMap<llvm::StringRef, int>& file_to_number_map,
  140. int default_file_number, const std::string& check_line)
  141. -> FileAndLineNumber;
  142. // Builds a mapping from file name to file number.
  143. auto BuildFileToNumberMap(const llvm::SmallVector<llvm::StringRef>& filenames)
  144. -> llvm::DenseMap<llvm::StringRef, int> {
  145. llvm::DenseMap<llvm::StringRef, int> file_to_number_map;
  146. for (auto [number, name] : llvm::enumerate(filenames)) {
  147. file_to_number_map.insert({name, number});
  148. }
  149. return file_to_number_map;
  150. }
  151. // Builds CheckLine lists for autoupdate.
  152. auto BuildCheckLines(llvm::StringRef output, const char* label) -> CheckLines;
  153. // Adds a non-check line to the new_lines and output_line_remap. The caller
  154. // still needs to advance the cursor when ready.
  155. auto AddRemappedNonCheckLine() -> void;
  156. // Adds TIP lines for file_test usage.
  157. auto AddTips() -> void;
  158. // Returns true if there's a CheckLine that should be added at
  159. // `to_line_number`.
  160. auto ShouldAddCheckLine(const CheckLines& check_lines, bool to_file_end) const
  161. -> bool;
  162. // Adds check_lines until output reaches:
  163. // - If not to_file_end, non_check_line.
  164. // - If to_file_end, the end of the file.
  165. auto AddCheckLines(CheckLines& check_lines, bool to_file_end) -> void;
  166. // Adds remaining check lines for the current file. stderr is always included,
  167. // but stdout is only included when either any_attached_stdout_lines_ or
  168. // is_last_file is true.
  169. auto FinishFile(bool is_last_file) -> void;
  170. // Starts a new split file, updating file and line numbers. Advances past the
  171. // split line.
  172. auto StartSplitFile() -> void;
  173. // Passed-in state.
  174. const std::filesystem::path& file_test_path_;
  175. std::string test_command_;
  176. std::string dump_command_;
  177. llvm::StringRef input_content_;
  178. int autoupdate_line_number_;
  179. const llvm::SmallVector<FileTestLine>& non_check_lines_;
  180. const std::optional<RE2>& default_file_re_;
  181. const llvm::SmallVector<LineNumberReplacement>& line_number_replacements_;
  182. std::function<auto(std::string&)->void> do_extra_check_replacements_;
  183. // If we have an autoupdate split that still needs to be processed, the file
  184. // number of the autoupdate split. Otherwise, this is nullopt.
  185. std::optional<int> autoupdate_split_file_;
  186. // Generated TIP lines, from AddTips.
  187. llvm::SmallVector<TipLine> tips_;
  188. // Mapping from file names to file numbers.
  189. llvm::DenseMap<llvm::StringRef, int> file_to_number_map_;
  190. // The constructed CheckLine list and cursor.
  191. CheckLines stdout_;
  192. CheckLines stderr_;
  193. // Whether any stdout lines have an associated line number.
  194. bool any_attached_stdout_lines_;
  195. // Iterators for the main Run loop.
  196. const FileTestLine* non_check_line_;
  197. // Tracks the new last line numbers for each file.
  198. llvm::SmallVector<int> new_last_line_numbers_;
  199. // A reusable blank line. new_lines_ can contain a reference back to it.
  200. const FileTestLine blank_line_ = FileTestLine(-1, -1, "");
  201. // Stitched-together content.
  202. llvm::SmallVector<const FileTestLineBase*> new_lines_;
  203. // Maps {file_number, original line number} to a new line number.
  204. llvm::DenseMap<std::pair<int, int>, int> output_line_remap_;
  205. // The current output file number; mainly used for tracking progression.
  206. int output_file_number_ = 0;
  207. // The current output line number in stitched content.
  208. int output_line_number_ = 0;
  209. };
  210. } // namespace Carbon::Testing

#endif  // CARBON_TESTING_FILE_TEST_AUTOUPDATE_H_