| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702
70370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019 |
- // Part of the Carbon Language project, under the Apache License v2.0 with LLVM
- // Exceptions. See /LICENSE for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- #include "toolchain/driver/compile_subcommand.h"
- #include <functional>
- #include <memory>
- #include <optional>
- #include <string>
- #include <system_error>
- #include <utility>
- #include "common/pretty_stack_trace_function.h"
- #include "common/vlog.h"
- #include "llvm/ADT/STLExtras.h"
- #include "llvm/ADT/ScopeExit.h"
- #include "toolchain/base/timings.h"
- #include "toolchain/check/check.h"
- #include "toolchain/codegen/codegen.h"
- #include "toolchain/diagnostics/diagnostic_emitter.h"
- #include "toolchain/diagnostics/sorting_diagnostic_consumer.h"
- #include "toolchain/lex/lex.h"
- #include "toolchain/lower/lower.h"
- #include "toolchain/parse/parse.h"
- #include "toolchain/parse/tree_and_subtrees.h"
- #include "toolchain/sem_ir/formatter.h"
- #include "toolchain/sem_ir/import_ir.h"
- #include "toolchain/sem_ir/inst_namer.h"
- #include "toolchain/source/source_buffer.h"
- namespace Carbon {
- auto CompileOptions::Build(CommandLine::CommandBuilder& b) -> void {
- b.AddStringPositionalArg(
- {
- .name = "FILE",
- .help = R"""(
- The input Carbon source file to compile.
- )""",
- },
- [&](auto& arg_b) {
- arg_b.Required(true);
- arg_b.Append(&input_filenames);
- });
- b.AddOneOfOption(
- {
- .name = "phase",
- .help = R"""(
- Selects the compilation phase to run. These phases are always run in sequence,
- so every phase before the one selected will also be run. The default is to
- compile to machine code.
- )""",
- },
- [&](auto& arg_b) {
- arg_b.SetOneOf(
- {
- arg_b.OneOfValue("lex", Phase::Lex),
- arg_b.OneOfValue("parse", Phase::Parse),
- arg_b.OneOfValue("check", Phase::Check),
- arg_b.OneOfValue("lower", Phase::Lower),
- arg_b.OneOfValue("codegen", Phase::CodeGen).Default(true),
- },
- &phase);
- });
- // TODO: Rearrange the code setting this option and two related ones to
- // allow them to reference each other instead of hard-coding their names.
- b.AddStringOption(
- {
- .name = "output",
- .value_name = "FILE",
- .help = R"""(
- The output filename for codegen.
- When this is a file name, either textual assembly or a binary object will be
- written to it based on the flag `--asm-output`. The default is to write a binary
- object file.
- Passing `--output=-` will write the output to stdout. In that case, the flag
- `--asm-output` is ignored and the output defaults to textual assembly. Binary
- object output can be forced by enabling `--force-obj-output`.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&output_filename); });
- // Include the common code generation options at this point to render it
- // after the more common options above, but before the more unusual options
- // below.
- codegen_options.Build(b);
- b.AddFlag(
- {
- .name = "asm-output",
- .help = R"""(
- Write textual assembly rather than a binary object file to the code generation
- output.
- This flag only applies when writing to a file. When writing to stdout, the
- default is textual assembly and this flag is ignored.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&asm_output); });
- b.AddFlag(
- {
- .name = "force-obj-output",
- .help = R"""(
- Force binary object output, even with `--output=-`.
- When `--output=-` is set, the default is textual assembly; this forces printing
- of a binary object file instead. Ignored for other `--output` values.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&force_obj_output); });
- b.AddFlag(
- {
- .name = "stream-errors",
- .help = R"""(
- Stream error messages to stderr as they are generated rather than sorting them
- and displaying them in source order.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&stream_errors); });
- b.AddFlag(
- {
- .name = "dump-shared-values",
- .help = R"""(
- Dumps shared values. These aren't owned by any particular file or phase.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&dump_shared_values); });
- b.AddFlag(
- {
- .name = "dump-tokens",
- .help = R"""(
- Dump the tokens to stdout when lexed.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&dump_tokens); });
- b.AddFlag(
- {
- .name = "omit-file-boundary-tokens",
- .help = R"""(
- For `--dump-tokens`, omit file start and end boundary tokens.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&omit_file_boundary_tokens); });
- b.AddFlag(
- {
- .name = "dump-parse-tree",
- .help = R"""(
- Dump the parse tree to stdout when parsed.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&dump_parse_tree); });
- b.AddFlag(
- {
- .name = "preorder-parse-tree",
- .help = R"""(
- When dumping the parse tree, reorder it so that it is in preorder rather than
- postorder.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&preorder_parse_tree); });
- b.AddFlag(
- {
- .name = "dump-raw-sem-ir",
- .help = R"""(
- Dump the raw JSON structure of SemIR to stdout when built.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&dump_raw_sem_ir); });
- b.AddFlag(
- {
- .name = "dump-sem-ir",
- .help = R"""(
- Dump the full SemIR to stdout when built.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&dump_sem_ir); });
- b.AddOneOfOption(
- {
- .name = "dump-sem-ir-ranges",
- .help = R"""(
- Selects handling of `//@dump-sem-ir-[begin|end]` markers when dumping SemIR.
- By default, `if-present` prints ranges for files that have them, and full SemIR
- for files that don't. `only` skips files with no ranges, and `ignore` always
- prints full SemIR.
- )""",
- },
- [&](auto& arg_b) {
- arg_b.SetOneOf(
- {
- arg_b.OneOfValue("if-present", DumpSemIRRanges::IfPresent)
- .Default(true),
- arg_b.OneOfValue("only", DumpSemIRRanges::Only),
- arg_b.OneOfValue("ignore", DumpSemIRRanges::Ignore),
- },
- &dump_sem_ir_ranges);
- });
- b.AddFlag(
- {
- .name = "builtin-sem-ir",
- .help = R"""(
- Include the SemIR for builtins when dumping it.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&builtin_sem_ir); });
- b.AddFlag(
- {
- .name = "dump-llvm-ir",
- .help = R"""(
- Dump the LLVM IR to stdout after lowering.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&dump_llvm_ir); });
- b.AddFlag(
- {
- .name = "dump-asm",
- .help = R"""(
- Dump the generated assembly to stdout after codegen.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&dump_asm); });
- b.AddFlag(
- {
- .name = "dump-mem-usage",
- .help = R"""(
- Dumps the amount of memory used.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&dump_mem_usage); });
- b.AddFlag(
- {
- .name = "dump-timings",
- .help = R"""(
- Dumps the duration of each phase for each compilation unit.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&dump_timings); });
- b.AddFlag(
- {
- .name = "prelude-import",
- .help = R"""(
- Whether to use the implicit prelude import. Enabled by default.
- )""",
- },
- [&](auto& arg_b) {
- arg_b.Default(true);
- arg_b.Set(&prelude_import);
- });
- b.AddFlag(
- {
- .name = "custom-core",
- .value_name = "CUSTOM_CORE",
- .help = R"""(
- Whether to use a custom Core package, the files for which must all be included
- in the compile command line.
- The prelude library in the Core package is imported automatically. By default,
- the Core package shipped with the toolchain is used, and its files do not need
- to be specified in the compile command line.
- )""",
- },
- [&](auto& arg_b) {
- arg_b.Default(false);
- arg_b.Set(&custom_core);
- });
- b.AddStringOption(
- {
- .name = "exclude-dump-file-prefix",
- .value_name = "PREFIX",
- .help = R"""(
- Excludes files with the given prefix from dumps.
- )""",
- },
- [&](auto& arg_b) { arg_b.Append(&exclude_dump_file_prefixes); });
- b.AddFlag(
- {
- .name = "debug-info",
- .help = R"""(
- Whether to emit DWARF debug information.
- )""",
- },
- [&](auto& arg_b) {
- arg_b.Default(true);
- arg_b.Set(&include_debug_info);
- });
- b.AddFlag(
- {
- .name = "verify-llvm-ir",
- .help = R"""(
- Whether to run the LLVM verifier on modules.
- )""",
- },
- [&](auto& arg_b) {
- arg_b.Default(true);
- arg_b.Set(&run_llvm_verifier);
- });
- }
// Name and help text for the `compile` subcommand. This is handed to the
// `DriverSubcommand` base class by the `CompileSubcommand` constructor.
static constexpr CommandLine::CommandInfo SubcommandInfo = {
    .name = "compile",
    .help = R"""(
Compile Carbon source code.
This subcommand runs the Carbon compiler over input source code, checking it for
errors and producing the requested output.
Error messages are written to the standard error stream.
Different phases of the compiler can be selected to run, and intermediate state
can be written to standard output as these phases progress.
)""",
};
// Constructs the subcommand, passing the `compile` command info to the base.
CompileSubcommand::CompileSubcommand() : DriverSubcommand(SubcommandInfo) {}
- // Returns a string for printing the phase in a diagnostic.
- static auto PhaseToString(CompileOptions::Phase phase) -> std::string {
- switch (phase) {
- case CompileOptions::Phase::Lex:
- return "lex";
- case CompileOptions::Phase::Parse:
- return "parse";
- case CompileOptions::Phase::Check:
- return "check";
- case CompileOptions::Phase::Lower:
- return "lower";
- case CompileOptions::Phase::CodeGen:
- return "codegen";
- }
- }
- auto CompileSubcommand::ValidateOptions(
- Diagnostics::NoLocEmitter& emitter) const -> bool {
- CARBON_DIAGNOSTIC(
- CompilePhaseFlagConflict, Error,
- "requested dumping {0} but compile phase is limited to `{1}`",
- std::string, std::string);
- using Phase = CompileOptions::Phase;
- switch (options_.phase) {
- case Phase::Lex:
- if (options_.dump_parse_tree) {
- emitter.Emit(CompilePhaseFlagConflict, "parse tree",
- PhaseToString(options_.phase));
- return false;
- }
- [[fallthrough]];
- case Phase::Parse:
- if (options_.dump_sem_ir) {
- emitter.Emit(CompilePhaseFlagConflict, "SemIR",
- PhaseToString(options_.phase));
- return false;
- }
- [[fallthrough]];
- case Phase::Check:
- if (options_.dump_llvm_ir) {
- emitter.Emit(CompilePhaseFlagConflict, "LLVM IR",
- PhaseToString(options_.phase));
- return false;
- }
- [[fallthrough]];
- case Phase::Lower:
- case Phase::CodeGen:
- // Everything can be dumped in these phases.
- break;
- }
- return true;
- }
- namespace {
- class MultiUnitCache;
- // Ties together information for a file being compiled.
- class CompilationUnit {
- public:
- explicit CompilationUnit(int unit_index, DriverEnv* driver_env,
- const CompileOptions* options,
- Diagnostics::Consumer* consumer,
- llvm::StringRef input_filename);
- // Sets the multi-unit cache and initializes dependent member state.
- auto SetMultiUnitCache(MultiUnitCache* cache) -> void;
- // Loads source and lexes it. Returns true on success.
- auto RunLex() -> void;
- // Parses tokens. Returns true on success.
- auto RunParse() -> void;
- // Returns information needed to check this unit.
- auto GetCheckUnit() -> Check::Unit;
- // Runs post-check logic. Returns true if checking succeeded for the IR.
- auto PostCheck() -> void;
- // Lower SemIR to LLVM IR.
- auto RunLower() -> void;
- auto RunCodeGen() -> void;
- // Runs post-compile logic. This is always called, and called after all other
- // actions on the CompilationUnit.
- auto PostCompile() -> void;
- // Flushes diagnostics, specifically as part of generating stack trace
- // information.
- auto FlushForStackTrace() -> void { consumer_->Flush(); }
- auto input_filename() -> llvm::StringRef { return input_filename_; }
- auto success() -> bool { return success_; }
- auto has_source() -> bool { return source_.has_value(); }
- auto get_trees_and_subtrees() -> Parse::GetTreeAndSubtreesFn {
- return *tree_and_subtrees_getter_;
- }
- private:
- // Do codegen. Returns true on success.
- auto RunCodeGenHelper() -> bool;
- // The TreeAndSubtrees is mainly used for debugging and diagnostics, and has
- // significant overhead. Avoid constructing it when unused.
- auto GetParseTreeAndSubtrees() -> const Parse::TreeAndSubtrees&;
- // Handles printing of formatted SemIR.
- auto MaybePrintFormattedSemIR() -> void;
- // Wraps a call with log statements to indicate start and end. Typically logs
- // with the actual function name, but marks timings with the appropriate
- // phase.
- auto LogCall(llvm::StringLiteral logging_label,
- llvm::StringLiteral timing_label,
- llvm::function_ref<auto()->void> fn) -> void;
- // Returns true if the current file should be included in debug dumps.
- auto IncludeInDumps() -> bool;
- // The index of the unit amongst all units. Equivalent to a `CheckIRId`.
- int unit_index_;
- DriverEnv* driver_env_;
- const CompileOptions* options_;
- SharedValueStores value_stores_;
- // The input filename from the command line. For most diagnostics, we
- // typically use `source_->filename()`, which includes a `-` -> `<stdin>`
- // translation. However, logging and some diagnostics use the command line
- // argument.
- std::string input_filename_;
- // Copied from driver_ for CARBON_VLOG.
- llvm::raw_pwrite_stream* vlog_stream_;
- // Diagnostics are sent to consumer_, with optional sorting.
- std::optional<Diagnostics::SortingConsumer> sorting_consumer_;
- Diagnostics::Consumer* consumer_;
- bool success_ = true;
- // Initialized by `SetMultiUnitCache`.
- MultiUnitCache* cache_ = nullptr;
- // Tracks memory usage of the compile.
- std::optional<MemUsage> mem_usage_;
- // Tracks timings of the compile.
- std::optional<Timings> timings_;
- // These are initialized as steps are run.
- std::optional<SourceBuffer> source_;
- std::optional<Lex::TokenizedBuffer> tokens_;
- std::optional<Parse::Tree> parse_tree_;
- std::optional<Parse::TreeAndSubtrees> parse_tree_and_subtrees_;
- std::optional<std::function<auto()->const Parse::TreeAndSubtrees&>>
- tree_and_subtrees_getter_;
- std::optional<SemIR::File> sem_ir_;
- std::unique_ptr<clang::ASTUnit> cpp_ast_;
- std::unique_ptr<llvm::LLVMContext> llvm_context_;
- std::unique_ptr<llvm::Module> module_;
- };
- // Caches lists that are shared cross-unit. Accessors do lazy caching because
- // they may not be used.
- class MultiUnitCache {
- public:
- // This relies on construction after `units` are all initialized, which is
- // reflected by the `ArrayRef` here.
- explicit MultiUnitCache(
- const CompileOptions* options,
- const llvm::ArrayRef<std::unique_ptr<CompilationUnit>> units)
- : options_(options), units_(units) {}
- auto include_in_dumps() -> llvm::ArrayRef<bool> {
- CARBON_CHECK(!units_.empty());
- if (include_in_dumps_.empty()) {
- BuildIncludeInDumps();
- }
- return include_in_dumps_;
- }
- auto tree_and_subtrees_getters()
- -> llvm::ArrayRef<Parse::GetTreeAndSubtreesFn> {
- CARBON_CHECK(!units_.empty());
- if (tree_and_subtrees_getters_.empty()) {
- BuildTreeAndSubtreesGetters();
- }
- return tree_and_subtrees_getters_;
- }
- private:
- auto BuildIncludeInDumps() -> void {
- CARBON_CHECK(include_in_dumps_.empty());
- llvm::append_range(
- include_in_dumps_, llvm::map_range(units_, [&](const auto& unit) {
- return llvm::none_of(
- options_->exclude_dump_file_prefixes, [&](auto prefix) {
- return unit->input_filename().starts_with(prefix);
- });
- }));
- }
- auto BuildTreeAndSubtreesGetters() -> void {
- CARBON_CHECK(tree_and_subtrees_getters_.empty());
- llvm::append_range(
- tree_and_subtrees_getters_,
- llvm::map_range(units_, [&](const auto& unit) {
- return unit->has_source() ? unit->get_trees_and_subtrees() : nullptr;
- }));
- }
- const CompileOptions* options_;
- // The units being compiled.
- const llvm::ArrayRef<std::unique_ptr<CompilationUnit>> units_;
- // For each unit, whether it's included in dumps. Used cross-phase.
- llvm::SmallVector<bool> include_in_dumps_;
- // For each unit, the `TreeAndSubtrees` getter. Used by lowering.
- llvm::SmallVector<Parse::GetTreeAndSubtreesFn> tree_and_subtrees_getters_;
- };
- } // namespace
- CompilationUnit::CompilationUnit(int unit_index, DriverEnv* driver_env,
- const CompileOptions* options,
- Diagnostics::Consumer* consumer,
- llvm::StringRef input_filename)
- : unit_index_(unit_index),
- driver_env_(driver_env),
- options_(options),
- input_filename_(input_filename),
- vlog_stream_(driver_env_->vlog_stream) {
- if (vlog_stream_ != nullptr || options_->stream_errors) {
- consumer_ = consumer;
- } else {
- sorting_consumer_ = Diagnostics::SortingConsumer(*consumer);
- consumer_ = &*sorting_consumer_;
- }
- }
- auto CompilationUnit::IncludeInDumps() -> bool {
- return cache_->include_in_dumps()[unit_index_];
- }
- auto CompilationUnit::SetMultiUnitCache(MultiUnitCache* cache) -> void {
- CARBON_CHECK(!cache_, "Called SetMultiUnitCache twice");
- cache_ = cache;
- if (options_->dump_mem_usage && IncludeInDumps()) {
- CARBON_CHECK(!mem_usage_);
- mem_usage_ = MemUsage();
- }
- if (options_->dump_timings && IncludeInDumps()) {
- CARBON_CHECK(!timings_);
- timings_ = Timings();
- }
- }
- auto CompilationUnit::RunLex() -> void {
- CARBON_CHECK(cache_, "Must call SetMultiUnitCache first");
- CARBON_CHECK(!tokens_, "Called RunLex twice");
- LogCall("SourceBuffer::MakeFromFileOrStdin", "source", [&] {
- source_ = SourceBuffer::MakeFromFileOrStdin(*driver_env_->fs,
- input_filename_, *consumer_);
- });
- if (!source_) {
- success_ = false;
- return;
- }
- if (mem_usage_) {
- mem_usage_->Add("source_", source_->text().size(), source_->text().size());
- }
- CARBON_VLOG("*** SourceBuffer ***\n```\n{0}\n```\n", source_->text());
- LogCall("Lex::Lex", "lex",
- [&] { tokens_ = Lex::Lex(value_stores_, *source_, *consumer_); });
- if (options_->dump_tokens && IncludeInDumps()) {
- consumer_->Flush();
- tokens_->Print(*driver_env_->output_stream,
- options_->omit_file_boundary_tokens);
- }
- if (mem_usage_) {
- mem_usage_->Collect("tokens_", *tokens_);
- }
- CARBON_VLOG("*** Lex::TokenizedBuffer ***\n{0}", tokens_);
- if (tokens_->has_errors()) {
- success_ = false;
- }
- }
- auto CompilationUnit::RunParse() -> void {
- LogCall("Parse::Parse", "parse", [&] {
- parse_tree_ = Parse::Parse(*tokens_, *consumer_, vlog_stream_);
- });
- if (options_->dump_parse_tree && IncludeInDumps()) {
- consumer_->Flush();
- const auto& tree_and_subtrees = GetParseTreeAndSubtrees();
- if (options_->preorder_parse_tree) {
- tree_and_subtrees.PrintPreorder(*driver_env_->output_stream);
- } else {
- tree_and_subtrees.Print(*driver_env_->output_stream);
- }
- }
- if (mem_usage_) {
- mem_usage_->Collect("parse_tree_", *parse_tree_);
- }
- CARBON_VLOG("*** Parse::Tree ***\n{0}", parse_tree_);
- if (parse_tree_->has_errors()) {
- success_ = false;
- }
- }
- auto CompilationUnit::GetCheckUnit() -> Check::Unit {
- CARBON_CHECK(parse_tree_, "Must call RunParse first");
- CARBON_CHECK(!sem_ir_, "Called GetCheckUnit twice");
- tree_and_subtrees_getter_ = [this]() -> const Parse::TreeAndSubtrees& {
- return this->GetParseTreeAndSubtrees();
- };
- sem_ir_.emplace(&*parse_tree_, SemIR::CheckIRId(unit_index_),
- parse_tree_->packaging_decl(), value_stores_,
- input_filename_);
- return {.consumer = consumer_,
- .value_stores = &value_stores_,
- .timings = timings_ ? &*timings_ : nullptr,
- .sem_ir = &*sem_ir_,
- .cpp_ast = &cpp_ast_};
- }
- auto CompilationUnit::MaybePrintFormattedSemIR() -> void {
- bool print = options_->dump_sem_ir && IncludeInDumps();
- if (!vlog_stream_ && !print) {
- return;
- }
- if (options_->dump_sem_ir_ranges == CompileOptions::DumpSemIRRanges::Only &&
- !tokens_->has_dump_sem_ir_ranges()) {
- return;
- }
- bool use_dump_sem_ir_ranges =
- options_->dump_sem_ir_ranges != CompileOptions::DumpSemIRRanges::Ignore &&
- tokens_->has_dump_sem_ir_ranges();
- SemIR::Formatter formatter(&*sem_ir_, *tree_and_subtrees_getter_,
- cache_->include_in_dumps(),
- use_dump_sem_ir_ranges);
- formatter.Format();
- if (vlog_stream_) {
- CARBON_VLOG("*** SemIR::File ***\n");
- formatter.Write(*vlog_stream_);
- }
- if (print) {
- formatter.Write(*driver_env_->output_stream);
- }
- }
- auto CompilationUnit::PostCheck() -> void {
- CARBON_CHECK(sem_ir_, "Must call GetCheckUnit first");
- // We've finished all steps that can produce diagnostics. Emit the
- // diagnostics now, so that the developer sees them sooner and doesn't need
- // to wait for code generation.
- consumer_->Flush();
- if (mem_usage_) {
- mem_usage_->Collect("sem_ir_", *sem_ir_);
- }
- if (options_->dump_raw_sem_ir && IncludeInDumps()) {
- CARBON_VLOG("*** Raw SemIR::File ***\n{0}\n", *sem_ir_);
- sem_ir_->Print(*driver_env_->output_stream, options_->builtin_sem_ir);
- if (options_->dump_sem_ir) {
- *driver_env_->output_stream << "\n";
- }
- }
- MaybePrintFormattedSemIR();
- if (sem_ir_->has_errors()) {
- success_ = false;
- }
- }
- auto CompilationUnit::RunLower() -> void {
- LogCall("Lower::LowerToLLVM", "lower", [&] {
- llvm_context_ = std::make_unique<llvm::LLVMContext>();
- // TODO: Consider disabling instruction naming by default if we're not
- // producing textual LLVM IR.
- SemIR::InstNamer inst_namer(&*sem_ir_);
- llvm::ArrayRef<Parse::GetTreeAndSubtreesFn> subtrees =
- cache_->tree_and_subtrees_getters();
- module_ = Lower::LowerToLLVM(
- *llvm_context_, driver_env_->fs,
- options_->run_llvm_verifier ? driver_env_->error_stream : nullptr,
- options_->include_debug_info, subtrees, input_filename_, *sem_ir_,
- &inst_namer, vlog_stream_);
- });
- if (vlog_stream_) {
- CARBON_VLOG("*** llvm::Module ***\n");
- module_->print(*vlog_stream_, /*AAW=*/nullptr,
- /*ShouldPreserveUseListOrder=*/false,
- /*IsForDebug=*/true);
- }
- if (options_->dump_llvm_ir && IncludeInDumps()) {
- module_->print(*driver_env_->output_stream, /*AAW=*/nullptr,
- /*ShouldPreserveUseListOrder=*/true);
- }
- }
- auto CompilationUnit::RunCodeGen() -> void {
- CARBON_CHECK(module_, "Must call RunLower first");
- LogCall("CodeGen", "codegen", [&] { success_ = RunCodeGenHelper(); });
- }
- auto CompilationUnit::PostCompile() -> void {
- if (options_->dump_shared_values && IncludeInDumps()) {
- Yaml::Print(*driver_env_->output_stream,
- value_stores_.OutputYaml(input_filename_));
- }
- if (mem_usage_) {
- mem_usage_->Collect("value_stores_", value_stores_);
- Yaml::Print(*driver_env_->output_stream,
- mem_usage_->OutputYaml(input_filename_));
- }
- if (timings_) {
- Yaml::Print(*driver_env_->output_stream,
- timings_->OutputYaml(input_filename_));
- }
- // The diagnostics consumer must be flushed before compilation artifacts are
- // destructed, because diagnostics can refer to their state.
- consumer_->Flush();
- }
- auto CompilationUnit::RunCodeGenHelper() -> bool {
- std::optional<CodeGen> codegen =
- CodeGen::Make(module_.get(), options_->codegen_options.target,
- driver_env_->error_stream);
- if (!codegen) {
- return false;
- }
- if (vlog_stream_) {
- CARBON_VLOG("*** Assembly ***\n");
- codegen->EmitAssembly(*vlog_stream_);
- }
- if (options_->output_filename == "-") {
- // TODO: The output file name, forcing object output, and requesting
- // textual assembly output are all somewhat linked flags. We should add
- // some validation that they are used correctly.
- if (options_->force_obj_output) {
- if (!codegen->EmitObject(*driver_env_->output_stream)) {
- return false;
- }
- } else {
- if (!codegen->EmitAssembly(*driver_env_->output_stream)) {
- return false;
- }
- }
- } else {
- llvm::SmallString<256> output_filename = options_->output_filename;
- if (output_filename.empty()) {
- if (!source_->is_regular_file()) {
- // Don't invent file names like `-.o` or `/dev/stdin.o`.
- // TODO: Consider rephrasing the diagnostic to use the file as the
- // `Emit` location.
- CARBON_DIAGNOSTIC(CompileInputNotRegularFile, Error,
- "output file name must be specified for input `{0}` "
- "that is not a regular file",
- std::string);
- driver_env_->emitter.Emit(CompileInputNotRegularFile, input_filename_);
- return false;
- }
- output_filename = input_filename_;
- llvm::sys::path::replace_extension(output_filename,
- options_->asm_output ? ".s" : ".o");
- } else {
- // TODO: Handle the case where multiple input files were specified
- // along with an output file name. That should either be an error or
- // should produce a single LLVM IR module containing all inputs.
- // Currently each unit overwrites the output from the previous one in
- // this case.
- }
- CARBON_VLOG("Writing output to: {0}\n", output_filename);
- std::error_code ec;
- llvm::raw_fd_ostream output_file(output_filename, ec,
- llvm::sys::fs::OF_None);
- if (ec) {
- // TODO: Consider rephrasing the diagnostic to use the file as the `Emit`
- // location.
- CARBON_DIAGNOSTIC(CompileOutputFileOpenError, Error,
- "could not open output file `{0}`: {1}", std::string,
- std::string);
- driver_env_->emitter.Emit(CompileOutputFileOpenError,
- output_filename.str().str(), ec.message());
- return false;
- }
- if (options_->asm_output) {
- if (!codegen->EmitAssembly(output_file)) {
- return false;
- }
- } else {
- if (!codegen->EmitObject(output_file)) {
- return false;
- }
- }
- }
- return true;
- }
- auto CompilationUnit::GetParseTreeAndSubtrees()
- -> const Parse::TreeAndSubtrees& {
- if (!parse_tree_and_subtrees_) {
- parse_tree_and_subtrees_ = Parse::TreeAndSubtrees(*tokens_, *parse_tree_);
- if (mem_usage_) {
- mem_usage_->Collect("parse_tree_and_subtrees_",
- *parse_tree_and_subtrees_);
- }
- }
- return *parse_tree_and_subtrees_;
- }
- auto CompilationUnit::LogCall(llvm::StringLiteral logging_label,
- llvm::StringLiteral timing_label,
- llvm::function_ref<auto()->void> fn) -> void {
- PrettyStackTraceFunction trace_file([&](llvm::raw_ostream& out) {
- out << "Filename: " << input_filename_ << "\n";
- });
- CARBON_VLOG("*** {0}: {1} ***\n", logging_label, input_filename_);
- Timings::ScopedTiming timing(timings_ ? &*timings_ : nullptr, timing_label);
- fn();
- CARBON_VLOG("*** {0} done ***\n", logging_label);
- }
- auto CompileSubcommand::Run(DriverEnv& driver_env) -> DriverResult {
- if (!ValidateOptions(driver_env.emitter)) {
- return {.success = false};
- }
- // Find the files comprising the prelude if we are importing it.
- // TODO: Replace this with a search for library api files in a
- // package-specific search path based on the library name.
- llvm::SmallVector<std::string> prelude;
- if (options_.prelude_import && !options_.custom_core &&
- options_.phase >= CompileOptions::Phase::Check) {
- if (auto find = driver_env.installation->ReadPreludeManifest(); find.ok()) {
- prelude = std::move(*find);
- } else {
- // TODO: Change ReadPreludeManifest to produce diagnostics.
- CARBON_DIAGNOSTIC(CompilePreludeManifestError, Error, "{0}", std::string);
- driver_env.emitter.Emit(CompilePreludeManifestError,
- PrintToString(find.error()));
- return {.success = false};
- }
- }
- // Prepare CompilationUnits before building scope exit handlers.
- llvm::SmallVector<std::unique_ptr<CompilationUnit>> units;
- int unit_index = -1;
- auto unit_builder = [&](llvm::StringRef filename) {
- return std::make_unique<CompilationUnit>(
- ++unit_index, &driver_env, &options_, &driver_env.consumer, filename);
- };
- llvm::append_range(units, llvm::map_range(prelude, unit_builder));
- llvm::append_range(units,
- llvm::map_range(options_.input_filenames, unit_builder));
- // Add the cache to all units. This must be done after all units are created.
- MultiUnitCache cache(&options_, units);
- for (auto& unit : units) {
- unit->SetMultiUnitCache(&cache);
- }
- auto on_exit = llvm::make_scope_exit([&]() {
- // Finish compilation units. This flushes their diagnostics in the order in
- // which they were specified on the command line.
- for (auto& unit : units) {
- unit->PostCompile();
- }
- driver_env.consumer.Flush();
- });
- PrettyStackTraceFunction flush_on_crash([&](llvm::raw_ostream& out) {
- // When crashing, flush diagnostics. If sorting diagnostics, they can be
- // redirected to the crash stream; if streaming, the original stream is
- // flushed.
- // TODO: Eventually we'll want to limit the count.
- if (options_.stream_errors) {
- out << "Flushing diagnostics\n";
- } else {
- out << "Pending diagnostics:\n";
- driver_env.consumer.set_stream(&out);
- }
- for (auto& unit : units) {
- unit->FlushForStackTrace();
- }
- driver_env.consumer.Flush();
- driver_env.consumer.set_stream(driver_env.error_stream);
- });
- // Returns a DriverResult object. Called whenever Compile returns.
- auto make_result = [&]() {
- DriverResult result = {.success = true};
- for (const auto& unit : units) {
- result.success &= unit->success();
- result.per_file_success.push_back(
- {unit->input_filename().str(), unit->success()});
- }
- return result;
- };
- // Lex.
- for (auto& unit : units) {
- unit->RunLex();
- }
- if (options_.phase == CompileOptions::Phase::Lex) {
- return make_result();
- }
- // Parse and check phases examine `has_source` because they want to proceed if
- // lex failed, but not if source doesn't exist. Later steps are skipped if
- // anything failed, so don't need this.
- // Parse.
- for (auto& unit : units) {
- if (unit->has_source()) {
- unit->RunParse();
- }
- }
- if (options_.phase == CompileOptions::Phase::Parse) {
- return make_result();
- }
- // Gather Check::Units.
- llvm::SmallVector<Check::Unit> check_units;
- check_units.reserve(units.size());
- for (auto& unit : units) {
- if (unit->has_source()) {
- check_units.push_back(unit->GetCheckUnit());
- }
- }
- // Execute the actual checking.
- CARBON_VLOG_TO(driver_env.vlog_stream, "*** Check::CheckParseTrees ***\n");
- Check::CheckParseTrees(check_units, cache.tree_and_subtrees_getters(),
- options_.prelude_import, driver_env.fs,
- options_.codegen_options.target,
- driver_env.vlog_stream, driver_env.fuzzing);
- CARBON_VLOG_TO(driver_env.vlog_stream,
- "*** Check::CheckParseTrees done ***\n");
- for (auto& unit : units) {
- if (unit->has_source()) {
- unit->PostCheck();
- }
- }
- if (options_.phase == CompileOptions::Phase::Check) {
- return make_result();
- }
- // Unlike previous steps, errors block further progress.
- if (llvm::any_of(units, [&](const auto& unit) { return !unit->success(); })) {
- CARBON_VLOG_TO(driver_env.vlog_stream,
- "*** Stopping before lowering due to errors ***\n");
- return make_result();
- }
- // Lower.
- for (const auto& unit : units) {
- unit->RunLower();
- }
- if (options_.phase == CompileOptions::Phase::Lower) {
- return make_result();
- }
- CARBON_CHECK(options_.phase == CompileOptions::Phase::CodeGen,
- "CodeGen should be the last stage");
- // Codegen.
- for (auto& unit : units) {
- unit->RunCodeGen();
- }
- return make_result();
- }
- } // namespace Carbon
|