| 1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018 |
- // Part of the Carbon Language project, under the Apache License v2.0 with LLVM
- // Exceptions. See /LICENSE for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- #include "toolchain/driver/driver.h"
- #include <algorithm>
- #include <memory>
- #include <optional>
- #include "common/command_line.h"
- #include "common/version.h"
- #include "common/vlog.h"
- #include "llvm/ADT/ArrayRef.h"
- #include "llvm/ADT/ScopeExit.h"
- #include "llvm/ADT/StringExtras.h"
- #include "llvm/ADT/StringRef.h"
- #include "llvm/IR/LLVMContext.h"
- #include "llvm/Support/Path.h"
- #include "llvm/TargetParser/Host.h"
- #include "llvm/TargetParser/Triple.h"
- #include "toolchain/base/value_store.h"
- #include "toolchain/check/check.h"
- #include "toolchain/codegen/codegen.h"
- #include "toolchain/diagnostics/sorting_diagnostic_consumer.h"
- #include "toolchain/driver/clang_runner.h"
- #include "toolchain/lex/lex.h"
- #include "toolchain/lower/lower.h"
- #include "toolchain/parse/parse.h"
- #include "toolchain/parse/tree_and_subtrees.h"
- #include "toolchain/sem_ir/formatter.h"
- #include "toolchain/sem_ir/inst_namer.h"
- #include "toolchain/source/source_buffer.h"
- namespace Carbon {
- struct Driver::CodegenOptions {
- void Build(CommandLine::CommandBuilder& b) {
- b.AddStringOption(
- {
- .name = "target",
- .help = R"""(
- Select a target platform. Uses the LLVM target syntax. Also known as a "triple"
- for historical reasons.
- This corresponds to the `target` flag to Clang and accepts the same strings
- documented there:
- https://clang.llvm.org/docs/CrossCompilation.html#target-triple
- )""",
- },
- [&](auto& arg_b) {
- arg_b.Default(host);
- arg_b.Set(&target);
- });
- }
- std::string host = llvm::sys::getDefaultTargetTriple();
- llvm::StringRef target;
- };
- struct Driver::CompileOptions {
- static constexpr CommandLine::CommandInfo Info = {
- .name = "compile",
- .help = R"""(
- Compile Carbon source code.
- This subcommand runs the Carbon compiler over input source code, checking it for
- errors and producing the requested output.
- Error messages are written to the standard error stream.
- Different phases of the compiler can be selected to run, and intermediate state
- can be written to standard output as these phases progress.
- )""",
- };
- enum class Phase : int8_t {
- Lex,
- Parse,
- Check,
- Lower,
- CodeGen,
- };
- friend auto operator<<(llvm::raw_ostream& out, Phase phase)
- -> llvm::raw_ostream& {
- switch (phase) {
- case Phase::Lex:
- out << "lex";
- break;
- case Phase::Parse:
- out << "parse";
- break;
- case Phase::Check:
- out << "check";
- break;
- case Phase::Lower:
- out << "lower";
- break;
- case Phase::CodeGen:
- out << "codegen";
- break;
- }
- return out;
- }
- void Build(CommandLine::CommandBuilder& b, CodegenOptions& codegen_options) {
- b.AddStringPositionalArg(
- {
- .name = "FILE",
- .help = R"""(
- The input Carbon source file to compile.
- )""",
- },
- [&](auto& arg_b) {
- arg_b.Required(true);
- arg_b.Append(&input_filenames);
- });
- b.AddOneOfOption(
- {
- .name = "phase",
- .help = R"""(
- Selects the compilation phase to run. These phases are always run in sequence,
- so every phase before the one selected will also be run. The default is to
- compile to machine code.
- )""",
- },
- [&](auto& arg_b) {
- arg_b.SetOneOf(
- {
- arg_b.OneOfValue("lex", Phase::Lex),
- arg_b.OneOfValue("parse", Phase::Parse),
- arg_b.OneOfValue("check", Phase::Check),
- arg_b.OneOfValue("lower", Phase::Lower),
- arg_b.OneOfValue("codegen", Phase::CodeGen).Default(true),
- },
- &phase);
- });
- // TODO: Rearrange the code setting this option and two related ones to
- // allow them to reference each other instead of hard-coding their names.
- b.AddStringOption(
- {
- .name = "output",
- .value_name = "FILE",
- .help = R"""(
- The output filename for codegen.
- When this is a file name, either textual assembly or a binary object will be
- written to it based on the flag `--asm-output`. The default is to write a binary
- object file.
- Passing `--output=-` will write the output to stdout. In that case, the flag
- `--asm-output` is ignored and the output defaults to textual assembly. Binary
- object output can be forced by enabling `--force-obj-output`.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&output_filename); });
- // Include the common code generation options at this point to render it
- // after the more common options above, but before the more unusual options
- // below.
- codegen_options.Build(b);
- b.AddFlag(
- {
- .name = "asm-output",
- .help = R"""(
- Write textual assembly rather than a binary object file to the code generation
- output.
- This flag only applies when writing to a file. When writing to stdout, the
- default is textual assembly and this flag is ignored.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&asm_output); });
- b.AddFlag(
- {
- .name = "force-obj-output",
- .help = R"""(
- Force binary object output, even with `--output=-`.
- When `--output=-` is set, the default is textual assembly; this forces printing
- of a binary object file instead. Ignored for other `--output` values.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&force_obj_output); });
- b.AddFlag(
- {
- .name = "stream-errors",
- .help = R"""(
- Stream error messages to stderr as they are generated rather than sorting them
- and displaying them in source order.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&stream_errors); });
- b.AddFlag(
- {
- .name = "dump-shared-values",
- .help = R"""(
- Dumps shared values. These aren't owned by any particular file or phase.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&dump_shared_values); });
- b.AddFlag(
- {
- .name = "dump-tokens",
- .help = R"""(
- Dump the tokens to stdout when lexed.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&dump_tokens); });
- b.AddFlag(
- {
- .name = "dump-parse-tree",
- .help = R"""(
- Dump the parse tree to stdout when parsed.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&dump_parse_tree); });
- b.AddFlag(
- {
- .name = "preorder-parse-tree",
- .help = R"""(
- When dumping the parse tree, reorder it so that it is in preorder rather than
- postorder.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&preorder_parse_tree); });
- b.AddFlag(
- {
- .name = "dump-raw-sem-ir",
- .help = R"""(
- Dump the raw JSON structure of SemIR to stdout when built.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&dump_raw_sem_ir); });
- b.AddFlag(
- {
- .name = "dump-sem-ir",
- .help = R"""(
- Dump the SemIR to stdout when built.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&dump_sem_ir); });
- b.AddFlag(
- {
- .name = "builtin-sem-ir",
- .help = R"""(
- Include the SemIR for builtins when dumping it.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&builtin_sem_ir); });
- b.AddFlag(
- {
- .name = "dump-llvm-ir",
- .help = R"""(
- Dump the LLVM IR to stdout after lowering.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&dump_llvm_ir); });
- b.AddFlag(
- {
- .name = "dump-asm",
- .help = R"""(
- Dump the generated assembly to stdout after codegen.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&dump_asm); });
- b.AddFlag(
- {
- .name = "dump-mem-usage",
- .help = R"""(
- Dumps the amount of memory used.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&dump_mem_usage); });
- b.AddFlag(
- {
- .name = "prelude-import",
- .help = R"""(
- Whether to use the implicit prelude import. Enabled by default.
- )""",
- },
- [&](auto& arg_b) {
- arg_b.Default(true);
- arg_b.Set(&prelude_import);
- });
- b.AddStringOption(
- {
- .name = "exclude-dump-file-prefix",
- .value_name = "PREFIX",
- .help = R"""(
- Excludes files with the given prefix from dumps.
- )""",
- },
- [&](auto& arg_b) { arg_b.Set(&exclude_dump_file_prefix); });
- b.AddFlag(
- {
- .name = "debug-info",
- .help = R"""(
- Emit DWARF debug information.
- )""",
- },
- [&](auto& arg_b) {
- arg_b.Default(true);
- arg_b.Set(&include_debug_info);
- });
- }
- Phase phase;
- llvm::StringRef output_filename;
- llvm::SmallVector<llvm::StringRef> input_filenames;
- bool asm_output = false;
- bool force_obj_output = false;
- bool dump_shared_values = false;
- bool dump_tokens = false;
- bool dump_parse_tree = false;
- bool dump_raw_sem_ir = false;
- bool dump_sem_ir = false;
- bool dump_llvm_ir = false;
- bool dump_asm = false;
- bool dump_mem_usage = false;
- bool stream_errors = false;
- bool preorder_parse_tree = false;
- bool builtin_sem_ir = false;
- bool prelude_import = false;
- bool include_debug_info = true;
- llvm::StringRef exclude_dump_file_prefix;
- };
- struct Driver::LinkOptions {
- static constexpr CommandLine::CommandInfo Info = {
- .name = "link",
- .help = R"""(
- Link Carbon executables.
- This subcommand links Carbon executables by combining object files.
- TODO: Support linking binary libraries, both archives and shared libraries.
- TODO: Support linking against binary libraries.
- )""",
- };
- void Build(CommandLine::CommandBuilder& b, CodegenOptions& codegen_options) {
- b.AddStringPositionalArg(
- {
- .name = "OBJECT_FILE",
- .help = R"""(
- The input object files.
- )""",
- },
- [&](auto& arg_b) {
- arg_b.Required(true);
- arg_b.Append(&object_filenames);
- });
- b.AddStringOption(
- {
- .name = "output",
- .value_name = "FILE",
- .help = R"""(
- The linked file name. The output is always a linked binary.
- )""",
- },
- [&](auto& arg_b) {
- arg_b.Required(true);
- arg_b.Set(&output_filename);
- });
- codegen_options.Build(b);
- }
- llvm::StringRef output_filename;
- llvm::SmallVector<llvm::StringRef> object_filenames;
- };
- struct Driver::Options {
- static const CommandLine::CommandInfo Info;
- enum class Subcommand : int8_t {
- Compile,
- Link,
- };
- void Build(CommandLine::CommandBuilder& b) {
- b.AddFlag(
- {
- .name = "verbose",
- .short_name = "v",
- .help = "Enable verbose logging to the stderr stream.",
- },
- [&](CommandLine::FlagBuilder& arg_b) { arg_b.Set(&verbose); });
- b.AddSubcommand(CompileOptions::Info,
- [&](CommandLine::CommandBuilder& sub_b) {
- compile_options.Build(sub_b, codegen_options);
- sub_b.Do([&] { subcommand = Subcommand::Compile; });
- });
- b.AddSubcommand(LinkOptions::Info, [&](CommandLine::CommandBuilder& sub_b) {
- link_options.Build(sub_b, codegen_options);
- sub_b.Do([&] { subcommand = Subcommand::Link; });
- });
- b.RequiresSubcommand();
- }
- bool verbose;
- Subcommand subcommand;
- CodegenOptions codegen_options;
- CompileOptions compile_options;
- LinkOptions link_options;
- };
- // Note that this is not constexpr so that it can include information generated
- // in separate translation units and potentially overridden at link time in the
- // version string.
- const CommandLine::CommandInfo Driver::Options::Info = {
- .name = "carbon",
- .version = Version::ToolchainInfo,
- .help = R"""(
- This is the unified Carbon Language toolchain driver. Its subcommands provide
- all of the core behavior of the toolchain, including compilation, linking, and
- developer tools. Each of these has its own subcommand, and you can pass a
- specific subcommand to the `help` subcommand to get details about its usage.
- )""",
- .help_epilogue = R"""(
- For questions, issues, or bug reports, please use our GitHub project:
- https://github.com/carbon-language/carbon-lang
- )""",
- };
- auto Driver::ParseArgs(llvm::ArrayRef<llvm::StringRef> args, Options& options)
- -> CommandLine::ParseResult {
- return CommandLine::Parse(
- args, output_stream_, error_stream_, Options::Info,
- [&](CommandLine::CommandBuilder& b) { options.Build(b); });
- }
- auto Driver::RunCommand(llvm::ArrayRef<llvm::StringRef> args) -> RunResult {
- Options options;
- CommandLine::ParseResult result = ParseArgs(args, options);
- if (result == CommandLine::ParseResult::Error) {
- return {.success = false};
- } else if (result == CommandLine::ParseResult::MetaSuccess) {
- return {.success = true};
- }
- if (options.verbose) {
- // Note this implies streamed output in order to interleave.
- vlog_stream_ = &error_stream_;
- }
- switch (options.subcommand) {
- case Options::Subcommand::Compile:
- return Compile(options.compile_options, options.codegen_options);
- case Options::Subcommand::Link:
- return Link(options.link_options, options.codegen_options);
- }
- llvm_unreachable("All subcommands handled!");
- }
- auto Driver::ValidateCompileOptions(const CompileOptions& options) const
- -> bool {
- using Phase = CompileOptions::Phase;
- switch (options.phase) {
- case Phase::Lex:
- if (options.dump_parse_tree) {
- error_stream_ << "ERROR: Requested dumping the parse tree but compile "
- "phase is limited to '"
- << options.phase << "'.\n";
- return false;
- }
- [[fallthrough]];
- case Phase::Parse:
- if (options.dump_sem_ir) {
- error_stream_ << "ERROR: Requested dumping the SemIR but compile phase "
- "is limited to '"
- << options.phase << "'.\n";
- return false;
- }
- [[fallthrough]];
- case Phase::Check:
- if (options.dump_llvm_ir) {
- error_stream_ << "ERROR: Requested dumping the LLVM IR but compile "
- "phase is limited to '"
- << options.phase << "'.\n";
- return false;
- }
- [[fallthrough]];
- case Phase::Lower:
- case Phase::CodeGen:
- // Everything can be dumped in these phases.
- break;
- }
- return true;
- }
- // Ties together information for a file being compiled.
- class Driver::CompilationUnit {
- public:
- explicit CompilationUnit(Driver* driver, const CompileOptions& options,
- const CodegenOptions& codegen_options,
- DiagnosticConsumer* consumer,
- llvm::StringRef input_filename)
- : driver_(driver),
- options_(options),
- codegen_options_(codegen_options),
- input_filename_(input_filename),
- vlog_stream_(driver_->vlog_stream_) {
- if (vlog_stream_ != nullptr || options_.stream_errors) {
- consumer_ = consumer;
- } else {
- sorting_consumer_ = SortingDiagnosticConsumer(*consumer);
- consumer_ = &*sorting_consumer_;
- }
- if (options_.dump_mem_usage && IncludeInDumps()) {
- mem_usage_ = MemUsage();
- }
- }
- // Loads source and lexes it. Returns true on success.
- auto RunLex() -> void {
- LogCall("SourceBuffer::MakeFromFile", [&] {
- if (input_filename_ == "-") {
- source_ = SourceBuffer::MakeFromStdin(*consumer_);
- } else {
- source_ = SourceBuffer::MakeFromFile(driver_->fs_, input_filename_,
- *consumer_);
- }
- });
- if (mem_usage_) {
- mem_usage_->Add("source_", source_->text().size(),
- source_->text().size());
- }
- if (!source_) {
- success_ = false;
- return;
- }
- CARBON_VLOG() << "*** SourceBuffer ***\n```\n"
- << source_->text() << "\n```\n";
- LogCall("Lex::Lex",
- [&] { tokens_ = Lex::Lex(value_stores_, *source_, *consumer_); });
- if (options_.dump_tokens && IncludeInDumps()) {
- consumer_->Flush();
- driver_->output_stream_ << tokens_;
- }
- if (mem_usage_) {
- mem_usage_->Collect("tokens_", *tokens_);
- }
- CARBON_VLOG() << "*** Lex::TokenizedBuffer ***\n" << tokens_;
- if (tokens_->has_errors()) {
- success_ = false;
- }
- }
- // Parses tokens. Returns true on success.
- auto RunParse() -> void {
- CARBON_CHECK(tokens_);
- LogCall("Parse::Parse", [&] {
- parse_tree_ = Parse::Parse(*tokens_, *consumer_, vlog_stream_);
- });
- if (options_.dump_parse_tree && IncludeInDumps()) {
- consumer_->Flush();
- const auto& tree_and_subtrees = GetParseTreeAndSubtrees();
- if (options_.preorder_parse_tree) {
- tree_and_subtrees.PrintPreorder(driver_->output_stream_);
- } else {
- tree_and_subtrees.Print(driver_->output_stream_);
- }
- }
- if (mem_usage_) {
- mem_usage_->Collect("parse_tree_", *parse_tree_);
- }
- CARBON_VLOG() << "*** Parse::Tree ***\n" << parse_tree_;
- if (parse_tree_->has_errors()) {
- success_ = false;
- }
- }
- // Returns information needed to check this unit.
- auto GetCheckUnit() -> Check::Unit {
- CARBON_CHECK(parse_tree_);
- return {
- .value_stores = &value_stores_,
- .tokens = &*tokens_,
- .parse_tree = &*parse_tree_,
- .consumer = consumer_,
- .get_parse_tree_and_subtrees = [&]() -> const Parse::TreeAndSubtrees& {
- return GetParseTreeAndSubtrees();
- },
- .sem_ir = &sem_ir_};
- }
- // Runs post-check logic. Returns true if checking succeeded for the IR.
- auto PostCheck() -> void {
- CARBON_CHECK(sem_ir_);
- // We've finished all steps that can produce diagnostics. Emit the
- // diagnostics now, so that the developer sees them sooner and doesn't need
- // to wait for code generation.
- consumer_->Flush();
- if (mem_usage_) {
- mem_usage_->Collect("sem_ir_", *sem_ir_);
- }
- if (options_.dump_raw_sem_ir && IncludeInDumps()) {
- CARBON_VLOG() << "*** Raw SemIR::File ***\n" << *sem_ir_ << "\n";
- sem_ir_->Print(driver_->output_stream_, options_.builtin_sem_ir);
- if (options_.dump_sem_ir) {
- driver_->output_stream_ << "\n";
- }
- }
- bool print = options_.dump_sem_ir && IncludeInDumps();
- if (vlog_stream_ || print) {
- SemIR::Formatter formatter(*tokens_, *parse_tree_, *sem_ir_);
- if (vlog_stream_) {
- CARBON_VLOG() << "*** SemIR::File ***\n";
- formatter.Print(*vlog_stream_);
- }
- if (print) {
- formatter.Print(driver_->output_stream_);
- }
- }
- if (sem_ir_->has_errors()) {
- success_ = false;
- }
- }
- // Lower SemIR to LLVM IR.
- auto RunLower(const Check::SemIRDiagnosticConverter& converter) -> void {
- CARBON_CHECK(sem_ir_);
- LogCall("Lower::LowerToLLVM", [&] {
- llvm_context_ = std::make_unique<llvm::LLVMContext>();
- // TODO: Consider disabling instruction naming by default if we're not
- // producing textual LLVM IR.
- SemIR::InstNamer inst_namer(*tokens_, *parse_tree_, *sem_ir_);
- module_ = Lower::LowerToLLVM(*llvm_context_, options_.include_debug_info,
- converter, input_filename_, *sem_ir_,
- &inst_namer, vlog_stream_);
- });
- if (vlog_stream_) {
- CARBON_VLOG() << "*** llvm::Module ***\n";
- module_->print(*vlog_stream_, /*AAW=*/nullptr,
- /*ShouldPreserveUseListOrder=*/false,
- /*IsForDebug=*/true);
- }
- if (options_.dump_llvm_ir && IncludeInDumps()) {
- module_->print(driver_->output_stream_, /*AAW=*/nullptr,
- /*ShouldPreserveUseListOrder=*/true);
- }
- }
- auto RunCodeGen() -> void {
- CARBON_CHECK(module_);
- LogCall("CodeGen", [&] { success_ = RunCodeGenHelper(); });
- }
- // Runs post-compile logic. This is always called, and called after all other
- // actions on the CompilationUnit.
- auto PostCompile() -> void {
- if (options_.dump_shared_values && IncludeInDumps()) {
- Yaml::Print(driver_->output_stream_,
- value_stores_.OutputYaml(input_filename_));
- }
- if (mem_usage_) {
- mem_usage_->Collect("value_stores_", value_stores_);
- Yaml::Print(driver_->output_stream_,
- mem_usage_->OutputYaml(input_filename_));
- }
- // The diagnostics consumer must be flushed before compilation artifacts are
- // destructed, because diagnostics can refer to their state.
- consumer_->Flush();
- }
- auto input_filename() -> llvm::StringRef { return input_filename_; }
- auto success() -> bool { return success_; }
- auto has_source() -> bool { return source_.has_value(); }
- private:
- // Do codegen. Returns true on success.
- auto RunCodeGenHelper() -> bool {
- std::optional<CodeGen> codegen = CodeGen::Make(
- *module_, codegen_options_.target, driver_->error_stream_);
- if (!codegen) {
- return false;
- }
- if (vlog_stream_) {
- CARBON_VLOG() << "*** Assembly ***\n";
- codegen->EmitAssembly(*vlog_stream_);
- }
- if (options_.output_filename == "-") {
- // TODO: the output file name, forcing object output, and requesting
- // textual assembly output are all somewhat linked flags. We should add
- // some validation that they are used correctly.
- if (options_.force_obj_output) {
- if (!codegen->EmitObject(driver_->output_stream_)) {
- return false;
- }
- } else {
- if (!codegen->EmitAssembly(driver_->output_stream_)) {
- return false;
- }
- }
- } else {
- llvm::SmallString<256> output_filename = options_.output_filename;
- if (output_filename.empty()) {
- if (!source_->is_regular_file()) {
- // Don't invent file names like `-.o` or `/dev/stdin.o`.
- driver_->error_stream_
- << "ERROR: Output file name must be specified for input '"
- << input_filename_ << "' that is not a regular file.\n";
- return false;
- }
- output_filename = input_filename_;
- llvm::sys::path::replace_extension(output_filename,
- options_.asm_output ? ".s" : ".o");
- } else {
- // TODO: Handle the case where multiple input files were specified
- // along with an output file name. That should either be an error or
- // should produce a single LLVM IR module containing all inputs.
- // Currently each unit overwrites the output from the previous one in
- // this case.
- }
- CARBON_VLOG() << "Writing output to: " << output_filename << "\n";
- std::error_code ec;
- llvm::raw_fd_ostream output_file(output_filename, ec,
- llvm::sys::fs::OF_None);
- if (ec) {
- driver_->error_stream_ << "ERROR: Could not open output file '"
- << output_filename << "': " << ec.message()
- << "\n";
- return false;
- }
- if (options_.asm_output) {
- if (!codegen->EmitAssembly(output_file)) {
- return false;
- }
- } else {
- if (!codegen->EmitObject(output_file)) {
- return false;
- }
- }
- }
- return true;
- }
- // The TreeAndSubtrees is mainly used for debugging and diagnostics, and has
- // significant overhead. Avoid constructing it when unused.
- auto GetParseTreeAndSubtrees() -> const Parse::TreeAndSubtrees& {
- if (!parse_tree_and_subtrees_) {
- parse_tree_and_subtrees_ = Parse::TreeAndSubtrees(*tokens_, *parse_tree_);
- if (mem_usage_) {
- mem_usage_->Collect("parse_tree_and_subtrees_",
- *parse_tree_and_subtrees_);
- }
- }
- return *parse_tree_and_subtrees_;
- }
- // Wraps a call with log statements to indicate start and end.
- auto LogCall(llvm::StringLiteral label, llvm::function_ref<void()> fn)
- -> void {
- CARBON_VLOG() << "*** " << label << ": " << input_filename_ << " ***\n";
- fn();
- CARBON_VLOG() << "*** " << label << " done ***\n";
- }
- // Returns true if the file can be dumped.
- auto IncludeInDumps() const -> bool {
- return options_.exclude_dump_file_prefix.empty() ||
- !input_filename_.starts_with(options_.exclude_dump_file_prefix);
- }
- Driver* driver_;
- SharedValueStores value_stores_;
- const CompileOptions& options_;
- const CodegenOptions& codegen_options_;
- std::string input_filename_;
- // Copied from driver_ for CARBON_VLOG.
- llvm::raw_pwrite_stream* vlog_stream_;
- // Diagnostics are sent to consumer_, with optional sorting.
- std::optional<SortingDiagnosticConsumer> sorting_consumer_;
- DiagnosticConsumer* consumer_;
- bool success_ = true;
- // Tracks memory usage of the compile.
- std::optional<MemUsage> mem_usage_;
- // These are initialized as steps are run.
- std::optional<SourceBuffer> source_;
- std::optional<Lex::TokenizedBuffer> tokens_;
- std::optional<Parse::Tree> parse_tree_;
- std::optional<Parse::TreeAndSubtrees> parse_tree_and_subtrees_;
- std::optional<SemIR::File> sem_ir_;
- std::unique_ptr<llvm::LLVMContext> llvm_context_;
- std::unique_ptr<llvm::Module> module_;
- };
- auto Driver::Compile(const CompileOptions& options,
- const CodegenOptions& codegen_options) -> RunResult {
- if (!ValidateCompileOptions(options)) {
- return {.success = false};
- }
- // Find the files comprising the prelude if we are importing it.
- // TODO: Replace this with a search for library api files in a
- // package-specific search path based on the library name.
- llvm::SmallVector<std::string> prelude;
- if (options.prelude_import && options.phase >= CompileOptions::Phase::Check) {
- if (auto find = installation_->FindPreludeFiles(); find.ok()) {
- prelude = std::move(*find);
- } else {
- error_stream_ << "ERROR: " << find.error() << "\n";
- return {.success = false};
- }
- }
- // Prepare CompilationUnits before building scope exit handlers.
- StreamDiagnosticConsumer stream_consumer(error_stream_);
- llvm::SmallVector<std::unique_ptr<CompilationUnit>> units;
- units.reserve(prelude.size() + options.input_filenames.size());
- // Add the prelude files.
- for (const auto& input_filename : prelude) {
- units.push_back(std::make_unique<CompilationUnit>(
- this, options, codegen_options, &stream_consumer, input_filename));
- }
- // Add the input source files.
- for (const auto& input_filename : options.input_filenames) {
- units.push_back(std::make_unique<CompilationUnit>(
- this, options, codegen_options, &stream_consumer, input_filename));
- }
- auto on_exit = llvm::make_scope_exit([&]() {
- // Finish compilation units. This flushes their diagnostics in the order in
- // which they were specified on the command line.
- for (auto& unit : units) {
- unit->PostCompile();
- }
- stream_consumer.Flush();
- });
- // Returns a RunResult object. Called whenever Compile returns.
- auto make_result = [&]() {
- RunResult result = {.success = true};
- for (const auto& unit : units) {
- result.success &= unit->success();
- result.per_file_success.push_back(
- {unit->input_filename().str(), unit->success()});
- }
- return result;
- };
- // Lex.
- for (auto& unit : units) {
- unit->RunLex();
- }
- if (options.phase == CompileOptions::Phase::Lex) {
- return make_result();
- }
- // Parse and check phases examine `has_source` because they want to proceed if
- // lex failed, but not if source doesn't exist. Later steps are skipped if
- // anything failed, so don't need this.
- // Parse.
- for (auto& unit : units) {
- if (unit->has_source()) {
- unit->RunParse();
- }
- }
- if (options.phase == CompileOptions::Phase::Parse) {
- return make_result();
- }
- // Check.
- SharedValueStores builtin_value_stores;
- llvm::SmallVector<Check::Unit> check_units;
- for (auto& unit : units) {
- if (unit->has_source()) {
- check_units.push_back(unit->GetCheckUnit());
- }
- }
- llvm::SmallVector<Parse::NodeLocConverter> node_converters;
- node_converters.reserve(check_units.size());
- for (auto& unit : check_units) {
- node_converters.emplace_back(unit.tokens, unit.tokens->source().filename(),
- unit.get_parse_tree_and_subtrees);
- }
- CARBON_VLOG() << "*** Check::CheckParseTrees ***\n";
- Check::CheckParseTrees(check_units, node_converters, options.prelude_import,
- vlog_stream_);
- CARBON_VLOG() << "*** Check::CheckParseTrees done ***\n";
- for (auto& unit : units) {
- if (unit->has_source()) {
- unit->PostCheck();
- }
- }
- if (options.phase == CompileOptions::Phase::Check) {
- return make_result();
- }
- // Unlike previous steps, errors block further progress.
- if (std::any_of(units.begin(), units.end(),
- [&](const auto& unit) { return !unit->success(); })) {
- CARBON_VLOG() << "*** Stopping before lowering due to errors ***";
- return make_result();
- }
- // Lower.
- for (const auto& unit : units) {
- Check::SemIRDiagnosticConverter converter(node_converters,
- &**unit->GetCheckUnit().sem_ir);
- unit->RunLower(converter);
- }
- if (options.phase == CompileOptions::Phase::Lower) {
- return make_result();
- }
- CARBON_CHECK(options.phase == CompileOptions::Phase::CodeGen)
- << "CodeGen should be the last stage";
- // Codegen.
- for (auto& unit : units) {
- unit->RunCodeGen();
- }
- return make_result();
- }
- static void AddOSFlags(llvm::StringRef target,
- llvm::SmallVectorImpl<llvm::StringRef>& args) {
- llvm::Triple triple(target);
- switch (triple.getOS()) {
- case llvm::Triple::Darwin:
- case llvm::Triple::MacOSX:
- // On macOS we need to set the sysroot to a viable SDK. Currently, this
- // hard codes the path to be the unversioned symlink. The prefix is also
- // hard coded in Homebrew and so this seems likely to work reasonably
- // well. Homebrew and I suspect the Xcode Clang both have this hard coded
- // at build time, so this seems reasonably safe but we can revisit if/when
- // needed.
- args.push_back(
- "--sysroot=/Library/Developer/CommandLineTools/SDKs/MacOSX.sdk");
- // We also need to insist on a modern linker, otherwise the driver tries
- // too old and deprecated flags. The specific number here comes from an
- // inspection of the Clang driver source code to understand where features
- // were enabled, and this appears to be the latest version to control
- // driver behavior.
- //
- // TODO: We should replace this with use of `lld` eventually.
- args.push_back("-mlinker-version=705");
- break;
- default:
- // By default, just let the Clang driver handle everything.
- break;
- }
- }
- auto Driver::Link(const LinkOptions& options,
- const CodegenOptions& codegen_options) -> RunResult {
- // TODO: Currently we use the Clang driver to link. This works well on Unix
- // OSes but we likely need to directly build logic to invoke `link.exe` on
- // Windows where `cl.exe` doesn't typically cover that logic.
- // Use a reasonably large small vector here to minimize allocations. We expect
- // to link reasonably large numbers of object files.
- llvm::SmallVector<llvm::StringRef, 128> clang_args;
- // We link using a C++ mode of the driver.
- clang_args.push_back("--driver-mode=g++");
- // Use LLD, which we provide in our install directory, for linking.
- clang_args.push_back("-fuse-ld=lld");
- // Disable linking the C++ standard library until can build and ship it as
- // part of the Carbon toolchain. This clearly won't work once we get into
- // interop, but for now it avoids spurious failures and distraction. The plan
- // is to build and bundle libc++ at which point we can replace this with
- // pointing at our bundled library.
- // TODO: Replace this when ready.
- clang_args.push_back("-nostdlib++");
- // Add OS-specific flags based on the target.
- AddOSFlags(codegen_options.target, clang_args);
- clang_args.push_back("-o");
- clang_args.push_back(options.output_filename);
- clang_args.append(options.object_filenames.begin(),
- options.object_filenames.end());
- ClangRunner runner(installation_, codegen_options.target, vlog_stream_);
- return {.success = runner.Run(clang_args)};
- }
- } // namespace Carbon
|