Files
swift-mirror/lib/SymbolGraphGen/SymbolGraphGen.cpp
Dylan Sturgeon 4b4f9f18fc Add an option for symbol graph to support long module names. (#83782)
Currently symbol graphs are always written in files that contain 1 to 2
module names. It's possible for Swift module names to be very long, so
combining 2 of them in file name like `module1@module2...` in the same
path component means the name can be too long for some file systems. The
new option `-symbol-graph-shorten-output-names` changes the symbol graph
output files to use a MD5 hash of the module name(s) as the filename and
outputs an additional JSON file with the original names mapped to the
real filename. The module names JSON can be used to construct a VFS
overlay with the original naming scheme.

fix #83723

I considered using vfsoverlay, which seems like a viable solution, but
the vfsoverlay options don't seem to apply to any of the outputs from
the compiler. When I set an overlay to remap the symbol graph file
outputs, the remapped external paths aren't used so the root problem of
too long file names remains.
2025-11-06 19:30:44 -08:00

246 lines
8.5 KiB
C++

//===--- SymbolGraphGen.cpp - Symbol Graph Generator Entry Point ----------===//
//
// This source file is part of the Swift.org open source project
//
// Copyright (c) 2014 - 2017 Apple Inc. and the Swift project authors
// Licensed under Apache License v2.0 with Runtime Library Exception
//
// See https://swift.org/LICENSE.txt for license information
// See https://swift.org/CONTRIBUTORS.txt for the list of Swift project authors
//
//===----------------------------------------------------------------------===//
#include "swift/SymbolGraphGen/SymbolGraphGen.h"
#include "swift/AST/ASTContext.h"
#include "swift/AST/FileSystem.h"
#include "swift/AST/Import.h"
#include "swift/AST/Module.h"
#include "swift/AST/NameLookup.h"
#include "swift/Sema/IDETypeChecking.h"
#include "clang/Basic/Module.h"
#include "llvm/ADT/STLExtras.h"
#include "llvm/Support/JSON.h"
#include "llvm/Support/MD5.h"
#include "llvm/Support/Path.h"
#include "SymbolGraphASTWalker.h"
using namespace swift;
using namespace symbolgraphgen;
namespace {
/// Utility for managing symbol graph output file names.
class SymbolGraphWriter {
public:
SymbolGraphWriter(const SymbolGraphOptions &Options) : Options(Options) {}
bool
withOutputPath(DiagnosticEngine &Diags, llvm::vfs::OutputBackend &Backend,
StringRef ModuleName,
llvm::function_ref<bool(llvm::raw_pwrite_stream &)> Action) {
SmallString<32> FileName;
if (Options.ShortenOutputNames) {
llvm::MD5 Hash;
Hash.update(ModuleName);
llvm::MD5::MD5Result Result;
Hash.final(Result);
llvm::MD5::stringifyResult(Result, FileName);
} else {
FileName = ModuleName;
}
FileName.append(".symbols.json");
SymbolFileShortPaths.try_emplace(std::string(ModuleName), std::string(FileName));
SmallString<1024> OutputPath(Options.OutputDir);
llvm::sys::path::append(OutputPath, FileName);
return swift::withOutputPath(Diags, Backend, OutputPath, Action);
}
bool finalize(DiagnosticEngine &Diags, llvm::vfs::OutputBackend &Backend) {
if (!Options.ShortenOutputNames) {
return false; // No errors.
}
SmallString<1024> OutputPath(Options.OutputDir);
llvm::sys::path::append(OutputPath, "symbol_modules.json");
return swift::withOutputPath(
Diags, Backend, OutputPath, [&](raw_ostream &OS) {
llvm::json::OStream JSON(OS, Options.PrettyPrint ? 2 : 0);
JSON.object([&] {
// Insert the module to real filename mappings in a deterministic
// order. Enumerating the map returns the keys in order.
JSON.attributeObject("modules", [&] {
for (const auto &[K, V] : SymbolFileShortPaths) {
JSON.attribute(K, V);
}
});
});
return false;
});
}
private:
const SymbolGraphOptions &Options;
std::map<std::string, std::string> SymbolFileShortPaths;
};
int serializeSymbolGraph(SymbolGraph &SG, const SymbolGraphOptions &Options,
SymbolGraphWriter &Writer) {
SmallString<256> FileName;
FileName.append(getFullModuleName(&SG.M));
if (SG.ExtendedModule.has_value()) {
FileName.push_back('@');
// FileName.append(SG.ExtendedModule.value()->getNameStr());
FileName.append(getFullModuleName(SG.ExtendedModule.value()));
} else if (SG.DeclaringModule.has_value()) {
// Treat cross-import overlay modules as "extensions" of their declaring
// module
FileName.push_back('@');
// FileName.append(SG.DeclaringModule.value()->getNameStr());
FileName.append(getFullModuleName(SG.DeclaringModule.value()));
}
return Writer.withOutputPath(
SG.M.getASTContext().Diags, SG.M.getASTContext().getOutputBackend(),
FileName, [&](raw_ostream &OS) {
llvm::json::OStream J(OS, Options.PrettyPrint ? 2 : 0);
SG.serialize(J);
return false;
});
}
} // end anonymous namespace
// MARK: - Main Entry Point
/// Emit a symbol graph JSON file for a `ModuleDecl`.
int symbolgraphgen::emitSymbolGraphForModule(
ModuleDecl *M, const SymbolGraphOptions &Options) {
ModuleDecl::ImportCollector importCollector(Options.MinimumAccessLevel);
SmallPtrSet<const clang::Module *, 2> ExportedClangModules = {};
SmallPtrSet<const clang::Module *, 2> WildcardExportClangModules = {};
if (const auto *ClangModule = M->findUnderlyingClangModule()) {
// Scan through the Clang module's exports and collect them for later
// handling
for (auto ClangExport : ClangModule->Exports) {
if (ClangExport.getInt()) {
// Blanket exports are represented as a true boolean tag
if (const auto *ExportParent = ClangExport.getPointer()) {
// If a pointer is present, this is a scoped blanket export, like
// `export Submodule.*`
WildcardExportClangModules.insert(ExportParent);
} else {
// Otherwise it represents a full blanket `export *`
WildcardExportClangModules.insert(ClangModule);
}
} else if (!ClangExport.getInt() && ClangExport.getPointer()) {
// This is an explicit `export Submodule`
ExportedClangModules.insert(ClangExport.getPointer());
}
}
if (ExportedClangModules.empty() && WildcardExportClangModules.empty()) {
// HACK: In the absence of an explicit export declaration, export all of the submodules.
WildcardExportClangModules.insert(ClangModule);
}
}
auto importFilter = [&Options, &WildcardExportClangModules,
&ExportedClangModules](const ModuleDecl *module) {
if (!module)
return false;
if (const auto *ClangModule = module->findUnderlyingClangModule()) {
if (ExportedClangModules.contains(ClangModule)) {
return true;
}
for (const auto *ClangParent : WildcardExportClangModules) {
if (ClangModule->isSubModuleOf(ClangParent))
return true;
}
}
if (Options.AllowedReexportedModules.has_value())
for (const auto &allowedModuleName : *Options.AllowedReexportedModules)
if (allowedModuleName == module->getNameStr())
return true;
return false;
};
if (Options.AllowedReexportedModules.has_value() ||
!WildcardExportClangModules.empty() || !ExportedClangModules.empty())
importCollector.importFilter = std::move(importFilter);
SmallVector<Decl *, 64> ModuleDecls;
swift::getTopLevelDeclsForDisplay(
M, ModuleDecls, [&importCollector](ModuleDecl *M, SmallVectorImpl<Decl *> &results) {
M->getDisplayDeclsRecursivelyAndImports(results, importCollector);
});
if (Options.PrintMessages)
llvm::errs() << ModuleDecls.size()
<< " top-level declarations in this module.\n";
SymbolGraphASTWalker Walker(*M, importCollector.imports,
importCollector.qualifiedImports, Options);
for (auto *Decl : ModuleDecls) {
Walker.walk(Decl);
}
if (Options.PrintMessages)
llvm::errs()
<< "Found " << Walker.MainGraph.Nodes.size() << " symbols and "
<< Walker.MainGraph.Edges.size() << " relationships.\n";
int Success = EXIT_SUCCESS;
SymbolGraphWriter Writer(Options);
Success |= serializeSymbolGraph(Walker.MainGraph, Options, Writer);
for (const auto &Entry : Walker.ExtendedModuleGraphs) {
if (Entry.getValue()->empty()) {
continue;
}
Success |= serializeSymbolGraph(*Entry.getValue(), Options, Writer);
}
Success |=
Writer.finalize(Walker.MainGraph.M.getASTContext().Diags,
Walker.MainGraph.M.getASTContext().getOutputBackend());
return Success;
}
int symbolgraphgen::
printSymbolGraphForDecl(const ValueDecl *D, Type BaseTy,
bool InSynthesizedExtension,
const SymbolGraphOptions &Options,
llvm::raw_ostream &OS,
SmallVectorImpl<PathComponent> &ParentContexts,
SmallVectorImpl<FragmentInfo> &FragmentInfo) {
if (!Symbol::supportsKind(D->getKind()))
return EXIT_FAILURE;
llvm::json::OStream JOS(OS, Options.PrettyPrint ? 2 : 0);
ModuleDecl *MD = D->getModuleContext();
SymbolGraphASTWalker Walker(*MD, Options);
markup::MarkupContext MarkupCtx;
SymbolGraph Graph(Walker, *MD, std::nullopt, MarkupCtx, std::nullopt,
/*IsForSingleNode=*/true);
NominalTypeDecl *NTD = InSynthesizedExtension
? BaseTy->getAnyNominal()
: nullptr;
Symbol MySym(&Graph, D, NTD, BaseTy);
MySym.getPathComponents(ParentContexts);
MySym.getFragmentInfo(FragmentInfo);
Graph.recordNode(MySym);
Graph.serialize(JOS);
return EXIT_SUCCESS;
}