From fe929aa33c226b8d60268420f78fc38d783ec5e5 Mon Sep 17 00:00:00 2001 From: Sean Callanan Date: Fri, 16 Dec 2016 23:21:38 +0000 Subject: [PATCH] Testbed and skeleton of a new expression parser LLVM's JIT is now the foundation of dynamic-compilation features for many languages. Clang also has low-level support for dynamic compilation (ASTImporter and ExternalASTSource, notably). How the compiler is set up for dynamic parsing is generally left up to individual clients, for example LLDB's C/C++/Objective-C expression parser and the ROOT project. Although this arrangement offers external clients the flexibility to implement dynamic features as they see fit, the lack of an in-tree client means that subtle bugs can be introduced that cause regressions in the external clients but aren't caught by tests (or users) until much later. LLDB for example regularly encounters complicated ODR violation scenarios where it is not immediately clear who is at fault. Other external clients (notably, Cling) rely on similar functionality, and another goal is to break this functionality up into composable parts so that any client can be built easily on top of Clang without requiring extensive additional code. I propose that the parts required to build a simple expression parser be added to Clang. Initially, I aim to have the following features: - A piece that looks up external declarations from a variety of sources (e.g., from previous dynamic compilations, from modules, or from DWARF) and uses clear conflict resolution rules to reconcile differences, with easily understood errors. This functionality will be supported by in-tree tests. - A piece that works hand in hand with the LLVM JIT to resolve the locations of external declarations so that e.g. variables can be redeclared and (for high-performance applications like DTrace) external variables can be accessed directly from the registers where they reside. This commit adds a tester that parses a sequence of source files and then uses them as source data for an expression. External references are resolved using an ExternalASTSource that responds to name queries using an ASTImporter. This is the setup that LLDB uses, and the motivating reason for MinimalImport in ASTImporter. When complete, this tester will implement the first of the above goals. Differential Revision: https://reviews.llvm.org/D27180 llvm-svn: 290004 --- clang/test/CMakeLists.txt | 1 + clang/test/Import/clang-flags/Inputs/S.c | 2 + clang/test/Import/clang-flags/test.c | 5 + clang/test/Import/empty-struct/Inputs/S.c | 2 + clang/test/Import/empty-struct/test.c | 5 + .../Import/error-in-expression/Inputs/S.c | 2 + clang/test/Import/error-in-expression/test.c | 6 + clang/test/Import/error-in-import/Inputs/S.c | 2 + clang/test/Import/error-in-import/test.c | 6 + clang/test/Import/missing-import/test.c | 6 + clang/tools/CMakeLists.txt | 1 + clang/tools/clang-import-test/CMakeLists.txt | 24 ++ .../clang-import-test/clang-import-test.cpp | 319 ++++++++++++++++++ 13 files changed, 381 insertions(+) create mode 100644 clang/test/Import/clang-flags/Inputs/S.c create mode 100644 clang/test/Import/clang-flags/test.c create mode 100644 clang/test/Import/empty-struct/Inputs/S.c create mode 100644 clang/test/Import/empty-struct/test.c create mode 100644 clang/test/Import/error-in-expression/Inputs/S.c create mode 100644 clang/test/Import/error-in-expression/test.c create mode 100644 clang/test/Import/error-in-import/Inputs/S.c create mode 100644 clang/test/Import/error-in-import/test.c create mode 100644 clang/test/Import/missing-import/test.c create mode 100644 clang/tools/clang-import-test/CMakeLists.txt create mode 100644 clang/tools/clang-import-test/clang-import-test.cpp diff --git a/clang/test/CMakeLists.txt b/clang/test/CMakeLists.txt index 8ba9040a92af..46bf2ae213ae 100644 --- a/clang/test/CMakeLists.txt +++ b/clang/test/CMakeLists.txt @@ -39,6 +39,7 @@ list(APPEND CLANG_TEST_DEPS c-index-test diagtool clang-tblgen clang-offload-bundler + clang-import-test ) if(CLANG_ENABLE_STATIC_ANALYZER) diff --git a/clang/test/Import/clang-flags/Inputs/S.c b/clang/test/Import/clang-flags/Inputs/S.c new file mode 100644 index 000000000000..742dac8a35b4 --- /dev/null +++ b/clang/test/Import/clang-flags/Inputs/S.c @@ -0,0 +1,2 @@ +STRUCT S { +}; diff --git a/clang/test/Import/clang-flags/test.c b/clang/test/Import/clang-flags/test.c new file mode 100644 index 000000000000..7a19ea7ff648 --- /dev/null +++ b/clang/test/Import/clang-flags/test.c @@ -0,0 +1,5 @@ +// RUN: clang-import-test -import %S/Inputs/S.c -expression %s -Xcc -DSTRUCT=struct +void expr() { + STRUCT S MyS; + void *MyPtr = &MyS; +} diff --git a/clang/test/Import/empty-struct/Inputs/S.c b/clang/test/Import/empty-struct/Inputs/S.c new file mode 100644 index 000000000000..8c90352bc463 --- /dev/null +++ b/clang/test/Import/empty-struct/Inputs/S.c @@ -0,0 +1,2 @@ +struct S { +}; diff --git a/clang/test/Import/empty-struct/test.c b/clang/test/Import/empty-struct/test.c new file mode 100644 index 000000000000..d51a69706dcd --- /dev/null +++ b/clang/test/Import/empty-struct/test.c @@ -0,0 +1,5 @@ +// RUN: clang-import-test -import %S/Inputs/S.c -expression %s +void expr() { + struct S MyS; + void *MyPtr = &MyS; +} diff --git a/clang/test/Import/error-in-expression/Inputs/S.c b/clang/test/Import/error-in-expression/Inputs/S.c new file mode 100644 index 000000000000..8c90352bc463 --- /dev/null +++ b/clang/test/Import/error-in-expression/Inputs/S.c @@ -0,0 +1,2 @@ +struct S { +}; diff --git a/clang/test/Import/error-in-expression/test.c b/clang/test/Import/error-in-expression/test.c new file mode 100644 index 000000000000..65d3b4a5dcb0 --- /dev/null +++ b/clang/test/Import/error-in-expression/test.c @@ -0,0 +1,6 @@ +// RUN: not clang-import-test -import %S/Inputs/S.c -expression %s 2>&1 | FileCheck %s +// CHECK: {{.*}}no viable conversion{{.*}} +void expr() { + struct S MyS; + void *MyPtr = MyS; +} diff --git a/clang/test/Import/error-in-import/Inputs/S.c b/clang/test/Import/error-in-import/Inputs/S.c new file mode 100644 index 000000000000..23ca763f6798 --- /dev/null +++ b/clang/test/Import/error-in-import/Inputs/S.c @@ -0,0 +1,2 @@ +struct S [ +]; diff --git a/clang/test/Import/error-in-import/test.c b/clang/test/Import/error-in-import/test.c new file mode 100644 index 000000000000..197d4e30426a --- /dev/null +++ b/clang/test/Import/error-in-import/test.c @@ -0,0 +1,6 @@ +// RUN: not clang-import-test -import %S/Inputs/S.c -expression %s 2>&1 | FileCheck %s +// CHECK: {{.*}}expected unqualified-id{{.*}} +void expr() { + struct S MyS; + void *MyPtr = &MyS; +} diff --git a/clang/test/Import/missing-import/test.c b/clang/test/Import/missing-import/test.c new file mode 100644 index 000000000000..acf6389cc5fc --- /dev/null +++ b/clang/test/Import/missing-import/test.c @@ -0,0 +1,6 @@ +// RUN: not clang-import-test -import %S/Inputs/S.c -expression %s 2>&1 | FileCheck %s +// CHECK: {{.*}}Couldn't open{{.*}}Inputs/S.c{{.*}} +void expr() { + struct S MyS; + void *MyPtr = &MyS; +} diff --git a/clang/tools/CMakeLists.txt b/clang/tools/CMakeLists.txt index b8850e454688..b0c97f0f1e4c 100644 --- a/clang/tools/CMakeLists.txt +++ b/clang/tools/CMakeLists.txt @@ -5,6 +5,7 @@ add_clang_subdirectory(driver) add_clang_subdirectory(clang-format) add_clang_subdirectory(clang-format-vs) add_clang_subdirectory(clang-fuzzer) +add_clang_subdirectory(clang-import-test) add_clang_subdirectory(clang-offload-bundler) add_clang_subdirectory(c-index-test) diff --git a/clang/tools/clang-import-test/CMakeLists.txt b/clang/tools/clang-import-test/CMakeLists.txt new file mode 100644 index 000000000000..4d41a5674ae6 --- /dev/null +++ b/clang/tools/clang-import-test/CMakeLists.txt @@ -0,0 +1,24 @@ +set(LLVM_LINK_COMPONENTS + support +) + +if(NOT CLANG_BUILT_STANDALONE) + set(tablegen_deps intrinsics_gen) +endif() + +add_clang_tool(clang-import-test + clang-import-test.cpp + DEPENDS + ${tablegen_deps} + ) + +set(CLANG_IMPORT_TEST_LIB_DEPS + clangAST + clangBasic + clangCodeGen + clangFrontend + ) + +target_link_libraries(clang-import-test + ${CLANG_IMPORT_TEST_LIB_DEPS} + ) diff --git a/clang/tools/clang-import-test/clang-import-test.cpp b/clang/tools/clang-import-test/clang-import-test.cpp new file mode 100644 index 000000000000..931b46245bb7 --- /dev/null +++ b/clang/tools/clang-import-test/clang-import-test.cpp @@ -0,0 +1,319 @@ +//===-- import-test.cpp - ASTImporter/ExternalASTSource testbed -----------===// +// +// The LLVM Compiler Infrastructure +// +// This file is distributed under the University of Illinois Open Source +// License. See LICENSE.TXT for details. +// +//===----------------------------------------------------------------------===// + +#include "clang/AST/ASTContext.h" +#include "clang/AST/ASTImporter.h" +#include "clang/Basic/Builtins.h" +#include "clang/Basic/IdentifierTable.h" +#include "clang/Basic/SourceLocation.h" +#include "clang/Basic/TargetInfo.h" +#include "clang/Basic/TargetOptions.h" +#include "clang/CodeGen/ModuleBuilder.h" +#include "clang/Frontend/CompilerInstance.h" +#include "clang/Frontend/TextDiagnosticBuffer.h" +#include "clang/Lex/Lexer.h" +#include "clang/Lex/Preprocessor.h" +#include "clang/Parse/ParseAST.h" + +#include "llvm/IR/LLVMContext.h" +#include "llvm/Support/CommandLine.h" +#include "llvm/Support/Error.h" +#include "llvm/Support/Host.h" +#include "llvm/Support/Signals.h" + +#include +#include + +using namespace clang; + +static llvm::cl::opt Expression( + "expression", llvm::cl::Required, + llvm::cl::desc("Path to a file containing the expression to parse")); + +static llvm::cl::list + Imports("import", llvm::cl::ZeroOrMore, + llvm::cl::desc("Path to a file containing declarations to import")); + +static llvm::cl::list + ClangArgs("Xcc", llvm::cl::ZeroOrMore, + llvm::cl::desc("Argument to pass to the CompilerInvocation"), + llvm::cl::CommaSeparated); + +namespace init_convenience { +class TestDiagnosticConsumer : public DiagnosticConsumer { +private: + std::unique_ptr Passthrough; + const LangOptions *LangOpts = nullptr; + +public: + TestDiagnosticConsumer() + : Passthrough(llvm::make_unique()) {} + + virtual void BeginSourceFile(const LangOptions &LangOpts, + const Preprocessor *PP = nullptr) override { + this->LangOpts = &LangOpts; + return Passthrough->BeginSourceFile(LangOpts, PP); + } + + virtual void EndSourceFile() override { + this->LangOpts = nullptr; + Passthrough->EndSourceFile(); + } + + virtual bool IncludeInDiagnosticCounts() const override { + return Passthrough->IncludeInDiagnosticCounts(); + } + +private: + static void PrintSourceForLocation(const SourceLocation &Loc, + SourceManager &SM) { + const char *LocData = SM.getCharacterData(Loc, /*Invalid=*/nullptr); + unsigned LocColumn = + SM.getSpellingColumnNumber(Loc, /*Invalid=*/nullptr) - 1; + FileID FID = SM.getFileID(Loc); + llvm::MemoryBuffer *Buffer = SM.getBuffer(FID, Loc, /*Invalid=*/nullptr); + + assert(LocData >= Buffer->getBufferStart() && + LocData < Buffer->getBufferEnd()); + + const char *LineBegin = LocData - LocColumn; + + assert(LineBegin >= Buffer->getBufferStart()); + + const char *LineEnd = nullptr; + + for (LineEnd = LineBegin; *LineEnd != '\n' && *LineEnd != '\r' && + LineEnd < Buffer->getBufferEnd(); + ++LineEnd) + ; + + llvm::StringRef LineString(LineBegin, LineEnd - LineBegin); + + llvm::errs() << LineString << '\n'; + std::string Space(LocColumn, ' '); + llvm::errs() << Space.c_str() << '\n'; + } + + virtual void HandleDiagnostic(DiagnosticsEngine::Level DiagLevel, + const Diagnostic &Info) override { + if (Info.hasSourceManager() && LangOpts) { + SourceManager &SM = Info.getSourceManager(); + + if (Info.getLocation().isValid()) { + Info.getLocation().print(llvm::errs(), SM); + llvm::errs() << ": "; + } + + SmallString<16> DiagText; + Info.FormatDiagnostic(DiagText); + llvm::errs() << DiagText << '\n'; + + if (Info.getLocation().isValid()) { + PrintSourceForLocation(Info.getLocation(), SM); + } + + for (const CharSourceRange &Range : Info.getRanges()) { + bool Invalid = true; + StringRef Ref = Lexer::getSourceText(Range, SM, *LangOpts, &Invalid); + if (!Invalid) { + llvm::errs() << Ref.str() << '\n'; + } + } + } + DiagnosticConsumer::HandleDiagnostic(DiagLevel, Info); + } +}; + +std::unique_ptr +BuildCompilerInstance(ArrayRef ClangArgv) { + auto Ins = llvm::make_unique(); + auto DC = llvm::make_unique(); + const bool ShouldOwnClient = true; + Ins->createDiagnostics(DC.release(), ShouldOwnClient); + + auto Inv = llvm::make_unique(); + + CompilerInvocation::CreateFromArgs(*Inv, ClangArgv.data(), + &ClangArgv.data()[ClangArgv.size()], + Ins->getDiagnostics()); + + Inv->getLangOpts()->CPlusPlus = true; + Inv->getLangOpts()->CPlusPlus11 = true; + Inv->getHeaderSearchOpts().UseLibcxx = true; + Inv->getLangOpts()->Bool = true; + Inv->getLangOpts()->WChar = true; + Inv->getLangOpts()->Blocks = true; + Inv->getLangOpts()->DebuggerSupport = true; + Inv->getLangOpts()->SpellChecking = false; + Inv->getLangOpts()->ThreadsafeStatics = false; + Inv->getLangOpts()->AccessControl = false; + Inv->getLangOpts()->DollarIdents = true; + Inv->getCodeGenOpts().setDebugInfo(codegenoptions::FullDebugInfo); + Inv->getTargetOpts().Triple = llvm::sys::getDefaultTargetTriple(); + + Ins->setInvocation(Inv.release()); + + TargetInfo *TI = TargetInfo::CreateTargetInfo( + Ins->getDiagnostics(), Ins->getInvocation().TargetOpts); + Ins->setTarget(TI); + Ins->getTarget().adjust(Ins->getLangOpts()); + Ins->createFileManager(); + Ins->createSourceManager(Ins->getFileManager()); + Ins->createPreprocessor(TU_Complete); + + return Ins; +} + +std::unique_ptr +BuildASTContext(CompilerInstance &CI, SelectorTable &ST, Builtin::Context &BC) { + auto AST = llvm::make_unique( + CI.getLangOpts(), CI.getSourceManager(), + CI.getPreprocessor().getIdentifierTable(), ST, BC); + AST->InitBuiltinTypes(CI.getTarget()); + return AST; +} + +std::unique_ptr BuildCodeGen(CompilerInstance &CI, + llvm::LLVMContext &LLVMCtx) { + StringRef ModuleName("$__module"); + return std::unique_ptr(CreateLLVMCodeGen( + CI.getDiagnostics(), ModuleName, CI.getHeaderSearchOpts(), + CI.getPreprocessorOpts(), CI.getCodeGenOpts(), LLVMCtx)); +} +} // end namespace + +namespace { +class TestExternalASTSource : public ExternalASTSource { +private: + llvm::ArrayRef> ImportCIs; + std::map> ForwardImporters; + std::map> ReverseImporters; + +public: + TestExternalASTSource( + CompilerInstance &ExpressionCI, + llvm::ArrayRef> ImportCIs) + : ImportCIs(ImportCIs) { + for (const std::unique_ptr &ImportCI : ImportCIs) { + ForwardImporters[ImportCI.get()] = llvm::make_unique( + ExpressionCI.getASTContext(), ExpressionCI.getFileManager(), + ImportCI->getASTContext(), ImportCI->getFileManager(), + /*MinimalImport=*/true); + ReverseImporters[ImportCI.get()] = llvm::make_unique( + ImportCI->getASTContext(), ImportCI->getFileManager(), + ExpressionCI.getASTContext(), ExpressionCI.getFileManager(), + /*MinimalImport=*/true); + } + } + + bool FindExternalVisibleDeclsByName(const DeclContext *DC, + DeclarationName Name) override { + llvm::SmallVector Decls; + + if (isa(DC)) { + for (const std::unique_ptr &I : ImportCIs) { + DeclarationName FromName = ReverseImporters[I.get()]->Import(Name); + DeclContextLookupResult Result = + I->getASTContext().getTranslationUnitDecl()->lookup(FromName); + for (NamedDecl *FromD : Result) { + NamedDecl *D = + llvm::cast(ForwardImporters[I.get()]->Import(FromD)); + Decls.push_back(D); + } + } + } + if (Decls.empty()) { + return false; + } else { + SetExternalVisibleDeclsForName(DC, Name, Decls); + return true; + } + } +}; + +void AddExternalSource( + CompilerInstance &CI, + llvm::ArrayRef> Imports) { + ASTContext &AST = CI.getASTContext(); + auto ES = llvm::make_unique(CI, Imports); + AST.setExternalSource(ES.release()); + AST.getTranslationUnitDecl()->setHasExternalVisibleStorage(); +} + +llvm::Error ParseSource(const std::string &Path, CompilerInstance &CI, + CodeGenerator &CG) { + SourceManager &SM = CI.getSourceManager(); + const FileEntry *FE = CI.getFileManager().getFile(Path); + if (!FE) { + return llvm::make_error( + llvm::Twine("Couldn't open ", Path), std::error_code()); + } + SM.setMainFileID(SM.createFileID(FE, SourceLocation(), SrcMgr::C_User)); + ParseAST(CI.getPreprocessor(), &CG, CI.getASTContext()); + return llvm::Error::success(); +} + +llvm::Expected> +Parse(const std::string &Path, + llvm::ArrayRef> Imports) { + std::vector ClangArgv(ClangArgs.size()); + std::transform(ClangArgs.begin(), ClangArgs.end(), ClangArgv.begin(), + [](const std::string &s) -> const char * { return s.data(); }); + std::unique_ptr CI = + init_convenience::BuildCompilerInstance(ClangArgv); + auto ST = llvm::make_unique(); + auto BC = llvm::make_unique(); + std::unique_ptr AST = + init_convenience::BuildASTContext(*CI, *ST, *BC); + CI->setASTContext(AST.release()); + AddExternalSource(*CI, Imports); + + auto LLVMCtx = llvm::make_unique(); + std::unique_ptr CG = + init_convenience::BuildCodeGen(*CI, *LLVMCtx); + CG->Initialize(CI->getASTContext()); + + CI->getDiagnosticClient().BeginSourceFile(CI->getLangOpts(), + &CI->getPreprocessor()); + if (llvm::Error PE = ParseSource(Path, *CI, *CG)) { + return std::move(PE); + } + CI->getDiagnosticClient().EndSourceFile(); + if (CI->getDiagnosticClient().getNumErrors()) { + return llvm::make_error( + "Errors occured while parsing the expression.", std::error_code()); + } else { + return std::move(CI); + } +} +} // end namespace + +int main(int argc, const char **argv) { + const bool DisableCrashReporting = true; + llvm::sys::PrintStackTraceOnErrorSignal(argv[0], DisableCrashReporting); + llvm::cl::ParseCommandLineOptions(argc, argv); + std::vector> ImportCIs; + for (auto I : Imports) { + llvm::Expected> ImportCI = Parse(I, {}); + if (auto E = ImportCI.takeError()) { + llvm::errs() << llvm::toString(std::move(E)); + exit(-1); + } else { + ImportCIs.push_back(std::move(*ImportCI)); + } + } + llvm::Expected> ExpressionCI = + Parse(Expression, ImportCIs); + if (auto E = ExpressionCI.takeError()) { + llvm::errs() << llvm::toString(std::move(E)); + exit(-1); + } else { + return 0; + } +}