Files
clice/tests/unit/syntax/scan_tests.cpp
2026-03-22 23:37:08 +08:00

450 lines
12 KiB
C++

#include "test/test.h"
#include "syntax/scan.h"
namespace clice::testing {
namespace {
/// Helper: find entry in StringMap whose key contains the given substring.
template <typename T>
auto find_by_substr(llvm::StringMap<T>& map, llvm::StringRef substr) {
for(auto it = map.begin(); it != map.end(); ++it) {
if(it->first().contains(substr)) {
return it;
}
}
return map.end();
}
TEST_SUITE(Scan) {
// === scan() tests ===
TEST_CASE(BasicIncludes) {
auto result = scan(R"(
#include <vector>
#include "foo/bar.h"
int x = 1;
)");
ASSERT_EQ(result.includes.size(), 2u);
EXPECT_EQ(result.includes[0].path, "vector");
EXPECT_FALSE(result.includes[0].conditional);
EXPECT_EQ(result.includes[1].path, "foo/bar.h");
EXPECT_FALSE(result.includes[1].conditional);
EXPECT_TRUE(result.module_name.empty());
}
TEST_CASE(ConditionalIncludes) {
auto result = scan(R"(
#include <always.h>
#ifdef FOO
#include <conditional.h>
#endif
#include <after.h>
)");
ASSERT_EQ(result.includes.size(), 3u);
EXPECT_EQ(result.includes[0].path, "always.h");
EXPECT_FALSE(result.includes[0].conditional);
EXPECT_EQ(result.includes[1].path, "conditional.h");
EXPECT_TRUE(result.includes[1].conditional);
EXPECT_EQ(result.includes[2].path, "after.h");
EXPECT_FALSE(result.includes[2].conditional);
}
TEST_CASE(NestedConditionals) {
auto result = scan(R"(
#ifdef A
#ifdef B
#include <nested.h>
#endif
#include <outer.h>
#endif
#include <top.h>
)");
ASSERT_EQ(result.includes.size(), 3u);
EXPECT_EQ(result.includes[0].path, "nested.h");
EXPECT_TRUE(result.includes[0].conditional);
EXPECT_EQ(result.includes[1].path, "outer.h");
EXPECT_TRUE(result.includes[1].conditional);
EXPECT_EQ(result.includes[2].path, "top.h");
EXPECT_FALSE(result.includes[2].conditional);
}
TEST_CASE(ModuleDeclaration) {
auto result = scan(R"(
module;
#include <header.h>
export module my.module;
)");
EXPECT_EQ(result.module_name, "my.module");
EXPECT_TRUE(result.is_interface_unit);
EXPECT_FALSE(result.need_preprocess);
ASSERT_EQ(result.includes.size(), 1u);
EXPECT_EQ(result.includes[0].path, "header.h");
}
TEST_CASE(ModulePartition) {
auto result = scan(R"(
module my.module:part;
)");
EXPECT_EQ(result.module_name, "my.module:part");
EXPECT_FALSE(result.is_interface_unit);
}
TEST_CASE(ModuleImplementation) {
auto result = scan(R"(
module my.module;
)");
EXPECT_EQ(result.module_name, "my.module");
EXPECT_FALSE(result.is_interface_unit);
}
TEST_CASE(ConditionalModule) {
auto result = scan(R"(
#ifdef USE_MODULES
export module foo;
#endif
)");
EXPECT_TRUE(result.module_name.empty());
EXPECT_TRUE(result.need_preprocess);
}
TEST_CASE(GlobalModuleFragment) {
auto result = scan(R"(
module;
export module test;
)");
EXPECT_EQ(result.module_name, "test");
EXPECT_TRUE(result.is_interface_unit);
}
TEST_CASE(EmptyContent) {
auto result = scan("");
EXPECT_TRUE(result.includes.empty());
EXPECT_TRUE(result.module_name.empty());
EXPECT_FALSE(result.need_preprocess);
}
TEST_CASE(NoDirectives) {
auto result = scan(R"(
int main() {
return 0;
}
)");
EXPECT_TRUE(result.includes.empty());
EXPECT_TRUE(result.module_name.empty());
}
// === scan_fuzzy() tests ===
TEST_CASE(FuzzyBasic) {
auto vfs = llvm::makeIntrusiveRefCnt<TestVFS>();
auto main_path = TestVFS::path("main.cpp");
vfs->add("main.cpp", R"(
#include "header.h"
int main() {}
)");
vfs->add("header.h", R"(
#pragma once
int x = 1;
)");
auto args = std::vector<const char*>{"clang++", "-std=c++20", main_path.c_str()};
auto results = scan_fuzzy(args, TestVFS::root(), {}, nullptr, vfs);
auto main_it = find_by_substr(results, "main.cpp");
ASSERT_TRUE(main_it != results.end());
ASSERT_EQ(main_it->second.includes.size(), 1u);
EXPECT_FALSE(main_it->second.includes[0].not_found);
EXPECT_FALSE(main_it->second.includes[0].conditional);
}
TEST_CASE(FuzzyConditionalTracking) {
auto vfs = llvm::makeIntrusiveRefCnt<TestVFS>();
auto main_path = TestVFS::path("main.cpp");
vfs->add("main.cpp", R"(
#include "always.h"
#ifdef FOO
#include "conditional.h"
#endif
#include "after.h"
)");
vfs->add("always.h");
vfs->add("conditional.h");
vfs->add("after.h");
auto args = std::vector<const char*>{"clang++", "-std=c++20", main_path.c_str()};
auto results = scan_fuzzy(args, TestVFS::root(), {}, nullptr, vfs);
auto main_it = find_by_substr(results, "main.cpp");
ASSERT_TRUE(main_it != results.end());
auto& includes = main_it->second.includes;
ASSERT_EQ(includes.size(), 3u);
EXPECT_FALSE(includes[0].conditional); // always.h
EXPECT_TRUE(includes[1].conditional); // conditional.h
EXPECT_FALSE(includes[2].conditional); // after.h
}
TEST_CASE(FuzzyNotFound) {
auto vfs = llvm::makeIntrusiveRefCnt<TestVFS>();
auto main_path = TestVFS::path("main.cpp");
vfs->add("main.cpp", R"(
#include "exists.h"
#include "missing.h"
#include "also_exists.h"
)");
vfs->add("exists.h");
vfs->add("also_exists.h");
auto args = std::vector<const char*>{"clang++", "-std=c++20", main_path.c_str()};
auto results = scan_fuzzy(args, TestVFS::root(), {}, nullptr, vfs);
auto main_it = find_by_substr(results, "main.cpp");
ASSERT_TRUE(main_it != results.end());
auto& includes = main_it->second.includes;
ASSERT_EQ(includes.size(), 3u);
EXPECT_FALSE(includes[0].not_found); // exists.h
EXPECT_TRUE(includes[1].not_found); // missing.h
EXPECT_FALSE(includes[2].not_found); // also_exists.h
}
TEST_CASE(FuzzyTransitiveIncludes) {
auto vfs = llvm::makeIntrusiveRefCnt<TestVFS>();
auto main_path = TestVFS::path("main.cpp");
vfs->add("main.cpp", R"(
#include "a.h"
)");
vfs->add("a.h", R"(
#pragma once
#include "b.h"
)");
vfs->add("b.h", R"(
#pragma once
int b = 1;
)");
auto args = std::vector<const char*>{"clang++", "-std=c++20", main_path.c_str()};
auto results = scan_fuzzy(args, TestVFS::root(), {}, nullptr, vfs);
// main.cpp includes a.h
auto main_it = find_by_substr(results, "main.cpp");
ASSERT_TRUE(main_it != results.end());
ASSERT_EQ(main_it->second.includes.size(), 1u);
// a.h includes b.h
auto a_it = find_by_substr(results, "a.h");
ASSERT_TRUE(a_it != results.end());
ASSERT_EQ(a_it->second.includes.size(), 1u);
}
TEST_CASE(FuzzyWithCache) {
auto vfs = llvm::makeIntrusiveRefCnt<TestVFS>();
auto main_path = TestVFS::path("main.cpp");
auto other_path = TestVFS::path("other.cpp");
vfs->add("main.cpp", R"(
#include "shared.h"
)");
vfs->add("other.cpp", R"(
#include "shared.h"
)");
vfs->add("shared.h", R"(
#pragma once
int shared = 1;
)");
SharedScanCache cache;
auto args1 = std::vector<const char*>{"clang++", "-std=c++20", main_path.c_str()};
auto results1 = scan_fuzzy(args1, TestVFS::root(), {}, &cache, vfs);
// shared.h should be cached after first scan.
EXPECT_FALSE(cache.entries.empty());
auto args2 = std::vector<const char*>{"clang++", "-std=c++20", other_path.c_str()};
auto results2 = scan_fuzzy(args2, TestVFS::root(), {}, &cache, vfs);
// Both scans should find includes.
ASSERT_TRUE(find_by_substr(results1, "main.cpp") != results1.end());
ASSERT_TRUE(find_by_substr(results2, "other.cpp") != results2.end());
}
TEST_CASE(FuzzyWithContent) {
auto vfs = llvm::makeIntrusiveRefCnt<TestVFS>();
auto main_path = TestVFS::path("main.cpp");
vfs->add("main.cpp");
vfs->add("header.h");
auto args = std::vector<const char*>{"clang++", "-std=c++20", main_path.c_str()};
auto results = scan_fuzzy(args, TestVFS::root(), R"(#include "header.h")", nullptr, vfs);
auto main_it = find_by_substr(results, "main.cpp");
ASSERT_TRUE(main_it != results.end());
ASSERT_EQ(main_it->second.includes.size(), 1u);
EXPECT_FALSE(main_it->second.includes[0].not_found);
}
// === scan_precise() tests ===
TEST_CASE(PreciseBasic) {
auto vfs = llvm::makeIntrusiveRefCnt<TestVFS>();
auto main_path = TestVFS::path("main.cpp");
vfs->add("main.cpp", R"(
#include "header.h"
int main() {}
)");
vfs->add("header.h", R"(
#pragma once
int x = 1;
)");
auto args = std::vector<const char*>{"clang++", "-std=c++20", main_path.c_str()};
auto result = scan_precise(args, TestVFS::root(), {}, nullptr, vfs);
ASSERT_EQ(result.includes.size(), 1u);
EXPECT_FALSE(result.includes[0].not_found);
EXPECT_FALSE(result.includes[0].conditional);
}
TEST_CASE(PreciseConditionalWithDefine) {
auto vfs = llvm::makeIntrusiveRefCnt<TestVFS>();
auto main_path = TestVFS::path("main.cpp");
vfs->add("main.cpp", R"(
#define USE_FOO
#ifdef USE_FOO
#include "foo.h"
#endif
#ifndef USE_FOO
#include "bar.h"
#endif
)");
vfs->add("foo.h");
vfs->add("bar.h");
auto args = std::vector<const char*>{"clang++", "-std=c++20", main_path.c_str()};
auto result = scan_precise(args, TestVFS::root(), {}, nullptr, vfs);
// Precise mode evaluates conditionals: only foo.h should be included.
ASSERT_EQ(result.includes.size(), 1u);
EXPECT_TRUE(result.includes[0].conditional);
EXPECT_TRUE(result.includes[0].path.find("foo.h") != std::string::npos);
}
TEST_CASE(PreciseWithContent) {
auto vfs = llvm::makeIntrusiveRefCnt<TestVFS>();
auto main_path = TestVFS::path("main.cpp");
vfs->add("main.cpp");
vfs->add("header.h");
auto args = std::vector<const char*>{"clang++", "-std=c++20", main_path.c_str()};
auto result = scan_precise(args, TestVFS::root(), R"(#include "header.h")", nullptr, vfs);
ASSERT_EQ(result.includes.size(), 1u);
EXPECT_FALSE(result.includes[0].not_found);
}
}; // TEST_SUITE(Scan)
TEST_SUITE(PreambleBound) {
TEST_CASE(Empty) {
EXPECT_EQ(compute_preamble_bound(""), 0u);
}
TEST_CASE(NoDirectives) {
EXPECT_EQ(compute_preamble_bound("int x = 1;"), 0u);
}
TEST_CASE(SingleInclude) {
llvm::StringRef src = R"(
#include <vector>
int x;
)";
auto bound = compute_preamble_bound(src);
EXPECT_TRUE(bound > 0u);
EXPECT_TRUE(bound <= src.find("int"));
}
TEST_CASE(MultipleDirectives) {
llvm::StringRef src = R"(
#include <vector>
#include <string>
#define FOO 1
int x;
)";
auto bound = compute_preamble_bound(src);
EXPECT_TRUE(bound > src.find("#define"));
}
TEST_CASE(GlobalModuleFragment) {
llvm::StringRef src = R"(
module;
#include <vector>
export module foo;
)";
auto bound = compute_preamble_bound(src);
EXPECT_TRUE(bound > 0u);
EXPECT_TRUE(bound < src.size());
}
TEST_CASE(BoundsVector) {
llvm::StringRef src = R"(
#include <a>
#include <b>
int x;
)";
auto bounds = compute_preamble_bounds(src);
ASSERT_EQ(bounds.size(), 2u);
EXPECT_TRUE(bounds[0] < bounds[1]);
}
TEST_CASE(BoundsWithModuleFragment) {
llvm::StringRef src = R"(
module;
#include <a>
#include <b>
export module foo;
)";
auto bounds = compute_preamble_bounds(src);
// module; + two #include = 3 bounds.
ASSERT_EQ(bounds.size(), 3u);
EXPECT_TRUE(bounds[0] < bounds[1]);
EXPECT_TRUE(bounds[1] < bounds[2]);
}
TEST_CASE(StopsAtCode) {
llvm::StringRef src = R"(
#include <a>
int x;
#include <b>
)";
auto bounds = compute_preamble_bounds(src);
ASSERT_EQ(bounds.size(), 1u);
}
TEST_CASE(ConditionalDirectives) {
llvm::StringRef src = R"(
#ifndef GUARD
#define GUARD
#include <a>
#endif
int x;
)";
auto bound = compute_preamble_bound(src);
EXPECT_TRUE(bound > src.find("#endif"));
}
}; // TEST_SUITE(PreambleBound)
} // namespace
} // namespace clice::testing