Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 1 | //===-- DexTests.cpp ---------------------------------*- C++ -*-----------===// |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | |
Kirill Bobyrev | 19a9461 | 2018-09-06 12:54:43 +0000 | [diff] [blame] | 10 | #include "FuzzyMatch.h" |
| 11 | #include "TestFS.h" |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 12 | #include "TestIndex.h" |
| 13 | #include "index/Index.h" |
| 14 | #include "index/Merge.h" |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 15 | #include "index/dex/Dex.h" |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 16 | #include "index/dex/Iterator.h" |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 17 | #include "index/dex/Token.h" |
| 18 | #include "index/dex/Trigram.h" |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 19 | #include "llvm/Support/ScopedPrinter.h" |
| 20 | #include "llvm/Support/raw_ostream.h" |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 21 | #include "gmock/gmock.h" |
| 22 | #include "gtest/gtest.h" |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 23 | #include <string> |
| 24 | #include <vector> |
| 25 | |
Sam McCall | c92e4f3 | 2018-10-09 10:02:02 +0000 | [diff] [blame] | 26 | using ::testing::AnyOf; |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 27 | using ::testing::ElementsAre; |
| 28 | using ::testing::UnorderedElementsAre; |
| 29 | |
Sam McCall | c008af6 | 2018-10-20 15:30:37 +0000 | [diff] [blame] | 30 | using namespace llvm; |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 31 | namespace clang { |
| 32 | namespace clangd { |
| 33 | namespace dex { |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 34 | namespace { |
Kirill Bobyrev | bea258d | 2018-07-26 10:42:31 +0000 | [diff] [blame] | 35 | |
// URI schemes handed to Dex::build() by the index tests in this file.
std::vector<std::string> URISchemes{"unittest"};
| 37 | |
| 38 | //===----------------------------------------------------------------------===// |
| 39 | // Query iterator tests. |
| 40 | //===----------------------------------------------------------------------===// |
| 41 | |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 42 | std::vector<DocID> consumeIDs(Iterator &It) { |
| 43 | auto IDAndScore = consume(It); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 44 | std::vector<DocID> IDs(IDAndScore.size()); |
| 45 | for (size_t I = 0; I < IDAndScore.size(); ++I) |
| 46 | IDs[I] = IDAndScore[I].first; |
| 47 | return IDs; |
| 48 | } |
| 49 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 50 | TEST(DexIterators, DocumentIterator) { |
Kirill Bobyrev | 249c586 | 2018-09-13 17:11:03 +0000 | [diff] [blame] | 51 | const PostingList L({4, 7, 8, 20, 42, 100}); |
| 52 | auto DocIterator = L.iterator(); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 53 | |
| 54 | EXPECT_EQ(DocIterator->peek(), 4U); |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 55 | EXPECT_FALSE(DocIterator->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 56 | |
| 57 | DocIterator->advance(); |
| 58 | EXPECT_EQ(DocIterator->peek(), 7U); |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 59 | EXPECT_FALSE(DocIterator->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 60 | |
| 61 | DocIterator->advanceTo(20); |
| 62 | EXPECT_EQ(DocIterator->peek(), 20U); |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 63 | EXPECT_FALSE(DocIterator->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 64 | |
| 65 | DocIterator->advanceTo(65); |
| 66 | EXPECT_EQ(DocIterator->peek(), 100U); |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 67 | EXPECT_FALSE(DocIterator->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 68 | |
| 69 | DocIterator->advanceTo(420); |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 70 | EXPECT_TRUE(DocIterator->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 71 | } |
| 72 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 73 | TEST(DexIterators, AndTwoLists) { |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 74 | Corpus C{10000}; |
Kirill Bobyrev | 249c586 | 2018-09-13 17:11:03 +0000 | [diff] [blame] | 75 | const PostingList L0({0, 5, 7, 10, 42, 320, 9000}); |
| 76 | const PostingList L1({0, 4, 7, 10, 30, 60, 320, 9000}); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 77 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 78 | auto And = C.intersect(L1.iterator(), L0.iterator()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 79 | |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 80 | EXPECT_FALSE(And->reachedEnd()); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 81 | EXPECT_THAT(consumeIDs(*And), ElementsAre(0U, 7U, 10U, 320U, 9000U)); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 82 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 83 | And = C.intersect(L0.iterator(), L1.iterator()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 84 | |
| 85 | And->advanceTo(0); |
| 86 | EXPECT_EQ(And->peek(), 0U); |
| 87 | And->advanceTo(5); |
| 88 | EXPECT_EQ(And->peek(), 7U); |
| 89 | And->advanceTo(10); |
| 90 | EXPECT_EQ(And->peek(), 10U); |
| 91 | And->advanceTo(42); |
| 92 | EXPECT_EQ(And->peek(), 320U); |
| 93 | And->advanceTo(8999); |
| 94 | EXPECT_EQ(And->peek(), 9000U); |
| 95 | And->advanceTo(9001); |
| 96 | } |
| 97 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 98 | TEST(DexIterators, AndThreeLists) { |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 99 | Corpus C{10000}; |
Kirill Bobyrev | 249c586 | 2018-09-13 17:11:03 +0000 | [diff] [blame] | 100 | const PostingList L0({0, 5, 7, 10, 42, 320, 9000}); |
| 101 | const PostingList L1({0, 4, 7, 10, 30, 60, 320, 9000}); |
| 102 | const PostingList L2({1, 4, 7, 11, 30, 60, 320, 9000}); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 103 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 104 | auto And = C.intersect(L0.iterator(), L1.iterator(), L2.iterator()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 105 | EXPECT_EQ(And->peek(), 7U); |
| 106 | And->advanceTo(300); |
| 107 | EXPECT_EQ(And->peek(), 320U); |
| 108 | And->advanceTo(100000); |
| 109 | |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 110 | EXPECT_TRUE(And->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 111 | } |
| 112 | |
Sam McCall | 87f69eaf | 2018-10-04 13:12:23 +0000 | [diff] [blame] | 113 | TEST(DexIterators, AndEmpty) { |
| 114 | Corpus C{10000}; |
Sam McCall | a4c17dd | 2018-10-04 16:05:22 +0000 | [diff] [blame] | 115 | const PostingList L1{1}; |
| 116 | const PostingList L2{2}; |
Sam McCall | 87f69eaf | 2018-10-04 13:12:23 +0000 | [diff] [blame] | 117 | // These iterators are empty, but the optimizer can't tell. |
| 118 | auto Empty1 = C.intersect(L1.iterator(), L2.iterator()); |
| 119 | auto Empty2 = C.intersect(L1.iterator(), L2.iterator()); |
| 120 | // And syncs iterators on construction, and used to fail on empty children. |
| 121 | auto And = C.intersect(std::move(Empty1), std::move(Empty2)); |
| 122 | EXPECT_TRUE(And->reachedEnd()); |
| 123 | } |
| 124 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 125 | TEST(DexIterators, OrTwoLists) { |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 126 | Corpus C{10000}; |
Kirill Bobyrev | 249c586 | 2018-09-13 17:11:03 +0000 | [diff] [blame] | 127 | const PostingList L0({0, 5, 7, 10, 42, 320, 9000}); |
| 128 | const PostingList L1({0, 4, 7, 10, 30, 60, 320, 9000}); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 129 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 130 | auto Or = C.unionOf(L0.iterator(), L1.iterator()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 131 | |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 132 | EXPECT_FALSE(Or->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 133 | EXPECT_EQ(Or->peek(), 0U); |
| 134 | Or->advance(); |
| 135 | EXPECT_EQ(Or->peek(), 4U); |
| 136 | Or->advance(); |
| 137 | EXPECT_EQ(Or->peek(), 5U); |
| 138 | Or->advance(); |
| 139 | EXPECT_EQ(Or->peek(), 7U); |
| 140 | Or->advance(); |
| 141 | EXPECT_EQ(Or->peek(), 10U); |
| 142 | Or->advance(); |
| 143 | EXPECT_EQ(Or->peek(), 30U); |
| 144 | Or->advanceTo(42); |
| 145 | EXPECT_EQ(Or->peek(), 42U); |
| 146 | Or->advanceTo(300); |
| 147 | EXPECT_EQ(Or->peek(), 320U); |
| 148 | Or->advanceTo(9000); |
| 149 | EXPECT_EQ(Or->peek(), 9000U); |
| 150 | Or->advanceTo(9001); |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 151 | EXPECT_TRUE(Or->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 152 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 153 | Or = C.unionOf(L0.iterator(), L1.iterator()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 154 | |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 155 | EXPECT_THAT(consumeIDs(*Or), |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 156 | ElementsAre(0U, 4U, 5U, 7U, 10U, 30U, 42U, 60U, 320U, 9000U)); |
| 157 | } |
| 158 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 159 | TEST(DexIterators, OrThreeLists) { |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 160 | Corpus C{10000}; |
Kirill Bobyrev | 249c586 | 2018-09-13 17:11:03 +0000 | [diff] [blame] | 161 | const PostingList L0({0, 5, 7, 10, 42, 320, 9000}); |
| 162 | const PostingList L1({0, 4, 7, 10, 30, 60, 320, 9000}); |
| 163 | const PostingList L2({1, 4, 7, 11, 30, 60, 320, 9000}); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 164 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 165 | auto Or = C.unionOf(L0.iterator(), L1.iterator(), L2.iterator()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 166 | |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 167 | EXPECT_FALSE(Or->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 168 | EXPECT_EQ(Or->peek(), 0U); |
| 169 | |
| 170 | Or->advance(); |
| 171 | EXPECT_EQ(Or->peek(), 1U); |
| 172 | |
| 173 | Or->advance(); |
| 174 | EXPECT_EQ(Or->peek(), 4U); |
| 175 | |
| 176 | Or->advanceTo(7); |
| 177 | |
| 178 | Or->advanceTo(59); |
| 179 | EXPECT_EQ(Or->peek(), 60U); |
| 180 | |
| 181 | Or->advanceTo(9001); |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 182 | EXPECT_TRUE(Or->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 183 | } |
| 184 | |
| 185 | // FIXME(kbobyrev): The testcase below is similar to what is expected in real |
| 186 | // queries. It should be updated once new iterators (such as boosting, limiting, |
| 187 | // etc iterators) appear. However, it is not exhaustive and it would be |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 188 | // beneficial to implement automatic generation (e.g. fuzzing) of query trees |
| 189 | // for more comprehensive testing. |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 190 | TEST(DexIterators, QueryTree) { |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 191 | // |
| 192 | // +-----------------+ |
| 193 | // |And Iterator:1, 5| |
| 194 | // +--------+--------+ |
| 195 | // | |
| 196 | // | |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 197 | // +-------------+----------------------+ |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 198 | // | | |
| 199 | // | | |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 200 | // +----------v----------+ +----------v------------+ |
| 201 | // |And Iterator: 1, 5, 9| |Or Iterator: 0, 1, 3, 5| |
| 202 | // +----------+----------+ +----------+------------+ |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 203 | // | | |
Kirill Bobyrev | 6c2f5bd | 2018-09-25 11:54:51 +0000 | [diff] [blame] | 204 | // +------+-----+ ------------+ |
| 205 | // | | | | |
| 206 | // +-------v-----+ +----+---+ +---v----+ +----v---+ |
| 207 | // |1, 3, 5, 8, 9| |Boost: 2| |Boost: 3| |Boost: 4| |
| 208 | // +-------------+ +----+---+ +---+----+ +----+---+ |
| 209 | // | | | |
| 210 | // +----v-----+ +-v--+ +---v---+ |
| 211 | // |1, 5, 7, 9| |1, 5| |0, 3, 5| |
| 212 | // +----------+ +----+ +-------+ |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 213 | // |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 214 | Corpus C{10}; |
Kirill Bobyrev | 249c586 | 2018-09-13 17:11:03 +0000 | [diff] [blame] | 215 | const PostingList L0({1, 3, 5, 8, 9}); |
| 216 | const PostingList L1({1, 5, 7, 9}); |
Kirill Bobyrev | 6c2f5bd | 2018-09-25 11:54:51 +0000 | [diff] [blame] | 217 | const PostingList L2({1, 5}); |
| 218 | const PostingList L3({0, 3, 5}); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 219 | |
| 220 | // Root of the query tree: [1, 5] |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 221 | auto Root = C.intersect( |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 222 | // Lower And Iterator: [1, 5, 9] |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 223 | C.intersect(L0.iterator(), C.boost(L1.iterator(), 2U)), |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 224 | // Lower Or Iterator: [0, 1, 5] |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 225 | C.unionOf(C.boost(L2.iterator(), 3U), C.boost(L3.iterator(), 4U))); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 226 | |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 227 | EXPECT_FALSE(Root->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 228 | EXPECT_EQ(Root->peek(), 1U); |
| 229 | Root->advanceTo(0); |
| 230 | // Advance multiple times. Shouldn't do anything. |
| 231 | Root->advanceTo(1); |
| 232 | Root->advanceTo(0); |
| 233 | EXPECT_EQ(Root->peek(), 1U); |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 234 | auto ElementBoost = Root->consume(); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 235 | EXPECT_THAT(ElementBoost, 6); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 236 | Root->advance(); |
| 237 | EXPECT_EQ(Root->peek(), 5U); |
| 238 | Root->advanceTo(5); |
| 239 | EXPECT_EQ(Root->peek(), 5U); |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 240 | ElementBoost = Root->consume(); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 241 | EXPECT_THAT(ElementBoost, 8); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 242 | Root->advanceTo(9000); |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 243 | EXPECT_TRUE(Root->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 244 | } |
| 245 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 246 | TEST(DexIterators, StringRepresentation) { |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 247 | Corpus C{10}; |
Sam McCall | 7402836 | 2018-10-02 11:51:36 +0000 | [diff] [blame] | 248 | const PostingList L1({1, 3, 5}); |
| 249 | const PostingList L2({1, 7, 9}); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 250 | |
Sam McCall | 7402836 | 2018-10-02 11:51:36 +0000 | [diff] [blame] | 251 | // No token given, prints full posting list. |
| 252 | auto I1 = L1.iterator(); |
Sam McCall | c008af6 | 2018-10-20 15:30:37 +0000 | [diff] [blame] | 253 | EXPECT_EQ(to_string(*I1), "[1 3 5]"); |
Sam McCall | 7402836 | 2018-10-02 11:51:36 +0000 | [diff] [blame] | 254 | |
| 255 | // Token given, uses token's string representation. |
| 256 | Token Tok(Token::Kind::Trigram, "L2"); |
| 257 | auto I2 = L1.iterator(&Tok); |
Sam McCall | c008af6 | 2018-10-20 15:30:37 +0000 | [diff] [blame] | 258 | EXPECT_EQ(to_string(*I2), "T=L2"); |
Sam McCall | 7402836 | 2018-10-02 11:51:36 +0000 | [diff] [blame] | 259 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 260 | auto Tree = C.limit(C.intersect(move(I1), move(I2)), 10); |
Sam McCall | c92e4f3 | 2018-10-09 10:02:02 +0000 | [diff] [blame] | 261 | // AND reorders its children, we don't care which order it prints. |
Sam McCall | c008af6 | 2018-10-20 15:30:37 +0000 | [diff] [blame] | 262 | EXPECT_THAT(to_string(*Tree), AnyOf("(LIMIT 10 (& [1 3 5] T=L2))", |
| 263 | "(LIMIT 10 (& T=L2 [1 3 5]))")); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 264 | } |
| 265 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 266 | TEST(DexIterators, Limit) { |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 267 | Corpus C{10000}; |
Kirill Bobyrev | 249c586 | 2018-09-13 17:11:03 +0000 | [diff] [blame] | 268 | const PostingList L0({3, 6, 7, 20, 42, 100}); |
| 269 | const PostingList L1({1, 3, 5, 6, 7, 30, 100}); |
| 270 | const PostingList L2({0, 3, 5, 7, 8, 100}); |
Kirill Bobyrev | 0a75766 | 2018-08-10 11:50:44 +0000 | [diff] [blame] | 271 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 272 | auto DocIterator = C.limit(L0.iterator(), 42); |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 273 | EXPECT_THAT(consumeIDs(*DocIterator), ElementsAre(3, 6, 7, 20, 42, 100)); |
Kirill Bobyrev | 0a75766 | 2018-08-10 11:50:44 +0000 | [diff] [blame] | 274 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 275 | DocIterator = C.limit(L0.iterator(), 3); |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 276 | EXPECT_THAT(consumeIDs(*DocIterator), ElementsAre(3, 6, 7)); |
Kirill Bobyrev | 0a75766 | 2018-08-10 11:50:44 +0000 | [diff] [blame] | 277 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 278 | DocIterator = C.limit(L0.iterator(), 0); |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 279 | EXPECT_THAT(consumeIDs(*DocIterator), ElementsAre()); |
Kirill Bobyrev | 0a75766 | 2018-08-10 11:50:44 +0000 | [diff] [blame] | 280 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 281 | auto AndIterator = |
| 282 | C.intersect(C.limit(C.all(), 343), C.limit(L0.iterator(), 2), |
| 283 | C.limit(L1.iterator(), 3), C.limit(L2.iterator(), 42)); |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 284 | EXPECT_THAT(consumeIDs(*AndIterator), ElementsAre(3, 7)); |
Kirill Bobyrev | 0a75766 | 2018-08-10 11:50:44 +0000 | [diff] [blame] | 285 | } |
| 286 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 287 | TEST(DexIterators, True) { |
Sam McCall | 87f69eaf | 2018-10-04 13:12:23 +0000 | [diff] [blame] | 288 | EXPECT_TRUE(Corpus{0}.all()->reachedEnd()); |
| 289 | EXPECT_THAT(consumeIDs(*Corpus{4}.all()), ElementsAre(0, 1, 2, 3)); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 290 | } |
| 291 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 292 | TEST(DexIterators, Boost) { |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 293 | Corpus C{5}; |
| 294 | auto BoostIterator = C.boost(C.all(), 42U); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 295 | EXPECT_FALSE(BoostIterator->reachedEnd()); |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 296 | auto ElementBoost = BoostIterator->consume(); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 297 | EXPECT_THAT(ElementBoost, 42U); |
| 298 | |
Kirill Bobyrev | 249c586 | 2018-09-13 17:11:03 +0000 | [diff] [blame] | 299 | const PostingList L0({2, 4}); |
| 300 | const PostingList L1({1, 4}); |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 301 | auto Root = C.unionOf(C.all(), C.boost(L0.iterator(), 2U), |
| 302 | C.boost(L1.iterator(), 3U)); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 303 | |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 304 | ElementBoost = Root->consume(); |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 305 | EXPECT_THAT(ElementBoost, 1); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 306 | Root->advance(); |
| 307 | EXPECT_THAT(Root->peek(), 1U); |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 308 | ElementBoost = Root->consume(); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 309 | EXPECT_THAT(ElementBoost, 3); |
| 310 | |
| 311 | Root->advance(); |
| 312 | EXPECT_THAT(Root->peek(), 2U); |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 313 | ElementBoost = Root->consume(); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 314 | EXPECT_THAT(ElementBoost, 2); |
| 315 | |
| 316 | Root->advanceTo(4); |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 317 | ElementBoost = Root->consume(); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 318 | EXPECT_THAT(ElementBoost, 3); |
Kirill Bobyrev | 30ffdf4 | 2018-08-20 08:47:30 +0000 | [diff] [blame] | 319 | } |
| 320 | |
Sam McCall | 87f69eaf | 2018-10-04 13:12:23 +0000 | [diff] [blame] | 321 | TEST(DexIterators, Optimizations) { |
| 322 | Corpus C{5}; |
Jonas Toth | 0451440 | 2018-10-04 16:29:58 +0000 | [diff] [blame] | 323 | const PostingList L1{1}; |
| 324 | const PostingList L2{2}; |
| 325 | const PostingList L3{3}; |
Sam McCall | 87f69eaf | 2018-10-04 13:12:23 +0000 | [diff] [blame] | 326 | |
| 327 | // empty and/or yield true/false |
Sam McCall | c008af6 | 2018-10-20 15:30:37 +0000 | [diff] [blame] | 328 | EXPECT_EQ(to_string(*C.intersect()), "true"); |
| 329 | EXPECT_EQ(to_string(*C.unionOf()), "false"); |
Sam McCall | 87f69eaf | 2018-10-04 13:12:23 +0000 | [diff] [blame] | 330 | |
| 331 | // true/false inside and/or short-circuit |
Sam McCall | c008af6 | 2018-10-20 15:30:37 +0000 | [diff] [blame] | 332 | EXPECT_EQ(to_string(*C.intersect(L1.iterator(), C.all())), "[1]"); |
| 333 | EXPECT_EQ(to_string(*C.intersect(L1.iterator(), C.none())), "false"); |
Sam McCall | 87f69eaf | 2018-10-04 13:12:23 +0000 | [diff] [blame] | 334 | // Not optimized to avoid breaking boosts. |
Sam McCall | c008af6 | 2018-10-20 15:30:37 +0000 | [diff] [blame] | 335 | EXPECT_EQ(to_string(*C.unionOf(L1.iterator(), C.all())), "(| [1] true)"); |
| 336 | EXPECT_EQ(to_string(*C.unionOf(L1.iterator(), C.none())), "[1]"); |
Sam McCall | 87f69eaf | 2018-10-04 13:12:23 +0000 | [diff] [blame] | 337 | |
| 338 | // and/or nested inside and/or are flattened |
Sam McCall | c008af6 | 2018-10-20 15:30:37 +0000 | [diff] [blame] | 339 | EXPECT_EQ(to_string(*C.intersect(L1.iterator(), |
| 340 | C.intersect(L1.iterator(), L1.iterator()))), |
Sam McCall | 87f69eaf | 2018-10-04 13:12:23 +0000 | [diff] [blame] | 341 | "(& [1] [1] [1])"); |
Sam McCall | c008af6 | 2018-10-20 15:30:37 +0000 | [diff] [blame] | 342 | EXPECT_EQ(to_string(*C.unionOf(L1.iterator(), |
| 343 | C.unionOf(L2.iterator(), L3.iterator()))), |
Sam McCall | 87f69eaf | 2018-10-04 13:12:23 +0000 | [diff] [blame] | 344 | "(| [1] [2] [3])"); |
| 345 | |
| 346 | // optimizations combine over multiple levels |
Sam McCall | c008af6 | 2018-10-20 15:30:37 +0000 | [diff] [blame] | 347 | EXPECT_EQ(to_string(*C.intersect(C.intersect(L1.iterator(), C.intersect()), |
| 348 | C.unionOf(C.all()))), |
Sam McCall | 87f69eaf | 2018-10-04 13:12:23 +0000 | [diff] [blame] | 349 | "[1]"); |
| 350 | } |
| 351 | |
Kirill Bobyrev | 19a9461 | 2018-09-06 12:54:43 +0000 | [diff] [blame] | 352 | //===----------------------------------------------------------------------===// |
| 353 | // Search token tests. |
| 354 | //===----------------------------------------------------------------------===// |
| 355 | |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 356 | testing::Matcher<std::vector<Token>> |
Kirill Bobyrev | 19a9461 | 2018-09-06 12:54:43 +0000 | [diff] [blame] | 357 | tokensAre(std::initializer_list<std::string> Strings, Token::Kind Kind) { |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 358 | std::vector<Token> Tokens; |
Kirill Bobyrev | 19a9461 | 2018-09-06 12:54:43 +0000 | [diff] [blame] | 359 | for (const auto &TokenData : Strings) { |
| 360 | Tokens.push_back(Token(Kind, TokenData)); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 361 | } |
| 362 | return testing::UnorderedElementsAreArray(Tokens); |
| 363 | } |
| 364 | |
Kirill Bobyrev | 19a9461 | 2018-09-06 12:54:43 +0000 | [diff] [blame] | 365 | testing::Matcher<std::vector<Token>> |
| 366 | trigramsAre(std::initializer_list<std::string> Trigrams) { |
| 367 | return tokensAre(Trigrams, Token::Kind::Trigram); |
| 368 | } |
| 369 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 370 | TEST(DexTrigrams, IdentifierTrigrams) { |
Kirill Bobyrev | ff2dd90 | 2018-08-13 08:57:06 +0000 | [diff] [blame] | 371 | EXPECT_THAT(generateIdentifierTrigrams("X86"), |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 372 | trigramsAre({"x86", "x", "x8"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 373 | |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 374 | EXPECT_THAT(generateIdentifierTrigrams("nl"), trigramsAre({"nl", "n"})); |
Kirill Bobyrev | ff2dd90 | 2018-08-13 08:57:06 +0000 | [diff] [blame] | 375 | |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 376 | EXPECT_THAT(generateIdentifierTrigrams("n"), trigramsAre({"n"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 377 | |
| 378 | EXPECT_THAT(generateIdentifierTrigrams("clangd"), |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 379 | trigramsAre({"c", "cl", "cla", "lan", "ang", "ngd"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 380 | |
| 381 | EXPECT_THAT(generateIdentifierTrigrams("abc_def"), |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 382 | trigramsAre({"a", "ab", "ad", "abc", "abd", "ade", "bcd", "bde", |
| 383 | "cde", "def"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 384 | |
Kirill Bobyrev | ff2dd90 | 2018-08-13 08:57:06 +0000 | [diff] [blame] | 385 | EXPECT_THAT(generateIdentifierTrigrams("a_b_c_d_e_"), |
Sam McCall | 2ec5a10 | 2018-10-04 14:08:11 +0000 | [diff] [blame] | 386 | trigramsAre({"a", "a_", "ab", "abc", "bcd", "cde"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 387 | |
Kirill Bobyrev | ff2dd90 | 2018-08-13 08:57:06 +0000 | [diff] [blame] | 388 | EXPECT_THAT(generateIdentifierTrigrams("unique_ptr"), |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 389 | trigramsAre({"u", "un", "up", "uni", "unp", "upt", "niq", "nip", |
| 390 | "npt", "iqu", "iqp", "ipt", "que", "qup", "qpt", |
| 391 | "uep", "ept", "ptr"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 392 | |
Kirill Bobyrev | e6d5fd8 | 2018-08-27 17:26:43 +0000 | [diff] [blame] | 393 | EXPECT_THAT( |
| 394 | generateIdentifierTrigrams("TUDecl"), |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 395 | trigramsAre({"t", "tu", "td", "tud", "tde", "ude", "dec", "ecl"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 396 | |
| 397 | EXPECT_THAT(generateIdentifierTrigrams("IsOK"), |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 398 | trigramsAre({"i", "is", "io", "iso", "iok", "sok"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 399 | |
Kirill Bobyrev | ff2dd90 | 2018-08-13 08:57:06 +0000 | [diff] [blame] | 400 | EXPECT_THAT( |
| 401 | generateIdentifierTrigrams("abc_defGhij__klm"), |
Sam McCall | 2ec5a10 | 2018-10-04 14:08:11 +0000 | [diff] [blame] | 402 | trigramsAre({"a", "ab", "ad", "abc", "abd", "ade", "adg", "bcd", |
| 403 | "bde", "bdg", "cde", "cdg", "def", "deg", "dgh", "dgk", |
| 404 | "efg", "egh", "egk", "fgh", "fgk", "ghi", "ghk", "gkl", |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 405 | "hij", "hik", "hkl", "ijk", "ikl", "jkl", "klm"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 406 | } |
| 407 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 408 | TEST(DexTrigrams, QueryTrigrams) { |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 409 | EXPECT_THAT(generateQueryTrigrams("c"), trigramsAre({"c"})); |
| 410 | EXPECT_THAT(generateQueryTrigrams("cl"), trigramsAre({"cl"})); |
Kirill Bobyrev | ff2dd90 | 2018-08-13 08:57:06 +0000 | [diff] [blame] | 411 | EXPECT_THAT(generateQueryTrigrams("cla"), trigramsAre({"cla"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 412 | |
Sam McCall | 50b89f0 | 2018-10-04 17:18:55 +0000 | [diff] [blame] | 413 | EXPECT_THAT(generateQueryTrigrams(""), trigramsAre({})); |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 414 | EXPECT_THAT(generateQueryTrigrams("_"), trigramsAre({"_"})); |
| 415 | EXPECT_THAT(generateQueryTrigrams("__"), trigramsAre({"__"})); |
| 416 | EXPECT_THAT(generateQueryTrigrams("___"), trigramsAre({})); |
Kirill Bobyrev | ff2dd90 | 2018-08-13 08:57:06 +0000 | [diff] [blame] | 417 | |
| 418 | EXPECT_THAT(generateQueryTrigrams("X86"), trigramsAre({"x86"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 419 | |
| 420 | EXPECT_THAT(generateQueryTrigrams("clangd"), |
| 421 | trigramsAre({"cla", "lan", "ang", "ngd"})); |
| 422 | |
| 423 | EXPECT_THAT(generateQueryTrigrams("abc_def"), |
| 424 | trigramsAre({"abc", "bcd", "cde", "def"})); |
| 425 | |
| 426 | EXPECT_THAT(generateQueryTrigrams("a_b_c_d_e_"), |
| 427 | trigramsAre({"abc", "bcd", "cde"})); |
| 428 | |
| 429 | EXPECT_THAT(generateQueryTrigrams("unique_ptr"), |
| 430 | trigramsAre({"uni", "niq", "iqu", "que", "uep", "ept", "ptr"})); |
| 431 | |
| 432 | EXPECT_THAT(generateQueryTrigrams("TUDecl"), |
| 433 | trigramsAre({"tud", "ude", "dec", "ecl"})); |
| 434 | |
| 435 | EXPECT_THAT(generateQueryTrigrams("IsOK"), trigramsAre({"iso", "sok"})); |
| 436 | |
| 437 | EXPECT_THAT(generateQueryTrigrams("abc_defGhij__klm"), |
| 438 | trigramsAre({"abc", "bcd", "cde", "def", "efg", "fgh", "ghi", |
| 439 | "hij", "ijk", "jkl", "klm"})); |
| 440 | } |
| 441 | |
Kirill Bobyrev | 19a9461 | 2018-09-06 12:54:43 +0000 | [diff] [blame] | 442 | TEST(DexSearchTokens, SymbolPath) { |
| 443 | EXPECT_THAT(generateProximityURIs( |
| 444 | "unittest:///clang-tools-extra/clangd/index/Token.h"), |
| 445 | ElementsAre("unittest:///clang-tools-extra/clangd/index/Token.h", |
| 446 | "unittest:///clang-tools-extra/clangd/index", |
| 447 | "unittest:///clang-tools-extra/clangd", |
| 448 | "unittest:///clang-tools-extra", "unittest:///")); |
| 449 | |
| 450 | EXPECT_THAT(generateProximityURIs("unittest:///a/b/c.h"), |
| 451 | ElementsAre("unittest:///a/b/c.h", "unittest:///a/b", |
| 452 | "unittest:///a", "unittest:///")); |
| 453 | } |
| 454 | |
| 455 | //===----------------------------------------------------------------------===// |
| 456 | // Index tests. |
| 457 | //===----------------------------------------------------------------------===// |
| 458 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 459 | TEST(Dex, Lookup) { |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 460 | auto I = Dex::build(generateSymbols({"ns::abc", "ns::xyz"}), RefSlab(), |
| 461 | URISchemes); |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 462 | EXPECT_THAT(lookup(*I, SymbolID("ns::abc")), UnorderedElementsAre("ns::abc")); |
| 463 | EXPECT_THAT(lookup(*I, {SymbolID("ns::abc"), SymbolID("ns::xyz")}), |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 464 | UnorderedElementsAre("ns::abc", "ns::xyz")); |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 465 | EXPECT_THAT(lookup(*I, {SymbolID("ns::nonono"), SymbolID("ns::xyz")}), |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 466 | UnorderedElementsAre("ns::xyz")); |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 467 | EXPECT_THAT(lookup(*I, SymbolID("ns::nonono")), UnorderedElementsAre()); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 468 | } |
| 469 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 470 | TEST(Dex, FuzzyFind) { |
Kirill Bobyrev | 249c586 | 2018-09-13 17:11:03 +0000 | [diff] [blame] | 471 | auto Index = |
| 472 | Dex::build(generateSymbols({"ns::ABC", "ns::BCD", "::ABC", |
| 473 | "ns::nested::ABC", "other::ABC", "other::A"}), |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 474 | RefSlab(), URISchemes); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 475 | FuzzyFindRequest Req; |
| 476 | Req.Query = "ABC"; |
| 477 | Req.Scopes = {"ns::"}; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 478 | EXPECT_THAT(match(*Index, Req), UnorderedElementsAre("ns::ABC")); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 479 | Req.Scopes = {"ns::", "ns::nested::"}; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 480 | EXPECT_THAT(match(*Index, Req), |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 481 | UnorderedElementsAre("ns::ABC", "ns::nested::ABC")); |
| 482 | Req.Query = "A"; |
| 483 | Req.Scopes = {"other::"}; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 484 | EXPECT_THAT(match(*Index, Req), |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 485 | UnorderedElementsAre("other::A", "other::ABC")); |
| 486 | Req.Query = ""; |
| 487 | Req.Scopes = {}; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 488 | EXPECT_THAT(match(*Index, Req), |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 489 | UnorderedElementsAre("ns::ABC", "ns::BCD", "::ABC", |
| 490 | "ns::nested::ABC", "other::ABC", |
| 491 | "other::A")); |
| 492 | } |
| 493 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 494 | TEST(DexTest, DexDeduplicate) { |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 495 | std::vector<Symbol> Symbols = {symbol("1"), symbol("2"), symbol("3"), |
| 496 | symbol("2") /* duplicate */}; |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 497 | FuzzyFindRequest Req; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 498 | Req.Query = "2"; |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 499 | Dex I(Symbols, RefSlab(), URISchemes); |
Sam McCall | 96f2489 | 2018-10-16 08:53:52 +0000 | [diff] [blame] | 500 | EXPECT_THAT(match(I, Req), ElementsAre("2")); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 501 | } |
| 502 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 503 | TEST(DexTest, DexLimitedNumMatches) { |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 504 | auto I = Dex::build(generateNumSymbols(0, 100), RefSlab(), URISchemes); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 505 | FuzzyFindRequest Req; |
| 506 | Req.Query = "5"; |
Kirill Bobyrev | e6dd080 | 2018-09-13 14:27:03 +0000 | [diff] [blame] | 507 | Req.Limit = 3; |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 508 | bool Incomplete; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 509 | auto Matches = match(*I, Req, &Incomplete); |
Kirill Bobyrev | e6dd080 | 2018-09-13 14:27:03 +0000 | [diff] [blame] | 510 | EXPECT_TRUE(Req.Limit); |
| 511 | EXPECT_EQ(Matches.size(), *Req.Limit); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 512 | EXPECT_TRUE(Incomplete); |
| 513 | } |
| 514 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 515 | TEST(DexTest, FuzzyMatch) { |
| 516 | auto I = Dex::build( |
Kirill Bobyrev | 19a9461 | 2018-09-06 12:54:43 +0000 | [diff] [blame] | 517 | generateSymbols({"LaughingOutLoud", "LionPopulation", "LittleOldLady"}), |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 518 | RefSlab(), URISchemes); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 519 | FuzzyFindRequest Req; |
| 520 | Req.Query = "lol"; |
Kirill Bobyrev | e6dd080 | 2018-09-13 14:27:03 +0000 | [diff] [blame] | 521 | Req.Limit = 2; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 522 | EXPECT_THAT(match(*I, Req), |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 523 | UnorderedElementsAre("LaughingOutLoud", "LittleOldLady")); |
| 524 | } |
| 525 | |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 526 | TEST(DexTest, ShortQuery) { |
| 527 | auto I = |
| 528 | Dex::build(generateSymbols({"OneTwoThreeFour"}), RefSlab(), URISchemes); |
| 529 | FuzzyFindRequest Req; |
| 530 | bool Incomplete; |
| 531 | |
| 532 | EXPECT_THAT(match(*I, Req, &Incomplete), ElementsAre("OneTwoThreeFour")); |
| 533 | EXPECT_FALSE(Incomplete) << "Empty string is not a short query"; |
| 534 | |
| 535 | Req.Query = "t"; |
| 536 | EXPECT_THAT(match(*I, Req, &Incomplete), ElementsAre()); |
| 537 | EXPECT_TRUE(Incomplete) << "Short queries have different semantics"; |
| 538 | |
| 539 | Req.Query = "tt"; |
| 540 | EXPECT_THAT(match(*I, Req, &Incomplete), ElementsAre()); |
| 541 | EXPECT_TRUE(Incomplete) << "Short queries have different semantics"; |
| 542 | |
| 543 | Req.Query = "ttf"; |
| 544 | EXPECT_THAT(match(*I, Req, &Incomplete), ElementsAre("OneTwoThreeFour")); |
| 545 | EXPECT_FALSE(Incomplete) << "3-char string is not a short query"; |
| 546 | } |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 547 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 548 | TEST(DexTest, MatchQualifiedNamesWithoutSpecificScope) { |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 549 | auto I = Dex::build(generateSymbols({"a::y1", "b::y2", "y3"}), RefSlab(), |
| 550 | URISchemes); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 551 | FuzzyFindRequest Req; |
| 552 | Req.Query = "y"; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 553 | EXPECT_THAT(match(*I, Req), UnorderedElementsAre("a::y1", "b::y2", "y3")); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 554 | } |
| 555 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 556 | TEST(DexTest, MatchQualifiedNamesWithGlobalScope) { |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 557 | auto I = Dex::build(generateSymbols({"a::y1", "b::y2", "y3"}), RefSlab(), |
| 558 | URISchemes); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 559 | FuzzyFindRequest Req; |
| 560 | Req.Query = "y"; |
| 561 | Req.Scopes = {""}; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 562 | EXPECT_THAT(match(*I, Req), UnorderedElementsAre("y3")); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 563 | } |
| 564 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 565 | TEST(DexTest, MatchQualifiedNamesWithOneScope) { |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 566 | auto I = |
| 567 | Dex::build(generateSymbols({"a::y1", "a::y2", "a::x", "b::y2", "y3"}), |
| 568 | RefSlab(), URISchemes); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 569 | FuzzyFindRequest Req; |
| 570 | Req.Query = "y"; |
| 571 | Req.Scopes = {"a::"}; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 572 | EXPECT_THAT(match(*I, Req), UnorderedElementsAre("a::y1", "a::y2")); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 573 | } |
| 574 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 575 | TEST(DexTest, MatchQualifiedNamesWithMultipleScopes) { |
| 576 | auto I = Dex::build( |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 577 | generateSymbols({"a::y1", "a::y2", "a::x", "b::y3", "y3"}), RefSlab(), URISchemes); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 578 | FuzzyFindRequest Req; |
| 579 | Req.Query = "y"; |
| 580 | Req.Scopes = {"a::", "b::"}; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 581 | EXPECT_THAT(match(*I, Req), UnorderedElementsAre("a::y1", "a::y2", "b::y3")); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 582 | } |
| 583 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 584 | TEST(DexTest, NoMatchNestedScopes) { |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 585 | auto I = Dex::build(generateSymbols({"a::y1", "a::b::y2"}), RefSlab(), URISchemes); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 586 | FuzzyFindRequest Req; |
| 587 | Req.Query = "y"; |
| 588 | Req.Scopes = {"a::"}; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 589 | EXPECT_THAT(match(*I, Req), UnorderedElementsAre("a::y1")); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 590 | } |
| 591 | |
Eric Liu | 670c147 | 2018-09-27 18:46:00 +0000 | [diff] [blame] | 592 | TEST(DexTest, WildcardScope) { |
| 593 | auto I = |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 594 | Dex::build(generateSymbols({"a::y1", "a::b::y2", "c::y3"}), RefSlab(), URISchemes); |
Eric Liu | 670c147 | 2018-09-27 18:46:00 +0000 | [diff] [blame] | 595 | FuzzyFindRequest Req; |
| 596 | Req.Query = "y"; |
| 597 | Req.Scopes = {"a::"}; |
| 598 | Req.AnyScope = true; |
| 599 | EXPECT_THAT(match(*I, Req), |
| 600 | UnorderedElementsAre("a::y1", "a::b::y2", "c::y3")); |
| 601 | } |
| 602 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 603 | TEST(DexTest, IgnoreCases) { |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 604 | auto I = Dex::build(generateSymbols({"ns::ABC", "ns::abc"}), RefSlab(), URISchemes); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 605 | FuzzyFindRequest Req; |
| 606 | Req.Query = "AB"; |
| 607 | Req.Scopes = {"ns::"}; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 608 | EXPECT_THAT(match(*I, Req), UnorderedElementsAre("ns::ABC", "ns::abc")); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 609 | } |
| 610 | |
Sam McCall | 50b89f0 | 2018-10-04 17:18:55 +0000 | [diff] [blame] | 611 | TEST(DexTest, UnknownPostingList) { |
| 612 | // Regression test: we used to ignore unknown scopes and accept any symbol. |
| 613 | auto I = Dex::build(generateSymbols({"ns::ABC", "ns::abc"}), RefSlab(), |
| 614 | URISchemes); |
| 615 | FuzzyFindRequest Req; |
| 616 | Req.Scopes = {"ns2::"}; |
| 617 | EXPECT_THAT(match(*I, Req), UnorderedElementsAre()); |
| 618 | } |
| 619 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 620 | TEST(DexTest, Lookup) { |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 621 | auto I = Dex::build(generateSymbols({"ns::abc", "ns::xyz"}), RefSlab(), URISchemes); |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 622 | EXPECT_THAT(lookup(*I, SymbolID("ns::abc")), UnorderedElementsAre("ns::abc")); |
| 623 | EXPECT_THAT(lookup(*I, {SymbolID("ns::abc"), SymbolID("ns::xyz")}), |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 624 | UnorderedElementsAre("ns::abc", "ns::xyz")); |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 625 | EXPECT_THAT(lookup(*I, {SymbolID("ns::nonono"), SymbolID("ns::xyz")}), |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 626 | UnorderedElementsAre("ns::xyz")); |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 627 | EXPECT_THAT(lookup(*I, SymbolID("ns::nonono")), UnorderedElementsAre()); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 628 | } |
| 629 | |
Kirill Bobyrev | 94af061 | 2018-09-24 08:45:18 +0000 | [diff] [blame] | 630 | TEST(DexTest, SymbolIndexOptionsFilter) { |
| 631 | auto CodeCompletionSymbol = symbol("Completion"); |
| 632 | auto NonCodeCompletionSymbol = symbol("NoCompletion"); |
| 633 | CodeCompletionSymbol.Flags = Symbol::SymbolFlag::IndexedForCodeCompletion; |
| 634 | NonCodeCompletionSymbol.Flags = Symbol::SymbolFlag::None; |
| 635 | std::vector<Symbol> Symbols{CodeCompletionSymbol, NonCodeCompletionSymbol}; |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 636 | Dex I(Symbols, RefSlab(), URISchemes); |
Kirill Bobyrev | 94af061 | 2018-09-24 08:45:18 +0000 | [diff] [blame] | 637 | FuzzyFindRequest Req; |
| 638 | Req.RestrictForCodeCompletion = false; |
| 639 | EXPECT_THAT(match(I, Req), ElementsAre("Completion", "NoCompletion")); |
| 640 | Req.RestrictForCodeCompletion = true; |
| 641 | EXPECT_THAT(match(I, Req), ElementsAre("Completion")); |
| 642 | } |
| 643 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 644 | TEST(DexTest, ProximityPathsBoosting) { |
Kirill Bobyrev | 19a9461 | 2018-09-06 12:54:43 +0000 | [diff] [blame] | 645 | auto RootSymbol = symbol("root::abc"); |
| 646 | RootSymbol.CanonicalDeclaration.FileURI = "unittest:///file.h"; |
| 647 | auto CloseSymbol = symbol("close::abc"); |
| 648 | CloseSymbol.CanonicalDeclaration.FileURI = "unittest:///a/b/c/d/e/f/file.h"; |
| 649 | |
| 650 | std::vector<Symbol> Symbols{CloseSymbol, RootSymbol}; |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 651 | Dex I(Symbols, RefSlab(), URISchemes); |
Kirill Bobyrev | 19a9461 | 2018-09-06 12:54:43 +0000 | [diff] [blame] | 652 | |
| 653 | FuzzyFindRequest Req; |
| 654 | Req.Query = "abc"; |
| 655 | // The best candidate can change depending on the proximity paths. |
Kirill Bobyrev | e6dd080 | 2018-09-13 14:27:03 +0000 | [diff] [blame] | 656 | Req.Limit = 1; |
Kirill Bobyrev | 19a9461 | 2018-09-06 12:54:43 +0000 | [diff] [blame] | 657 | |
| 658 | // FuzzyFind request comes from the file which is far from the root: expect |
| 659 | // CloseSymbol to come out. |
| 660 | Req.ProximityPaths = {testPath("a/b/c/d/e/f/file.h")}; |
| 661 | EXPECT_THAT(match(I, Req), ElementsAre("close::abc")); |
| 662 | |
| 663 | // FuzzyFind request comes from the file which is close to the root: expect |
| 664 | // RootSymbol to come out. |
| 665 | Req.ProximityPaths = {testPath("file.h")}; |
| 666 | EXPECT_THAT(match(I, Req), ElementsAre("root::abc")); |
| 667 | } |
| 668 | |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 669 | TEST(DexTests, Refs) { |
| 670 | DenseMap<SymbolID, std::vector<Ref>> Refs; |
| 671 | auto AddRef = [&](const Symbol& Sym, StringRef Filename, RefKind Kind) { |
| 672 | auto& SymbolRefs = Refs[Sym.ID]; |
| 673 | SymbolRefs.emplace_back(); |
| 674 | SymbolRefs.back().Kind = Kind; |
| 675 | SymbolRefs.back().Location.FileURI = Filename; |
| 676 | }; |
| 677 | auto Foo = symbol("foo"); |
| 678 | auto Bar = symbol("bar"); |
| 679 | AddRef(Foo, "foo.h", RefKind::Declaration); |
| 680 | AddRef(Foo, "reffoo.h", RefKind::Reference); |
| 681 | AddRef(Bar, "bar.h", RefKind::Declaration); |
| 682 | |
| 683 | std::vector<std::string> Files; |
| 684 | RefsRequest Req; |
| 685 | Req.IDs.insert(Foo.ID); |
| 686 | Req.Filter = RefKind::Declaration | RefKind::Definition; |
| 687 | Dex(std::vector<Symbol>{Foo, Bar}, Refs, {}).refs(Req, [&](const Ref &R) { |
| 688 | Files.push_back(R.Location.FileURI); |
| 689 | }); |
| 690 | |
| 691 | EXPECT_THAT(Files, ElementsAre("foo.h")); |
| 692 | } |
| 693 | |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 694 | } // namespace |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 695 | } // namespace dex |
| 696 | } // namespace clangd |
| 697 | } // namespace clang |