Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 1 | //===-- DexTests.cpp ---------------------------------*- C++ -*-----------===// |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | |
Kirill Bobyrev | 19a9461 | 2018-09-06 12:54:43 +0000 | [diff] [blame] | 10 | #include "FuzzyMatch.h" |
| 11 | #include "TestFS.h" |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 12 | #include "TestIndex.h" |
| 13 | #include "index/Index.h" |
| 14 | #include "index/Merge.h" |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 15 | #include "index/dex/Dex.h" |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 16 | #include "index/dex/Iterator.h" |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 17 | #include "index/dex/Token.h" |
| 18 | #include "index/dex/Trigram.h" |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 19 | #include "llvm/Support/ScopedPrinter.h" |
| 20 | #include "llvm/Support/raw_ostream.h" |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 21 | #include "gmock/gmock.h" |
| 22 | #include "gtest/gtest.h" |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 23 | #include <string> |
| 24 | #include <vector> |
| 25 | |
Sam McCall | c92e4f3 | 2018-10-09 10:02:02 +0000 | [diff] [blame^] | 26 | using ::testing::AnyOf; |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 27 | using ::testing::ElementsAre; |
| 28 | using ::testing::UnorderedElementsAre; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 29 | using namespace llvm; |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 30 | |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 31 | namespace clang { |
| 32 | namespace clangd { |
| 33 | namespace dex { |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 34 | namespace { |
Kirill Bobyrev | bea258d | 2018-07-26 10:42:31 +0000 | [diff] [blame] | 35 | |
// URI schemes handed to Dex::build() by the index tests in this file.
std::vector<std::string> URISchemes{"unittest"};
| 37 | |
| 38 | //===----------------------------------------------------------------------===// |
| 39 | // Query iterator tests. |
| 40 | //===----------------------------------------------------------------------===// |
| 41 | |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 42 | std::vector<DocID> consumeIDs(Iterator &It) { |
| 43 | auto IDAndScore = consume(It); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 44 | std::vector<DocID> IDs(IDAndScore.size()); |
| 45 | for (size_t I = 0; I < IDAndScore.size(); ++I) |
| 46 | IDs[I] = IDAndScore[I].first; |
| 47 | return IDs; |
| 48 | } |
| 49 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 50 | TEST(DexIterators, DocumentIterator) { |
Kirill Bobyrev | 249c586 | 2018-09-13 17:11:03 +0000 | [diff] [blame] | 51 | const PostingList L({4, 7, 8, 20, 42, 100}); |
| 52 | auto DocIterator = L.iterator(); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 53 | |
| 54 | EXPECT_EQ(DocIterator->peek(), 4U); |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 55 | EXPECT_FALSE(DocIterator->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 56 | |
| 57 | DocIterator->advance(); |
| 58 | EXPECT_EQ(DocIterator->peek(), 7U); |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 59 | EXPECT_FALSE(DocIterator->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 60 | |
| 61 | DocIterator->advanceTo(20); |
| 62 | EXPECT_EQ(DocIterator->peek(), 20U); |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 63 | EXPECT_FALSE(DocIterator->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 64 | |
| 65 | DocIterator->advanceTo(65); |
| 66 | EXPECT_EQ(DocIterator->peek(), 100U); |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 67 | EXPECT_FALSE(DocIterator->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 68 | |
| 69 | DocIterator->advanceTo(420); |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 70 | EXPECT_TRUE(DocIterator->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 71 | } |
| 72 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 73 | TEST(DexIterators, AndTwoLists) { |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 74 | Corpus C{10000}; |
Kirill Bobyrev | 249c586 | 2018-09-13 17:11:03 +0000 | [diff] [blame] | 75 | const PostingList L0({0, 5, 7, 10, 42, 320, 9000}); |
| 76 | const PostingList L1({0, 4, 7, 10, 30, 60, 320, 9000}); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 77 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 78 | auto And = C.intersect(L1.iterator(), L0.iterator()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 79 | |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 80 | EXPECT_FALSE(And->reachedEnd()); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 81 | EXPECT_THAT(consumeIDs(*And), ElementsAre(0U, 7U, 10U, 320U, 9000U)); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 82 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 83 | And = C.intersect(L0.iterator(), L1.iterator()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 84 | |
| 85 | And->advanceTo(0); |
| 86 | EXPECT_EQ(And->peek(), 0U); |
| 87 | And->advanceTo(5); |
| 88 | EXPECT_EQ(And->peek(), 7U); |
| 89 | And->advanceTo(10); |
| 90 | EXPECT_EQ(And->peek(), 10U); |
| 91 | And->advanceTo(42); |
| 92 | EXPECT_EQ(And->peek(), 320U); |
| 93 | And->advanceTo(8999); |
| 94 | EXPECT_EQ(And->peek(), 9000U); |
| 95 | And->advanceTo(9001); |
| 96 | } |
| 97 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 98 | TEST(DexIterators, AndThreeLists) { |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 99 | Corpus C{10000}; |
Kirill Bobyrev | 249c586 | 2018-09-13 17:11:03 +0000 | [diff] [blame] | 100 | const PostingList L0({0, 5, 7, 10, 42, 320, 9000}); |
| 101 | const PostingList L1({0, 4, 7, 10, 30, 60, 320, 9000}); |
| 102 | const PostingList L2({1, 4, 7, 11, 30, 60, 320, 9000}); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 103 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 104 | auto And = C.intersect(L0.iterator(), L1.iterator(), L2.iterator()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 105 | EXPECT_EQ(And->peek(), 7U); |
| 106 | And->advanceTo(300); |
| 107 | EXPECT_EQ(And->peek(), 320U); |
| 108 | And->advanceTo(100000); |
| 109 | |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 110 | EXPECT_TRUE(And->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 111 | } |
| 112 | |
Sam McCall | 87f69eaf | 2018-10-04 13:12:23 +0000 | [diff] [blame] | 113 | TEST(DexIterators, AndEmpty) { |
| 114 | Corpus C{10000}; |
Sam McCall | a4c17dd | 2018-10-04 16:05:22 +0000 | [diff] [blame] | 115 | const PostingList L1{1}; |
| 116 | const PostingList L2{2}; |
Sam McCall | 87f69eaf | 2018-10-04 13:12:23 +0000 | [diff] [blame] | 117 | // These iterators are empty, but the optimizer can't tell. |
| 118 | auto Empty1 = C.intersect(L1.iterator(), L2.iterator()); |
| 119 | auto Empty2 = C.intersect(L1.iterator(), L2.iterator()); |
| 120 | // And syncs iterators on construction, and used to fail on empty children. |
| 121 | auto And = C.intersect(std::move(Empty1), std::move(Empty2)); |
| 122 | EXPECT_TRUE(And->reachedEnd()); |
| 123 | } |
| 124 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 125 | TEST(DexIterators, OrTwoLists) { |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 126 | Corpus C{10000}; |
Kirill Bobyrev | 249c586 | 2018-09-13 17:11:03 +0000 | [diff] [blame] | 127 | const PostingList L0({0, 5, 7, 10, 42, 320, 9000}); |
| 128 | const PostingList L1({0, 4, 7, 10, 30, 60, 320, 9000}); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 129 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 130 | auto Or = C.unionOf(L0.iterator(), L1.iterator()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 131 | |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 132 | EXPECT_FALSE(Or->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 133 | EXPECT_EQ(Or->peek(), 0U); |
| 134 | Or->advance(); |
| 135 | EXPECT_EQ(Or->peek(), 4U); |
| 136 | Or->advance(); |
| 137 | EXPECT_EQ(Or->peek(), 5U); |
| 138 | Or->advance(); |
| 139 | EXPECT_EQ(Or->peek(), 7U); |
| 140 | Or->advance(); |
| 141 | EXPECT_EQ(Or->peek(), 10U); |
| 142 | Or->advance(); |
| 143 | EXPECT_EQ(Or->peek(), 30U); |
| 144 | Or->advanceTo(42); |
| 145 | EXPECT_EQ(Or->peek(), 42U); |
| 146 | Or->advanceTo(300); |
| 147 | EXPECT_EQ(Or->peek(), 320U); |
| 148 | Or->advanceTo(9000); |
| 149 | EXPECT_EQ(Or->peek(), 9000U); |
| 150 | Or->advanceTo(9001); |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 151 | EXPECT_TRUE(Or->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 152 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 153 | Or = C.unionOf(L0.iterator(), L1.iterator()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 154 | |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 155 | EXPECT_THAT(consumeIDs(*Or), |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 156 | ElementsAre(0U, 4U, 5U, 7U, 10U, 30U, 42U, 60U, 320U, 9000U)); |
| 157 | } |
| 158 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 159 | TEST(DexIterators, OrThreeLists) { |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 160 | Corpus C{10000}; |
Kirill Bobyrev | 249c586 | 2018-09-13 17:11:03 +0000 | [diff] [blame] | 161 | const PostingList L0({0, 5, 7, 10, 42, 320, 9000}); |
| 162 | const PostingList L1({0, 4, 7, 10, 30, 60, 320, 9000}); |
| 163 | const PostingList L2({1, 4, 7, 11, 30, 60, 320, 9000}); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 164 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 165 | auto Or = C.unionOf(L0.iterator(), L1.iterator(), L2.iterator()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 166 | |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 167 | EXPECT_FALSE(Or->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 168 | EXPECT_EQ(Or->peek(), 0U); |
| 169 | |
| 170 | Or->advance(); |
| 171 | EXPECT_EQ(Or->peek(), 1U); |
| 172 | |
| 173 | Or->advance(); |
| 174 | EXPECT_EQ(Or->peek(), 4U); |
| 175 | |
| 176 | Or->advanceTo(7); |
| 177 | |
| 178 | Or->advanceTo(59); |
| 179 | EXPECT_EQ(Or->peek(), 60U); |
| 180 | |
| 181 | Or->advanceTo(9001); |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 182 | EXPECT_TRUE(Or->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 183 | } |
| 184 | |
| 185 | // FIXME(kbobyrev): The testcase below is similar to what is expected in real |
| 186 | // queries. It should be updated once new iterators (such as boosting, limiting, |
| 187 | // etc iterators) appear. However, it is not exhaustive and it would be |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 188 | // beneficial to implement automatic generation (e.g. fuzzing) of query trees |
| 189 | // for more comprehensive testing. |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 190 | TEST(DexIterators, QueryTree) { |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 191 | // |
| 192 | // +-----------------+ |
| 193 | // |And Iterator:1, 5| |
| 194 | // +--------+--------+ |
| 195 | // | |
| 196 | // | |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 197 | // +-------------+----------------------+ |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 198 | // | | |
| 199 | // | | |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 200 | // +----------v----------+ +----------v------------+ |
| 201 | // |And Iterator: 1, 5, 9| |Or Iterator: 0, 1, 3, 5| |
| 202 | // +----------+----------+ +----------+------------+ |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 203 | // | | |
Kirill Bobyrev | 6c2f5bd | 2018-09-25 11:54:51 +0000 | [diff] [blame] | 204 | // +------+-----+ ------------+ |
| 205 | // | | | | |
| 206 | // +-------v-----+ +----+---+ +---v----+ +----v---+ |
| 207 | // |1, 3, 5, 8, 9| |Boost: 2| |Boost: 3| |Boost: 4| |
| 208 | // +-------------+ +----+---+ +---+----+ +----+---+ |
| 209 | // | | | |
| 210 | // +----v-----+ +-v--+ +---v---+ |
| 211 | // |1, 5, 7, 9| |1, 5| |0, 3, 5| |
| 212 | // +----------+ +----+ +-------+ |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 213 | // |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 214 | Corpus C{10}; |
Kirill Bobyrev | 249c586 | 2018-09-13 17:11:03 +0000 | [diff] [blame] | 215 | const PostingList L0({1, 3, 5, 8, 9}); |
| 216 | const PostingList L1({1, 5, 7, 9}); |
Kirill Bobyrev | 6c2f5bd | 2018-09-25 11:54:51 +0000 | [diff] [blame] | 217 | const PostingList L2({1, 5}); |
| 218 | const PostingList L3({0, 3, 5}); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 219 | |
| 220 | // Root of the query tree: [1, 5] |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 221 | auto Root = C.intersect( |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 222 | // Lower And Iterator: [1, 5, 9] |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 223 | C.intersect(L0.iterator(), C.boost(L1.iterator(), 2U)), |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 224 | // Lower Or Iterator: [0, 1, 5] |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 225 | C.unionOf(C.boost(L2.iterator(), 3U), C.boost(L3.iterator(), 4U))); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 226 | |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 227 | EXPECT_FALSE(Root->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 228 | EXPECT_EQ(Root->peek(), 1U); |
| 229 | Root->advanceTo(0); |
| 230 | // Advance multiple times. Shouldn't do anything. |
| 231 | Root->advanceTo(1); |
| 232 | Root->advanceTo(0); |
| 233 | EXPECT_EQ(Root->peek(), 1U); |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 234 | auto ElementBoost = Root->consume(); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 235 | EXPECT_THAT(ElementBoost, 6); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 236 | Root->advance(); |
| 237 | EXPECT_EQ(Root->peek(), 5U); |
| 238 | Root->advanceTo(5); |
| 239 | EXPECT_EQ(Root->peek(), 5U); |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 240 | ElementBoost = Root->consume(); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 241 | EXPECT_THAT(ElementBoost, 8); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 242 | Root->advanceTo(9000); |
Kirill Bobyrev | 6d8bd7f | 2018-08-20 09:16:14 +0000 | [diff] [blame] | 243 | EXPECT_TRUE(Root->reachedEnd()); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 244 | } |
| 245 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 246 | TEST(DexIterators, StringRepresentation) { |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 247 | Corpus C{10}; |
Sam McCall | 7402836 | 2018-10-02 11:51:36 +0000 | [diff] [blame] | 248 | const PostingList L1({1, 3, 5}); |
| 249 | const PostingList L2({1, 7, 9}); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 250 | |
Sam McCall | 7402836 | 2018-10-02 11:51:36 +0000 | [diff] [blame] | 251 | // No token given, prints full posting list. |
| 252 | auto I1 = L1.iterator(); |
| 253 | EXPECT_EQ(llvm::to_string(*I1), "[1 3 5]"); |
| 254 | |
| 255 | // Token given, uses token's string representation. |
| 256 | Token Tok(Token::Kind::Trigram, "L2"); |
| 257 | auto I2 = L1.iterator(&Tok); |
| 258 | EXPECT_EQ(llvm::to_string(*I2), "T=L2"); |
| 259 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 260 | auto Tree = C.limit(C.intersect(move(I1), move(I2)), 10); |
Sam McCall | c92e4f3 | 2018-10-09 10:02:02 +0000 | [diff] [blame^] | 261 | // AND reorders its children, we don't care which order it prints. |
| 262 | EXPECT_THAT(llvm::to_string(*Tree), AnyOf("(LIMIT 10 (& [1 3 5] T=L2))", |
| 263 | "(LIMIT 10 (& T=L2 [1 3 5]))")); |
Kirill Bobyrev | a522c1c | 2018-07-27 09:54:27 +0000 | [diff] [blame] | 264 | } |
| 265 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 266 | TEST(DexIterators, Limit) { |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 267 | Corpus C{10000}; |
Kirill Bobyrev | 249c586 | 2018-09-13 17:11:03 +0000 | [diff] [blame] | 268 | const PostingList L0({3, 6, 7, 20, 42, 100}); |
| 269 | const PostingList L1({1, 3, 5, 6, 7, 30, 100}); |
| 270 | const PostingList L2({0, 3, 5, 7, 8, 100}); |
Kirill Bobyrev | 0a75766 | 2018-08-10 11:50:44 +0000 | [diff] [blame] | 271 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 272 | auto DocIterator = C.limit(L0.iterator(), 42); |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 273 | EXPECT_THAT(consumeIDs(*DocIterator), ElementsAre(3, 6, 7, 20, 42, 100)); |
Kirill Bobyrev | 0a75766 | 2018-08-10 11:50:44 +0000 | [diff] [blame] | 274 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 275 | DocIterator = C.limit(L0.iterator(), 3); |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 276 | EXPECT_THAT(consumeIDs(*DocIterator), ElementsAre(3, 6, 7)); |
Kirill Bobyrev | 0a75766 | 2018-08-10 11:50:44 +0000 | [diff] [blame] | 277 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 278 | DocIterator = C.limit(L0.iterator(), 0); |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 279 | EXPECT_THAT(consumeIDs(*DocIterator), ElementsAre()); |
Kirill Bobyrev | 0a75766 | 2018-08-10 11:50:44 +0000 | [diff] [blame] | 280 | |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 281 | auto AndIterator = |
| 282 | C.intersect(C.limit(C.all(), 343), C.limit(L0.iterator(), 2), |
| 283 | C.limit(L1.iterator(), 3), C.limit(L2.iterator(), 42)); |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 284 | EXPECT_THAT(consumeIDs(*AndIterator), ElementsAre(3, 7)); |
Kirill Bobyrev | 0a75766 | 2018-08-10 11:50:44 +0000 | [diff] [blame] | 285 | } |
| 286 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 287 | TEST(DexIterators, True) { |
Sam McCall | 87f69eaf | 2018-10-04 13:12:23 +0000 | [diff] [blame] | 288 | EXPECT_TRUE(Corpus{0}.all()->reachedEnd()); |
| 289 | EXPECT_THAT(consumeIDs(*Corpus{4}.all()), ElementsAre(0, 1, 2, 3)); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 290 | } |
| 291 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 292 | TEST(DexIterators, Boost) { |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 293 | Corpus C{5}; |
| 294 | auto BoostIterator = C.boost(C.all(), 42U); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 295 | EXPECT_FALSE(BoostIterator->reachedEnd()); |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 296 | auto ElementBoost = BoostIterator->consume(); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 297 | EXPECT_THAT(ElementBoost, 42U); |
| 298 | |
Kirill Bobyrev | 249c586 | 2018-09-13 17:11:03 +0000 | [diff] [blame] | 299 | const PostingList L0({2, 4}); |
| 300 | const PostingList L1({1, 4}); |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 301 | auto Root = C.unionOf(C.all(), C.boost(L0.iterator(), 2U), |
| 302 | C.boost(L1.iterator(), 3U)); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 303 | |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 304 | ElementBoost = Root->consume(); |
Sam McCall | a659d77 | 2018-10-02 19:59:23 +0000 | [diff] [blame] | 305 | EXPECT_THAT(ElementBoost, 1); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 306 | Root->advance(); |
| 307 | EXPECT_THAT(Root->peek(), 1U); |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 308 | ElementBoost = Root->consume(); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 309 | EXPECT_THAT(ElementBoost, 3); |
| 310 | |
| 311 | Root->advance(); |
| 312 | EXPECT_THAT(Root->peek(), 2U); |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 313 | ElementBoost = Root->consume(); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 314 | EXPECT_THAT(ElementBoost, 2); |
| 315 | |
| 316 | Root->advanceTo(4); |
Kirill Bobyrev | a98961b | 2018-08-24 11:25:43 +0000 | [diff] [blame] | 317 | ElementBoost = Root->consume(); |
Kirill Bobyrev | 7413e98 | 2018-08-22 13:44:15 +0000 | [diff] [blame] | 318 | EXPECT_THAT(ElementBoost, 3); |
Kirill Bobyrev | 30ffdf4 | 2018-08-20 08:47:30 +0000 | [diff] [blame] | 319 | } |
| 320 | |
Sam McCall | 87f69eaf | 2018-10-04 13:12:23 +0000 | [diff] [blame] | 321 | TEST(DexIterators, Optimizations) { |
| 322 | Corpus C{5}; |
Jonas Toth | 0451440 | 2018-10-04 16:29:58 +0000 | [diff] [blame] | 323 | const PostingList L1{1}; |
| 324 | const PostingList L2{2}; |
| 325 | const PostingList L3{3}; |
Sam McCall | 87f69eaf | 2018-10-04 13:12:23 +0000 | [diff] [blame] | 326 | |
| 327 | // empty and/or yield true/false |
| 328 | EXPECT_EQ(llvm::to_string(*C.intersect()), "true"); |
| 329 | EXPECT_EQ(llvm::to_string(*C.unionOf()), "false"); |
| 330 | |
| 331 | // true/false inside and/or short-circuit |
| 332 | EXPECT_EQ(llvm::to_string(*C.intersect(L1.iterator(), C.all())), "[1]"); |
| 333 | EXPECT_EQ(llvm::to_string(*C.intersect(L1.iterator(), C.none())), "false"); |
| 334 | // Not optimized to avoid breaking boosts. |
| 335 | EXPECT_EQ(llvm::to_string(*C.unionOf(L1.iterator(), C.all())), |
| 336 | "(| [1] true)"); |
| 337 | EXPECT_EQ(llvm::to_string(*C.unionOf(L1.iterator(), C.none())), "[1]"); |
| 338 | |
| 339 | // and/or nested inside and/or are flattened |
| 340 | EXPECT_EQ(llvm::to_string(*C.intersect( |
| 341 | L1.iterator(), C.intersect(L1.iterator(), L1.iterator()))), |
| 342 | "(& [1] [1] [1])"); |
| 343 | EXPECT_EQ(llvm::to_string(*C.unionOf( |
| 344 | L1.iterator(), C.unionOf(L2.iterator(), L3.iterator()))), |
| 345 | "(| [1] [2] [3])"); |
| 346 | |
| 347 | // optimizations combine over multiple levels |
| 348 | EXPECT_EQ(llvm::to_string(*C.intersect( |
| 349 | C.intersect(L1.iterator(), C.intersect()), C.unionOf(C.all()))), |
| 350 | "[1]"); |
| 351 | } |
| 352 | |
Kirill Bobyrev | 19a9461 | 2018-09-06 12:54:43 +0000 | [diff] [blame] | 353 | //===----------------------------------------------------------------------===// |
| 354 | // Search token tests. |
| 355 | //===----------------------------------------------------------------------===// |
| 356 | |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 357 | testing::Matcher<std::vector<Token>> |
Kirill Bobyrev | 19a9461 | 2018-09-06 12:54:43 +0000 | [diff] [blame] | 358 | tokensAre(std::initializer_list<std::string> Strings, Token::Kind Kind) { |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 359 | std::vector<Token> Tokens; |
Kirill Bobyrev | 19a9461 | 2018-09-06 12:54:43 +0000 | [diff] [blame] | 360 | for (const auto &TokenData : Strings) { |
| 361 | Tokens.push_back(Token(Kind, TokenData)); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 362 | } |
| 363 | return testing::UnorderedElementsAreArray(Tokens); |
| 364 | } |
| 365 | |
Kirill Bobyrev | 19a9461 | 2018-09-06 12:54:43 +0000 | [diff] [blame] | 366 | testing::Matcher<std::vector<Token>> |
| 367 | trigramsAre(std::initializer_list<std::string> Trigrams) { |
| 368 | return tokensAre(Trigrams, Token::Kind::Trigram); |
| 369 | } |
| 370 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 371 | TEST(DexTrigrams, IdentifierTrigrams) { |
Kirill Bobyrev | ff2dd90 | 2018-08-13 08:57:06 +0000 | [diff] [blame] | 372 | EXPECT_THAT(generateIdentifierTrigrams("X86"), |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 373 | trigramsAre({"x86", "x", "x8"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 374 | |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 375 | EXPECT_THAT(generateIdentifierTrigrams("nl"), trigramsAre({"nl", "n"})); |
Kirill Bobyrev | ff2dd90 | 2018-08-13 08:57:06 +0000 | [diff] [blame] | 376 | |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 377 | EXPECT_THAT(generateIdentifierTrigrams("n"), trigramsAre({"n"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 378 | |
| 379 | EXPECT_THAT(generateIdentifierTrigrams("clangd"), |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 380 | trigramsAre({"c", "cl", "cla", "lan", "ang", "ngd"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 381 | |
| 382 | EXPECT_THAT(generateIdentifierTrigrams("abc_def"), |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 383 | trigramsAre({"a", "ab", "ad", "abc", "abd", "ade", "bcd", "bde", |
| 384 | "cde", "def"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 385 | |
Kirill Bobyrev | ff2dd90 | 2018-08-13 08:57:06 +0000 | [diff] [blame] | 386 | EXPECT_THAT(generateIdentifierTrigrams("a_b_c_d_e_"), |
Sam McCall | 2ec5a10 | 2018-10-04 14:08:11 +0000 | [diff] [blame] | 387 | trigramsAre({"a", "a_", "ab", "abc", "bcd", "cde"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 388 | |
Kirill Bobyrev | ff2dd90 | 2018-08-13 08:57:06 +0000 | [diff] [blame] | 389 | EXPECT_THAT(generateIdentifierTrigrams("unique_ptr"), |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 390 | trigramsAre({"u", "un", "up", "uni", "unp", "upt", "niq", "nip", |
| 391 | "npt", "iqu", "iqp", "ipt", "que", "qup", "qpt", |
| 392 | "uep", "ept", "ptr"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 393 | |
Kirill Bobyrev | e6d5fd8 | 2018-08-27 17:26:43 +0000 | [diff] [blame] | 394 | EXPECT_THAT( |
| 395 | generateIdentifierTrigrams("TUDecl"), |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 396 | trigramsAre({"t", "tu", "td", "tud", "tde", "ude", "dec", "ecl"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 397 | |
| 398 | EXPECT_THAT(generateIdentifierTrigrams("IsOK"), |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 399 | trigramsAre({"i", "is", "io", "iso", "iok", "sok"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 400 | |
Kirill Bobyrev | ff2dd90 | 2018-08-13 08:57:06 +0000 | [diff] [blame] | 401 | EXPECT_THAT( |
| 402 | generateIdentifierTrigrams("abc_defGhij__klm"), |
Sam McCall | 2ec5a10 | 2018-10-04 14:08:11 +0000 | [diff] [blame] | 403 | trigramsAre({"a", "ab", "ad", "abc", "abd", "ade", "adg", "bcd", |
| 404 | "bde", "bdg", "cde", "cdg", "def", "deg", "dgh", "dgk", |
| 405 | "efg", "egh", "egk", "fgh", "fgk", "ghi", "ghk", "gkl", |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 406 | "hij", "hik", "hkl", "ijk", "ikl", "jkl", "klm"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 407 | } |
| 408 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 409 | TEST(DexTrigrams, QueryTrigrams) { |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 410 | EXPECT_THAT(generateQueryTrigrams("c"), trigramsAre({"c"})); |
| 411 | EXPECT_THAT(generateQueryTrigrams("cl"), trigramsAre({"cl"})); |
Kirill Bobyrev | ff2dd90 | 2018-08-13 08:57:06 +0000 | [diff] [blame] | 412 | EXPECT_THAT(generateQueryTrigrams("cla"), trigramsAre({"cla"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 413 | |
Sam McCall | 50b89f0 | 2018-10-04 17:18:55 +0000 | [diff] [blame] | 414 | EXPECT_THAT(generateQueryTrigrams(""), trigramsAre({})); |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 415 | EXPECT_THAT(generateQueryTrigrams("_"), trigramsAre({"_"})); |
| 416 | EXPECT_THAT(generateQueryTrigrams("__"), trigramsAre({"__"})); |
| 417 | EXPECT_THAT(generateQueryTrigrams("___"), trigramsAre({})); |
Kirill Bobyrev | ff2dd90 | 2018-08-13 08:57:06 +0000 | [diff] [blame] | 418 | |
| 419 | EXPECT_THAT(generateQueryTrigrams("X86"), trigramsAre({"x86"})); |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 420 | |
| 421 | EXPECT_THAT(generateQueryTrigrams("clangd"), |
| 422 | trigramsAre({"cla", "lan", "ang", "ngd"})); |
| 423 | |
| 424 | EXPECT_THAT(generateQueryTrigrams("abc_def"), |
| 425 | trigramsAre({"abc", "bcd", "cde", "def"})); |
| 426 | |
| 427 | EXPECT_THAT(generateQueryTrigrams("a_b_c_d_e_"), |
| 428 | trigramsAre({"abc", "bcd", "cde"})); |
| 429 | |
| 430 | EXPECT_THAT(generateQueryTrigrams("unique_ptr"), |
| 431 | trigramsAre({"uni", "niq", "iqu", "que", "uep", "ept", "ptr"})); |
| 432 | |
| 433 | EXPECT_THAT(generateQueryTrigrams("TUDecl"), |
| 434 | trigramsAre({"tud", "ude", "dec", "ecl"})); |
| 435 | |
| 436 | EXPECT_THAT(generateQueryTrigrams("IsOK"), trigramsAre({"iso", "sok"})); |
| 437 | |
| 438 | EXPECT_THAT(generateQueryTrigrams("abc_defGhij__klm"), |
| 439 | trigramsAre({"abc", "bcd", "cde", "def", "efg", "fgh", "ghi", |
| 440 | "hij", "ijk", "jkl", "klm"})); |
| 441 | } |
| 442 | |
Kirill Bobyrev | 19a9461 | 2018-09-06 12:54:43 +0000 | [diff] [blame] | 443 | TEST(DexSearchTokens, SymbolPath) { |
| 444 | EXPECT_THAT(generateProximityURIs( |
| 445 | "unittest:///clang-tools-extra/clangd/index/Token.h"), |
| 446 | ElementsAre("unittest:///clang-tools-extra/clangd/index/Token.h", |
| 447 | "unittest:///clang-tools-extra/clangd/index", |
| 448 | "unittest:///clang-tools-extra/clangd", |
| 449 | "unittest:///clang-tools-extra", "unittest:///")); |
| 450 | |
| 451 | EXPECT_THAT(generateProximityURIs("unittest:///a/b/c.h"), |
| 452 | ElementsAre("unittest:///a/b/c.h", "unittest:///a/b", |
| 453 | "unittest:///a", "unittest:///")); |
| 454 | } |
| 455 | |
| 456 | //===----------------------------------------------------------------------===// |
| 457 | // Index tests. |
| 458 | //===----------------------------------------------------------------------===// |
| 459 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 460 | TEST(Dex, Lookup) { |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 461 | auto I = Dex::build(generateSymbols({"ns::abc", "ns::xyz"}), RefSlab(), |
| 462 | URISchemes); |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 463 | EXPECT_THAT(lookup(*I, SymbolID("ns::abc")), UnorderedElementsAre("ns::abc")); |
| 464 | EXPECT_THAT(lookup(*I, {SymbolID("ns::abc"), SymbolID("ns::xyz")}), |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 465 | UnorderedElementsAre("ns::abc", "ns::xyz")); |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 466 | EXPECT_THAT(lookup(*I, {SymbolID("ns::nonono"), SymbolID("ns::xyz")}), |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 467 | UnorderedElementsAre("ns::xyz")); |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 468 | EXPECT_THAT(lookup(*I, SymbolID("ns::nonono")), UnorderedElementsAre()); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 469 | } |
| 470 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 471 | TEST(Dex, FuzzyFind) { |
Kirill Bobyrev | 249c586 | 2018-09-13 17:11:03 +0000 | [diff] [blame] | 472 | auto Index = |
| 473 | Dex::build(generateSymbols({"ns::ABC", "ns::BCD", "::ABC", |
| 474 | "ns::nested::ABC", "other::ABC", "other::A"}), |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 475 | RefSlab(), URISchemes); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 476 | FuzzyFindRequest Req; |
| 477 | Req.Query = "ABC"; |
| 478 | Req.Scopes = {"ns::"}; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 479 | EXPECT_THAT(match(*Index, Req), UnorderedElementsAre("ns::ABC")); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 480 | Req.Scopes = {"ns::", "ns::nested::"}; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 481 | EXPECT_THAT(match(*Index, Req), |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 482 | UnorderedElementsAre("ns::ABC", "ns::nested::ABC")); |
| 483 | Req.Query = "A"; |
| 484 | Req.Scopes = {"other::"}; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 485 | EXPECT_THAT(match(*Index, Req), |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 486 | UnorderedElementsAre("other::A", "other::ABC")); |
| 487 | Req.Query = ""; |
| 488 | Req.Scopes = {}; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 489 | EXPECT_THAT(match(*Index, Req), |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 490 | UnorderedElementsAre("ns::ABC", "ns::BCD", "::ABC", |
| 491 | "ns::nested::ABC", "other::ABC", |
| 492 | "other::A")); |
| 493 | } |
| 494 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 495 | // FIXME(kbobyrev): This test is different for Dex and MemIndex: while |
| 496 | // MemIndex manages response deduplication, Dex simply returns all matched |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 497 | // symbols which means there might be equivalent symbols in the response. |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 498 | // Before drop-in replacement of MemIndex with Dex happens, FileIndex |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 499 | // should handle deduplication instead. |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 500 | TEST(DexTest, DexDeduplicate) { |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 501 | std::vector<Symbol> Symbols = {symbol("1"), symbol("2"), symbol("3"), |
| 502 | symbol("2") /* duplicate */}; |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 503 | FuzzyFindRequest Req; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 504 | Req.Query = "2"; |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 505 | Dex I(Symbols, RefSlab(), URISchemes); |
Kirill Bobyrev | e6dd080 | 2018-09-13 14:27:03 +0000 | [diff] [blame] | 506 | EXPECT_FALSE(Req.Limit); |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 507 | EXPECT_THAT(match(I, Req), ElementsAre("2", "2")); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 508 | } |
| 509 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 510 | TEST(DexTest, DexLimitedNumMatches) { |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 511 | auto I = Dex::build(generateNumSymbols(0, 100), RefSlab(), URISchemes); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 512 | FuzzyFindRequest Req; |
| 513 | Req.Query = "5"; |
Kirill Bobyrev | e6dd080 | 2018-09-13 14:27:03 +0000 | [diff] [blame] | 514 | Req.Limit = 3; |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 515 | bool Incomplete; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 516 | auto Matches = match(*I, Req, &Incomplete); |
Kirill Bobyrev | e6dd080 | 2018-09-13 14:27:03 +0000 | [diff] [blame] | 517 | EXPECT_TRUE(Req.Limit); |
| 518 | EXPECT_EQ(Matches.size(), *Req.Limit); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 519 | EXPECT_TRUE(Incomplete); |
| 520 | } |
| 521 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 522 | TEST(DexTest, FuzzyMatch) { |
| 523 | auto I = Dex::build( |
Kirill Bobyrev | 19a9461 | 2018-09-06 12:54:43 +0000 | [diff] [blame] | 524 | generateSymbols({"LaughingOutLoud", "LionPopulation", "LittleOldLady"}), |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 525 | RefSlab(), URISchemes); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 526 | FuzzyFindRequest Req; |
| 527 | Req.Query = "lol"; |
Kirill Bobyrev | e6dd080 | 2018-09-13 14:27:03 +0000 | [diff] [blame] | 528 | Req.Limit = 2; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 529 | EXPECT_THAT(match(*I, Req), |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 530 | UnorderedElementsAre("LaughingOutLoud", "LittleOldLady")); |
| 531 | } |
| 532 | |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 533 | TEST(DexTest, ShortQuery) { |
| 534 | auto I = |
| 535 | Dex::build(generateSymbols({"OneTwoThreeFour"}), RefSlab(), URISchemes); |
| 536 | FuzzyFindRequest Req; |
| 537 | bool Incomplete; |
| 538 | |
| 539 | EXPECT_THAT(match(*I, Req, &Incomplete), ElementsAre("OneTwoThreeFour")); |
| 540 | EXPECT_FALSE(Incomplete) << "Empty string is not a short query"; |
| 541 | |
| 542 | Req.Query = "t"; |
| 543 | EXPECT_THAT(match(*I, Req, &Incomplete), ElementsAre()); |
| 544 | EXPECT_TRUE(Incomplete) << "Short queries have different semantics"; |
| 545 | |
| 546 | Req.Query = "tt"; |
| 547 | EXPECT_THAT(match(*I, Req, &Incomplete), ElementsAre()); |
| 548 | EXPECT_TRUE(Incomplete) << "Short queries have different semantics"; |
| 549 | |
| 550 | Req.Query = "ttf"; |
| 551 | EXPECT_THAT(match(*I, Req, &Incomplete), ElementsAre("OneTwoThreeFour")); |
| 552 | EXPECT_FALSE(Incomplete) << "3-char string is not a short query"; |
| 553 | } |
Sam McCall | b5bbfef | 2018-10-04 14:01:55 +0000 | [diff] [blame] | 554 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 555 | TEST(DexTest, MatchQualifiedNamesWithoutSpecificScope) { |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 556 | auto I = Dex::build(generateSymbols({"a::y1", "b::y2", "y3"}), RefSlab(), |
| 557 | URISchemes); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 558 | FuzzyFindRequest Req; |
| 559 | Req.Query = "y"; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 560 | EXPECT_THAT(match(*I, Req), UnorderedElementsAre("a::y1", "b::y2", "y3")); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 561 | } |
| 562 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 563 | TEST(DexTest, MatchQualifiedNamesWithGlobalScope) { |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 564 | auto I = Dex::build(generateSymbols({"a::y1", "b::y2", "y3"}), RefSlab(), |
| 565 | URISchemes); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 566 | FuzzyFindRequest Req; |
| 567 | Req.Query = "y"; |
| 568 | Req.Scopes = {""}; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 569 | EXPECT_THAT(match(*I, Req), UnorderedElementsAre("y3")); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 570 | } |
| 571 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 572 | TEST(DexTest, MatchQualifiedNamesWithOneScope) { |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 573 | auto I = |
| 574 | Dex::build(generateSymbols({"a::y1", "a::y2", "a::x", "b::y2", "y3"}), |
| 575 | RefSlab(), URISchemes); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 576 | FuzzyFindRequest Req; |
| 577 | Req.Query = "y"; |
| 578 | Req.Scopes = {"a::"}; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 579 | EXPECT_THAT(match(*I, Req), UnorderedElementsAre("a::y1", "a::y2")); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 580 | } |
| 581 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 582 | TEST(DexTest, MatchQualifiedNamesWithMultipleScopes) { |
| 583 | auto I = Dex::build( |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 584 | generateSymbols({"a::y1", "a::y2", "a::x", "b::y3", "y3"}), RefSlab(), URISchemes); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 585 | FuzzyFindRequest Req; |
| 586 | Req.Query = "y"; |
| 587 | Req.Scopes = {"a::", "b::"}; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 588 | EXPECT_THAT(match(*I, Req), UnorderedElementsAre("a::y1", "a::y2", "b::y3")); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 589 | } |
| 590 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 591 | TEST(DexTest, NoMatchNestedScopes) { |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 592 | auto I = Dex::build(generateSymbols({"a::y1", "a::b::y2"}), RefSlab(), URISchemes); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 593 | FuzzyFindRequest Req; |
| 594 | Req.Query = "y"; |
| 595 | Req.Scopes = {"a::"}; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 596 | EXPECT_THAT(match(*I, Req), UnorderedElementsAre("a::y1")); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 597 | } |
| 598 | |
Eric Liu | 670c147 | 2018-09-27 18:46:00 +0000 | [diff] [blame] | 599 | TEST(DexTest, WildcardScope) { |
| 600 | auto I = |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 601 | Dex::build(generateSymbols({"a::y1", "a::b::y2", "c::y3"}), RefSlab(), URISchemes); |
Eric Liu | 670c147 | 2018-09-27 18:46:00 +0000 | [diff] [blame] | 602 | FuzzyFindRequest Req; |
| 603 | Req.Query = "y"; |
| 604 | Req.Scopes = {"a::"}; |
| 605 | Req.AnyScope = true; |
| 606 | EXPECT_THAT(match(*I, Req), |
| 607 | UnorderedElementsAre("a::y1", "a::b::y2", "c::y3")); |
| 608 | } |
| 609 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 610 | TEST(DexTest, IgnoreCases) { |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 611 | auto I = Dex::build(generateSymbols({"ns::ABC", "ns::abc"}), RefSlab(), URISchemes); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 612 | FuzzyFindRequest Req; |
| 613 | Req.Query = "AB"; |
| 614 | Req.Scopes = {"ns::"}; |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 615 | EXPECT_THAT(match(*I, Req), UnorderedElementsAre("ns::ABC", "ns::abc")); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 616 | } |
| 617 | |
Sam McCall | 50b89f0 | 2018-10-04 17:18:55 +0000 | [diff] [blame] | 618 | TEST(DexTest, UnknownPostingList) { |
| 619 | // Regression test: we used to ignore unknown scopes and accept any symbol. |
| 620 | auto I = Dex::build(generateSymbols({"ns::ABC", "ns::abc"}), RefSlab(), |
| 621 | URISchemes); |
| 622 | FuzzyFindRequest Req; |
| 623 | Req.Scopes = {"ns2::"}; |
| 624 | EXPECT_THAT(match(*I, Req), UnorderedElementsAre()); |
| 625 | } |
| 626 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 627 | TEST(DexTest, Lookup) { |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 628 | auto I = Dex::build(generateSymbols({"ns::abc", "ns::xyz"}), RefSlab(), URISchemes); |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 629 | EXPECT_THAT(lookup(*I, SymbolID("ns::abc")), UnorderedElementsAre("ns::abc")); |
| 630 | EXPECT_THAT(lookup(*I, {SymbolID("ns::abc"), SymbolID("ns::xyz")}), |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 631 | UnorderedElementsAre("ns::abc", "ns::xyz")); |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 632 | EXPECT_THAT(lookup(*I, {SymbolID("ns::nonono"), SymbolID("ns::xyz")}), |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 633 | UnorderedElementsAre("ns::xyz")); |
Sam McCall | 9c7624e | 2018-09-03 14:37:43 +0000 | [diff] [blame] | 634 | EXPECT_THAT(lookup(*I, SymbolID("ns::nonono")), UnorderedElementsAre()); |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 635 | } |
| 636 | |
Kirill Bobyrev | 94af061 | 2018-09-24 08:45:18 +0000 | [diff] [blame] | 637 | TEST(DexTest, SymbolIndexOptionsFilter) { |
| 638 | auto CodeCompletionSymbol = symbol("Completion"); |
| 639 | auto NonCodeCompletionSymbol = symbol("NoCompletion"); |
| 640 | CodeCompletionSymbol.Flags = Symbol::SymbolFlag::IndexedForCodeCompletion; |
| 641 | NonCodeCompletionSymbol.Flags = Symbol::SymbolFlag::None; |
| 642 | std::vector<Symbol> Symbols{CodeCompletionSymbol, NonCodeCompletionSymbol}; |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 643 | Dex I(Symbols, RefSlab(), URISchemes); |
Kirill Bobyrev | 94af061 | 2018-09-24 08:45:18 +0000 | [diff] [blame] | 644 | FuzzyFindRequest Req; |
| 645 | Req.RestrictForCodeCompletion = false; |
| 646 | EXPECT_THAT(match(I, Req), ElementsAre("Completion", "NoCompletion")); |
| 647 | Req.RestrictForCodeCompletion = true; |
| 648 | EXPECT_THAT(match(I, Req), ElementsAre("Completion")); |
| 649 | } |
| 650 | |
Kirill Bobyrev | 5abe478 | 2018-09-10 08:23:53 +0000 | [diff] [blame] | 651 | TEST(DexTest, ProximityPathsBoosting) { |
Kirill Bobyrev | 19a9461 | 2018-09-06 12:54:43 +0000 | [diff] [blame] | 652 | auto RootSymbol = symbol("root::abc"); |
| 653 | RootSymbol.CanonicalDeclaration.FileURI = "unittest:///file.h"; |
| 654 | auto CloseSymbol = symbol("close::abc"); |
| 655 | CloseSymbol.CanonicalDeclaration.FileURI = "unittest:///a/b/c/d/e/f/file.h"; |
| 656 | |
| 657 | std::vector<Symbol> Symbols{CloseSymbol, RootSymbol}; |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 658 | Dex I(Symbols, RefSlab(), URISchemes); |
Kirill Bobyrev | 19a9461 | 2018-09-06 12:54:43 +0000 | [diff] [blame] | 659 | |
| 660 | FuzzyFindRequest Req; |
| 661 | Req.Query = "abc"; |
| 662 | // The best candidate can change depending on the proximity paths. |
Kirill Bobyrev | e6dd080 | 2018-09-13 14:27:03 +0000 | [diff] [blame] | 663 | Req.Limit = 1; |
Kirill Bobyrev | 19a9461 | 2018-09-06 12:54:43 +0000 | [diff] [blame] | 664 | |
| 665 | // FuzzyFind request comes from the file which is far from the root: expect |
| 666 | // CloseSymbol to come out. |
| 667 | Req.ProximityPaths = {testPath("a/b/c/d/e/f/file.h")}; |
| 668 | EXPECT_THAT(match(I, Req), ElementsAre("close::abc")); |
| 669 | |
| 670 | // FuzzyFind request comes from the file which is close to the root: expect |
| 671 | // RootSymbol to come out. |
| 672 | Req.ProximityPaths = {testPath("file.h")}; |
| 673 | EXPECT_THAT(match(I, Req), ElementsAre("root::abc")); |
| 674 | } |
| 675 | |
Sam McCall | d9eae39 | 2018-10-04 09:16:12 +0000 | [diff] [blame] | 676 | TEST(DexTests, Refs) { |
| 677 | DenseMap<SymbolID, std::vector<Ref>> Refs; |
| 678 | auto AddRef = [&](const Symbol& Sym, StringRef Filename, RefKind Kind) { |
| 679 | auto& SymbolRefs = Refs[Sym.ID]; |
| 680 | SymbolRefs.emplace_back(); |
| 681 | SymbolRefs.back().Kind = Kind; |
| 682 | SymbolRefs.back().Location.FileURI = Filename; |
| 683 | }; |
| 684 | auto Foo = symbol("foo"); |
| 685 | auto Bar = symbol("bar"); |
| 686 | AddRef(Foo, "foo.h", RefKind::Declaration); |
| 687 | AddRef(Foo, "reffoo.h", RefKind::Reference); |
| 688 | AddRef(Bar, "bar.h", RefKind::Declaration); |
| 689 | |
| 690 | std::vector<std::string> Files; |
| 691 | RefsRequest Req; |
| 692 | Req.IDs.insert(Foo.ID); |
| 693 | Req.Filter = RefKind::Declaration | RefKind::Definition; |
| 694 | Dex(std::vector<Symbol>{Foo, Bar}, Refs, {}).refs(Req, [&](const Ref &R) { |
| 695 | Files.push_back(R.Location.FileURI); |
| 696 | }); |
| 697 | |
| 698 | EXPECT_THAT(Files, ElementsAre("foo.h")); |
| 699 | } |
| 700 | |
Kirill Bobyrev | 870aaf2 | 2018-08-20 14:39:32 +0000 | [diff] [blame] | 701 | } // namespace |
Kirill Bobyrev | 5e82f05 | 2018-07-25 10:34:57 +0000 | [diff] [blame] | 702 | } // namespace dex |
| 703 | } // namespace clangd |
| 704 | } // namespace clang |