| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (C) 2017 The Android Open Source Project |
| 3 | * |
| 4 | * Licensed under the Apache License, Version 2.0 (the "License"); |
| 5 | * you may not use this file except in compliance with the License. |
| 6 | * You may obtain a copy of the License at |
| 7 | * |
| 8 | * http://www.apache.org/licenses/LICENSE-2.0 |
| 9 | * |
| 10 | * Unless required by applicable law or agreed to in writing, software |
| 11 | * distributed under the License is distributed on an "AS IS" BASIS, |
| 12 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 13 | * See the License for the specific language governing permissions and |
| 14 | * limitations under the License. |
| 15 | */ |
| 16 | |
| Ken Chen | 5471dca | 2019-04-15 15:25:35 +0800 | [diff] [blame] | 17 | #define LOG_TAG "resolv" |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 18 | |
| Bernie Innocenti | ec4219b | 2019-01-30 11:16:36 +0900 | [diff] [blame] | 19 | #include "DnsTlsDispatcher.h" |
| Mike Yu | e655b1d | 2019-08-28 17:49:59 +0800 | [diff] [blame] | 20 | |
| lifr | 9498178 | 2019-05-17 21:15:19 +0800 | [diff] [blame] | 21 | #include <netdutils/Stopwatch.h> |
| Mike Yu | e655b1d | 2019-08-28 17:49:59 +0800 | [diff] [blame] | 22 | |
| Bernie Innocenti | ec4219b | 2019-01-30 11:16:36 +0900 | [diff] [blame] | 23 | #include "DnsTlsSocketFactory.h" |
| Mike Yu | e655b1d | 2019-08-28 17:49:59 +0800 | [diff] [blame] | 24 | #include "resolv_cache.h" |
| lifr | 9498178 | 2019-05-17 21:15:19 +0800 | [diff] [blame] | 25 | #include "resolv_private.h" |
| 26 | #include "stats.pb.h" |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 27 | |
| chenbruce | aff8584 | 2019-05-31 15:46:42 +0800 | [diff] [blame] | 28 | #include <android-base/logging.h> |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 29 | |
| 30 | namespace android { |
| 31 | namespace net { |
| 32 | |
| Mike Yu | e655b1d | 2019-08-28 17:49:59 +0800 | [diff] [blame] | 33 | using android::netdutils::IPSockAddr; |
| lifr | 9498178 | 2019-05-17 21:15:19 +0800 | [diff] [blame] | 34 | using android::netdutils::Stopwatch; |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 35 | using netdutils::Slice; |
| 36 | |
| 37 | // static |
| 38 | std::mutex DnsTlsDispatcher::sLock; |
| 39 | |
| 40 | DnsTlsDispatcher::DnsTlsDispatcher() { |
| 41 | mFactory.reset(new DnsTlsSocketFactory()); |
| 42 | } |
| 43 | |
| Mike Yu | 9e8cf8d | 2020-10-26 19:04:33 +0800 | [diff] [blame] | 44 | DnsTlsDispatcher& DnsTlsDispatcher::getInstance() { |
| 45 | static DnsTlsDispatcher instance; |
| 46 | return instance; |
| 47 | } |
| 48 | |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 49 | std::list<DnsTlsServer> DnsTlsDispatcher::getOrderedServerList( |
| 50 | const std::list<DnsTlsServer> &tlsServers, unsigned mark) const { |
| 51 | // Our preferred DnsTlsServer order is: |
| 52 | // 1) reuse existing IPv6 connections |
| 53 | // 2) reuse existing IPv4 connections |
| 54 | // 3) establish new IPv6 connections |
| 55 | // 4) establish new IPv4 connections |
| 56 | std::list<DnsTlsServer> existing6; |
| 57 | std::list<DnsTlsServer> existing4; |
| 58 | std::list<DnsTlsServer> new6; |
| 59 | std::list<DnsTlsServer> new4; |
| 60 | |
| 61 | // Pull out any servers for which we might have existing connections and |
| 62 | // place them at the from the list of servers to try. |
| 63 | { |
| 64 | std::lock_guard guard(sLock); |
| 65 | |
| 66 | for (const auto& tlsServer : tlsServers) { |
| 67 | const Key key = std::make_pair(mark, tlsServer); |
| 68 | if (mStore.find(key) != mStore.end()) { |
| 69 | switch (tlsServer.ss.ss_family) { |
| 70 | case AF_INET: |
| 71 | existing4.push_back(tlsServer); |
| 72 | break; |
| 73 | case AF_INET6: |
| 74 | existing6.push_back(tlsServer); |
| 75 | break; |
| 76 | } |
| 77 | } else { |
| 78 | switch (tlsServer.ss.ss_family) { |
| 79 | case AF_INET: |
| 80 | new4.push_back(tlsServer); |
| 81 | break; |
| 82 | case AF_INET6: |
| 83 | new6.push_back(tlsServer); |
| 84 | break; |
| 85 | } |
| 86 | } |
| 87 | } |
| 88 | } |
| 89 | |
| 90 | auto& out = existing6; |
| 91 | out.splice(out.cend(), existing4); |
| 92 | out.splice(out.cend(), new6); |
| 93 | out.splice(out.cend(), new4); |
| 94 | return out; |
| 95 | } |
| 96 | |
| lifr | 9498178 | 2019-05-17 21:15:19 +0800 | [diff] [blame] | 97 | DnsTlsTransport::Response DnsTlsDispatcher::query(const std::list<DnsTlsServer>& tlsServers, |
| 98 | res_state statp, const Slice query, |
| 99 | const Slice ans, int* resplen) { |
| 100 | const std::list<DnsTlsServer> orderedServers(getOrderedServerList(tlsServers, statp->_mark)); |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 101 | |
| chenbruce | aff8584 | 2019-05-31 15:46:42 +0800 | [diff] [blame] | 102 | if (orderedServers.empty()) LOG(WARNING) << "Empty DnsTlsServer list"; |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 103 | |
| 104 | DnsTlsTransport::Response code = DnsTlsTransport::Response::internal_error; |
| lifr | 9498178 | 2019-05-17 21:15:19 +0800 | [diff] [blame] | 105 | int serverCount = 0; |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 106 | for (const auto& server : orderedServers) { |
| lifr | 9498178 | 2019-05-17 21:15:19 +0800 | [diff] [blame] | 107 | DnsQueryEvent* dnsQueryEvent = |
| 108 | statp->event->mutable_dns_query_events()->add_dns_query_event(); |
| Mike Yu | cb2bb7c | 2019-11-22 20:42:13 +0800 | [diff] [blame] | 109 | |
| 110 | bool connectTriggered = false; |
| lifr | d4d9fbb | 2019-07-31 20:18:35 +0800 | [diff] [blame] | 111 | Stopwatch queryStopwatch; |
| Mike Yu | cb2bb7c | 2019-11-22 20:42:13 +0800 | [diff] [blame] | 112 | code = this->query(server, statp->_mark, query, ans, resplen, &connectTriggered); |
| lifr | 9498178 | 2019-05-17 21:15:19 +0800 | [diff] [blame] | 113 | |
| lifr | d4d9fbb | 2019-07-31 20:18:35 +0800 | [diff] [blame] | 114 | dnsQueryEvent->set_latency_micros(saturate_cast<int32_t>(queryStopwatch.timeTakenUs())); |
| lifr | 9498178 | 2019-05-17 21:15:19 +0800 | [diff] [blame] | 115 | dnsQueryEvent->set_dns_server_index(serverCount++); |
| 116 | dnsQueryEvent->set_ip_version(ipFamilyToIPVersion(server.ss.ss_family)); |
| 117 | dnsQueryEvent->set_protocol(PROTO_DOT); |
| 118 | dnsQueryEvent->set_type(getQueryType(query.base(), query.size())); |
| Mike Yu | cb2bb7c | 2019-11-22 20:42:13 +0800 | [diff] [blame] | 119 | dnsQueryEvent->set_connected(connectTriggered); |
| lifr | 9498178 | 2019-05-17 21:15:19 +0800 | [diff] [blame] | 120 | |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 121 | switch (code) { |
| 122 | // These response codes are valid responses and not expected to |
| 123 | // change if another server is queried. |
| 124 | case DnsTlsTransport::Response::success: |
| lifr | 9498178 | 2019-05-17 21:15:19 +0800 | [diff] [blame] | 125 | dnsQueryEvent->set_rcode( |
| 126 | static_cast<NsRcode>(reinterpret_cast<HEADER*>(ans.base())->rcode)); |
| Mike Yu | e655b1d | 2019-08-28 17:49:59 +0800 | [diff] [blame] | 127 | resolv_stats_add(statp->netid, IPSockAddr::toIPSockAddr(server.ss), dnsQueryEvent); |
| lifr | d4d9fbb | 2019-07-31 20:18:35 +0800 | [diff] [blame] | 128 | return code; |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 129 | case DnsTlsTransport::Response::limit_error: |
| lifr | d4d9fbb | 2019-07-31 20:18:35 +0800 | [diff] [blame] | 130 | dnsQueryEvent->set_rcode(NS_R_INTERNAL_ERROR); |
| Mike Yu | e655b1d | 2019-08-28 17:49:59 +0800 | [diff] [blame] | 131 | resolv_stats_add(statp->netid, IPSockAddr::toIPSockAddr(server.ss), dnsQueryEvent); |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 132 | return code; |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 133 | // These response codes might differ when trying other servers, so |
| 134 | // keep iterating to see if we can get a different (better) result. |
| 135 | case DnsTlsTransport::Response::network_error: |
| lifr | 9498178 | 2019-05-17 21:15:19 +0800 | [diff] [blame] | 136 | // Sync from res_tls_send in res_send.cpp |
| 137 | dnsQueryEvent->set_rcode(NS_R_TIMEOUT); |
| Mike Yu | e655b1d | 2019-08-28 17:49:59 +0800 | [diff] [blame] | 138 | resolv_stats_add(statp->netid, IPSockAddr::toIPSockAddr(server.ss), dnsQueryEvent); |
| 139 | break; |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 140 | case DnsTlsTransport::Response::internal_error: |
| lifr | d4d9fbb | 2019-07-31 20:18:35 +0800 | [diff] [blame] | 141 | dnsQueryEvent->set_rcode(NS_R_INTERNAL_ERROR); |
| Mike Yu | e655b1d | 2019-08-28 17:49:59 +0800 | [diff] [blame] | 142 | resolv_stats_add(statp->netid, IPSockAddr::toIPSockAddr(server.ss), dnsQueryEvent); |
| 143 | break; |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 144 | // No "default" statement. |
| 145 | } |
| 146 | } |
| 147 | |
| 148 | return code; |
| 149 | } |
| 150 | |
| 151 | DnsTlsTransport::Response DnsTlsDispatcher::query(const DnsTlsServer& server, unsigned mark, |
| Mike Yu | cb2bb7c | 2019-11-22 20:42:13 +0800 | [diff] [blame] | 152 | const Slice query, const Slice ans, int* resplen, |
| 153 | bool* connectTriggered) { |
| Mike Yu | e9b78d8 | 2020-05-20 20:58:49 +0800 | [diff] [blame] | 154 | // TODO: This can cause the resolver to create multiple connections to the same DoT server |
| 155 | // merely due to different mark, such as the bit explicitlySelected unset. |
| 156 | // See if we can save them and just create one connection for one DoT server. |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 157 | const Key key = std::make_pair(mark, server); |
| 158 | Transport* xport; |
| 159 | { |
| 160 | std::lock_guard guard(sLock); |
| 161 | auto it = mStore.find(key); |
| 162 | if (it == mStore.end()) { |
| 163 | xport = new Transport(server, mark, mFactory.get()); |
| 164 | mStore[key].reset(xport); |
| 165 | } else { |
| 166 | xport = it->second.get(); |
| 167 | } |
| 168 | ++xport->useCount; |
| 169 | } |
| 170 | |
| Mike Yu | 568ed6c | 2020-07-01 12:02:14 +0800 | [diff] [blame] | 171 | // Don't call this function and hold sLock at the same time because of the following reason: |
| 172 | // TLS handshake requires a lock which is also needed by this function, if the handshake gets |
| 173 | // stuck, this function also gets blocked. |
| 174 | const int connectCounter = xport->transport.getConnectCounter(); |
| 175 | |
| chenbruce | aff8584 | 2019-05-31 15:46:42 +0800 | [diff] [blame] | 176 | LOG(DEBUG) << "Sending query of length " << query.size(); |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 177 | auto res = xport->transport.query(query); |
| chenbruce | aff8584 | 2019-05-31 15:46:42 +0800 | [diff] [blame] | 178 | LOG(DEBUG) << "Awaiting response"; |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 179 | const auto& result = res.get(); |
| Mike Yu | 568ed6c | 2020-07-01 12:02:14 +0800 | [diff] [blame] | 180 | *connectTriggered = (xport->transport.getConnectCounter() > connectCounter); |
| 181 | |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 182 | DnsTlsTransport::Response code = result.code; |
| 183 | if (code == DnsTlsTransport::Response::success) { |
| 184 | if (result.response.size() > ans.size()) { |
| chenbruce | aff8584 | 2019-05-31 15:46:42 +0800 | [diff] [blame] | 185 | LOG(DEBUG) << "Response too large: " << result.response.size() << " > " << ans.size(); |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 186 | code = DnsTlsTransport::Response::limit_error; |
| 187 | } else { |
| chenbruce | aff8584 | 2019-05-31 15:46:42 +0800 | [diff] [blame] | 188 | LOG(DEBUG) << "Got response successfully"; |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 189 | *resplen = result.response.size(); |
| 190 | netdutils::copy(ans, netdutils::makeSlice(result.response)); |
| 191 | } |
| 192 | } else { |
| chenbruce | aff8584 | 2019-05-31 15:46:42 +0800 | [diff] [blame] | 193 | LOG(DEBUG) << "Query failed: " << (unsigned int)code; |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 194 | } |
| 195 | |
| 196 | auto now = std::chrono::steady_clock::now(); |
| 197 | { |
| 198 | std::lock_guard guard(sLock); |
| Mike Yu | bab3daa | 2018-10-19 22:11:43 +0800 | [diff] [blame] | 199 | --xport->useCount; |
| 200 | xport->lastUsed = now; |
| 201 | cleanup(now); |
| 202 | } |
| 203 | return code; |
| 204 | } |
| 205 | |
| 206 | // This timeout effectively controls how long to keep SSL session tickets. |
| 207 | static constexpr std::chrono::minutes IDLE_TIMEOUT(5); |
| 208 | void DnsTlsDispatcher::cleanup(std::chrono::time_point<std::chrono::steady_clock> now) { |
| 209 | // To avoid scanning mStore after every query, return early if a cleanup has been |
| 210 | // performed recently. |
| 211 | if (now - mLastCleanup < IDLE_TIMEOUT) { |
| 212 | return; |
| 213 | } |
| 214 | for (auto it = mStore.begin(); it != mStore.end();) { |
| 215 | auto& s = it->second; |
| 216 | if (s->useCount == 0 && now - s->lastUsed > IDLE_TIMEOUT) { |
| 217 | it = mStore.erase(it); |
| 218 | } else { |
| 219 | ++it; |
| 220 | } |
| 221 | } |
| 222 | mLastCleanup = now; |
| 223 | } |
| 224 | |
| 225 | } // end of namespace net |
| 226 | } // end of namespace android |