blob: da8f5da18ec8dd140230faac6ca277bb1511dc91 [file] [log] [blame]
/*
 * Copyright (C) 2008 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
Bernie Innocenti51a0e0f2018-10-05 20:24:06 +090016
Lorenzo Colittiac7fefc2014-10-20 17:14:13 +090017#include <map>
18#include <string>
19
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +090020#include <arpa/inet.h>
Daniel Drown0da73fc2012-06-20 16:51:39 -050021#include <errno.h>
Maciej Żenczykowski1c086e52019-03-29 23:13:49 -070022#include <linux/if_arp.h>
Maciej Żenczykowskif4b44fe2019-04-08 16:18:50 -070023#include <linux/if_tun.h>
24#include <linux/ioctl.h>
Maciej Żenczykowskic8c38aa2019-03-29 01:24:51 -070025#include <net/if.h>
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +090026#include <netinet/in.h>
Luke Huang94c43a12019-02-14 19:51:38 +080027#include <spawn.h>
Daniel Drown0da73fc2012-06-20 16:51:39 -050028#include <sys/types.h>
29#include <sys/wait.h>
Luke Huang94c43a12019-02-14 19:51:38 +080030#include <unistd.h>
Daniel Drown0da73fc2012-06-20 16:51:39 -050031
32#define LOG_TAG "ClatdController"
Logan Chien3f461482018-04-23 14:31:32 +080033#include <log/log.h>
Daniel Drown0da73fc2012-06-20 16:51:39 -050034
Maciej Żenczykowski1c086e52019-03-29 23:13:49 -070035#include "ClatdController.h"
Maciej Żenczykowskia1699952019-05-11 17:07:44 -070036#include "InterfaceController.h"
Maciej Żenczykowski1c086e52019-03-29 23:13:49 -070037
38#include "android-base/properties.h"
Maciej Żenczykowskif4b44fe2019-04-08 16:18:50 -070039#include "android-base/scopeguard.h"
Lorenzo Colitti91fd5802019-06-28 19:22:01 +090040#include "android-base/stringprintf.h"
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +090041#include "android-base/unique_fd.h"
Maciej Żenczykowski55262712019-03-29 23:44:56 -070042#include "bpf/BpfMap.h"
43#include "netdbpf/bpf_shared.h"
44#include "netdutils/DumpWriter.h"
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +090045
46extern "C" {
47#include "netutils/checksum.h"
48}
49
Maciej Żenczykowski55262712019-03-29 23:44:56 -070050#include "ClatUtils.h"
Lorenzo Colitti45d3dd02014-06-09 14:09:20 +090051#include "Fwmark.h"
Paul Jensen84c1d032014-05-30 13:29:41 -040052#include "NetdConstants.h"
53#include "NetworkController.h"
Bernie Innocenti189eb502018-10-01 23:10:18 +090054#include "netid_client.h"
Daniel Drown0da73fc2012-06-20 16:51:39 -050055
// Absolute path of the clatd binary that startClatd() hands to posix_spawn().
// constexpr makes the pointer itself immutable (the original was a reseatable `const char*`).
static constexpr const char* kClatdPath = "/system/bin/clatd";
57
// For historical reasons, start with 192.0.0.4, and after that, use all subsequent addresses in
// 192.0.0.0/29 (RFC 7335).
static constexpr const char* kV4AddrString = "192.0.0.4";
// inet_addr() is not constexpr, so this one is initialised at load time. inet_addr() yields the
// address in network byte order.
static const in_addr kV4Addr = {inet_addr(kV4AddrString)};
// Prefix length of the pool that kV4Addr belongs to.
static constexpr int kV4AddrLen = 29;
63
Lorenzo Colitti91fd5802019-06-28 19:22:01 +090064using android::base::StringPrintf;
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +090065using android::base::unique_fd;
Maciej Żenczykowski55262712019-03-29 23:44:56 -070066using android::bpf::BpfMap;
67using android::netdutils::DumpWriter;
68using android::netdutils::ScopedIndent;
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +090069
Lorenzo Colitti7035f222017-02-13 18:29:00 +090070namespace android {
71namespace net {
72
Maciej Żenczykowski35bc6ed2019-12-16 15:39:04 -080073void ClatdController::resetIngressMap() {
74 int netlinkFd = mNetlinkFd.get();
75
76 const auto del = [&netlinkFd](const ClatIngressKey& key,
77 const BpfMap<ClatIngressKey, ClatIngressValue>&) {
78 ALOGW("Removing stale clat config on interface %d.", key.iif);
79 int rv = tcQdiscDelDevClsact(netlinkFd, key.iif);
80 if (rv < 0) ALOGE("tcQdiscDelDevClsact() failure: %s", strerror(-rv));
81 return netdutils::status::ok; // keep on going regardless
82 };
83 auto ret = mClatIngressMap.iterate(del);
84 if (!isOk(ret)) ALOGE("mClatIngressMap.iterate() failure: %s", strerror(ret.code()));
85 ret = mClatIngressMap.clear();
86 if (!isOk(ret)) ALOGE("mClatIngressMap.clear() failure: %s", strerror(ret.code()));
87}
88
Maciej Żenczykowski56280272019-03-30 03:32:51 -070089void ClatdController::init(void) {
90 std::lock_guard guard(mutex);
91
Maciej Żenczykowski1c086e52019-03-29 23:13:49 -070092 // TODO: should refactor into separate function for testability
93 if (bpf::getBpfSupportLevel() == bpf::BpfLevel::NONE) {
94 ALOGI("Pre-4.9 kernel or pre-P api shipping level - disabling clat ebpf.");
95 mClatEbpfMode = ClatEbpfDisabled;
96 return;
97 }
98
99 // We know the device initially shipped with at least P...,
100 // but did it ship with at least Q?
101
102 uint64_t api_level = base::GetUintProperty<uint64_t>("ro.product.first_api_level", 0);
103 if (api_level == 0) {
104 ALOGE("Cannot determine initial API level of the device.");
105 api_level = base::GetUintProperty<uint64_t>("ro.build.version.sdk", 0);
106 }
107
108 // Note: MINIMUM_API_REQUIRED is for eBPF as a whole and is thus P
109 if (api_level > bpf::MINIMUM_API_REQUIRED) {
110 ALOGI("4.9+ kernel and device shipped with Q+ - clat ebpf should work.");
111 mClatEbpfMode = ClatEbpfEnabled;
112 } else {
113 // We cannot guarantee that 4.9-P kernels will include NET_CLS_BPF support.
114 ALOGI("4.9+ kernel and device shipped with P - clat ebpf might work.");
115 mClatEbpfMode = ClatEbpfMaybe;
116 }
117
118 int rv = openNetlinkSocket();
119 if (rv < 0) {
120 ALOGE("openNetlinkSocket() failure: %s", strerror(-rv));
121 mClatEbpfMode = ClatEbpfDisabled;
122 return;
123 }
124 mNetlinkFd.reset(rv);
125
Maciej Żenczykowski0bd8da72019-12-16 15:16:28 -0800126 rv = getClatEgressMapFd();
127 if (rv < 0) {
128 ALOGE("getClatEgressMapFd() failure: %s", strerror(-rv));
129 mClatEbpfMode = ClatEbpfDisabled;
130 mNetlinkFd.reset(-1);
131 return;
132 }
133 mClatEgressMap.reset(rv);
134
Maciej Żenczykowski1c086e52019-03-29 23:13:49 -0700135 rv = getClatIngressMapFd();
136 if (rv < 0) {
137 ALOGE("getClatIngressMapFd() failure: %s", strerror(-rv));
138 mClatEbpfMode = ClatEbpfDisabled;
Maciej Żenczykowski0bd8da72019-12-16 15:16:28 -0800139 mClatEgressMap.reset(-1);
Maciej Żenczykowski1c086e52019-03-29 23:13:49 -0700140 mNetlinkFd.reset(-1);
141 return;
142 }
143 mClatIngressMap.reset(rv);
144
Maciej Żenczykowski35bc6ed2019-12-16 15:39:04 -0800145 resetIngressMap();
Maciej Żenczykowski1c086e52019-03-29 23:13:49 -0700146}
147
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900148bool ClatdController::isIpv4AddressFree(in_addr_t addr) {
149 int s = socket(AF_INET, SOCK_DGRAM | SOCK_CLOEXEC, 0);
150 if (s == -1) {
151 return 0;
152 }
153
154 // Attempt to connect to the address. If the connection succeeds and getsockname returns the
155 // same then the address is already assigned to the system and we can't use it.
Nick Desaulniers6b357502019-10-11 09:26:44 -0700156 struct sockaddr_in sin = {
157 .sin_family = AF_INET,
Maciej Żenczykowski268190e2019-10-31 23:47:53 -0700158 .sin_port = htons(53),
Nick Desaulniers6b357502019-10-11 09:26:44 -0700159 .sin_addr = {addr},
160 };
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900161 socklen_t len = sizeof(sin);
162 bool inuse = connect(s, (struct sockaddr*)&sin, sizeof(sin)) == 0 &&
163 getsockname(s, (struct sockaddr*)&sin, &len) == 0 && (size_t)len >= sizeof(sin) &&
164 sin.sin_addr.s_addr == addr;
165
166 close(s);
167 return !inuse;
Lorenzo Colittiac7fefc2014-10-20 17:14:13 +0900168}
Daniel Drown0da73fc2012-06-20 16:51:39 -0500169
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900170// Picks a free IPv4 address, starting from ip and trying all addresses in the prefix in order.
171// ip - the IP address from the configuration file
172// prefixlen - the length of the prefix from which addresses may be selected.
173// returns: the IPv4 address, or INADDR_NONE if no addresses were available
174in_addr_t ClatdController::selectIpv4Address(const in_addr ip, int16_t prefixlen) {
175 // Don't accept prefixes that are too large because we scan addresses one by one.
176 if (prefixlen < 16 || prefixlen > 32) {
177 return INADDR_NONE;
178 }
Lorenzo Colittiac7fefc2014-10-20 17:14:13 +0900179
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900180 // All these are in host byte order.
181 in_addr_t mask = 0xffffffff >> (32 - prefixlen) << (32 - prefixlen);
182 in_addr_t ipv4 = ntohl(ip.s_addr);
183 in_addr_t first_ipv4 = ipv4;
184 in_addr_t prefix = ipv4 & mask;
185
186 // Pick the first IPv4 address in the pool, wrapping around if necessary.
187 // So, for example, 192.0.0.4 -> 192.0.0.5 -> 192.0.0.6 -> 192.0.0.7 -> 192.0.0.0.
188 do {
189 if (isIpv4AddressFreeFunc(htonl(ipv4))) {
190 return htonl(ipv4);
191 }
192 ipv4 = prefix | ((ipv4 + 1) & ~mask);
193 } while (ipv4 != first_ipv4);
194
195 return INADDR_NONE;
196}
197
198// Alters the bits in the IPv6 address to make them checksum neutral with v4 and nat64Prefix.
199void ClatdController::makeChecksumNeutral(in6_addr* v6, const in_addr v4,
200 const in6_addr& nat64Prefix) {
201 // Fill last 8 bytes of IPv6 address with random bits.
202 arc4random_buf(&v6->s6_addr[8], 8);
203
204 // Make the IID checksum-neutral. That is, make it so that:
205 // checksum(Local IPv4 | Remote IPv4) = checksum(Local IPv6 | Remote IPv6)
206 // in other words (because remote IPv6 = NAT64 prefix | Remote IPv4):
207 // checksum(Local IPv4) = checksum(Local IPv6 | NAT64 prefix)
208 // Do this by adjusting the two bytes in the middle of the IID.
209
210 uint16_t middlebytes = (v6->s6_addr[11] << 8) + v6->s6_addr[12];
211
212 uint32_t c1 = ip_checksum_add(0, &v4, sizeof(v4));
213 uint32_t c2 = ip_checksum_add(0, &nat64Prefix, sizeof(nat64Prefix)) +
214 ip_checksum_add(0, v6, sizeof(*v6));
215
216 uint16_t delta = ip_checksum_adjust(middlebytes, c1, c2);
217 v6->s6_addr[11] = delta >> 8;
218 v6->s6_addr[12] = delta & 0xff;
219}
220
221// Picks a random interface ID that is checksum neutral with the IPv4 address and the NAT64 prefix.
222int ClatdController::generateIpv6Address(const char* iface, const in_addr v4,
223 const in6_addr& nat64Prefix, in6_addr* v6) {
224 unique_fd s(socket(AF_INET6, SOCK_DGRAM | SOCK_CLOEXEC, 0));
225 if (s == -1) return -errno;
226
227 if (setsockopt(s, SOL_SOCKET, SO_BINDTODEVICE, iface, strlen(iface) + 1) == -1) {
Luke Huang6d301232018-08-01 14:05:18 +0800228 return -errno;
Daniel Drown0da73fc2012-06-20 16:51:39 -0500229 }
230
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900231 sockaddr_in6 sin6 = {.sin6_family = AF_INET6, .sin6_addr = nat64Prefix};
232 if (connect(s, reinterpret_cast<struct sockaddr*>(&sin6), sizeof(sin6)) == -1) {
233 return -errno;
234 }
235
236 socklen_t len = sizeof(sin6);
237 if (getsockname(s, reinterpret_cast<struct sockaddr*>(&sin6), &len) == -1) {
238 return -errno;
239 }
240
241 *v6 = sin6.sin6_addr;
242
243 if (IN6_IS_ADDR_UNSPECIFIED(v6) || IN6_IS_ADDR_LOOPBACK(v6) || IN6_IS_ADDR_LINKLOCAL(v6) ||
244 IN6_IS_ADDR_SITELOCAL(v6) || IN6_IS_ADDR_ULA(v6)) {
245 return -ENETUNREACH;
246 }
247
248 makeChecksumNeutral(v6, v4, nat64Prefix);
249
250 return 0;
251}
252
Maciej Żenczykowski1c086e52019-03-29 23:13:49 -0700253void ClatdController::maybeStartBpf(const ClatdTracker& tracker) {
254 if (mClatEbpfMode == ClatEbpfDisabled) return;
255
256 int rv = hardwareAddressType(tracker.iface);
257 if (rv < 0) {
258 ALOGE("hardwareAddressType(%s[%d]) failure: %s", tracker.iface, tracker.ifIndex,
259 strerror(-rv));
260 return;
261 }
262
263 bool isEthernet;
264 switch (rv) {
265 case ARPHRD_ETHER:
266 isEthernet = true;
267 break;
268 case ARPHRD_RAWIP: // in Linux 4.14+ rmnet support was upstreamed and this is 519
269 case 530: // this is ARPHRD_RAWIP on some Android 4.9 kernels with rmnet
270 isEthernet = false;
271 break;
272 default:
273 ALOGE("hardwareAddressType(%s[%d]) returned unknown type %d.", tracker.iface,
274 tracker.ifIndex, rv);
275 return;
276 }
277
278 rv = getClatIngressProgFd(isEthernet);
279 if (rv < 0) {
280 ALOGE("getClatIngressProgFd(%d) failure: %s", isEthernet, strerror(-rv));
281 return;
282 }
283 unique_fd progFd(rv);
284
285 ClatIngressKey key = {
286 .iif = tracker.ifIndex,
287 .pfx96 = tracker.pfx96,
288 .local6 = tracker.v6,
289 };
290 ClatIngressValue value = {
Maciej Żenczykowski1c086e52019-03-29 23:13:49 -0700291 // TODO: move all the clat code to eBPF and remove the tun interface entirely.
Maciej Żenczykowski39b0b902019-05-08 00:36:30 -0700292 .oif = tracker.v4ifIndex,
Maciej Żenczykowski1c086e52019-03-29 23:13:49 -0700293 .local4 = tracker.v4,
294 };
295
296 auto ret = mClatIngressMap.writeValue(key, value, BPF_ANY);
297 if (!isOk(ret)) {
298 ALOGE("mClatIngress.Map.writeValue failure: %s", strerror(ret.code()));
299 return;
300 }
301
302 // We do tc setup *after* populating map, so scanning through map
303 // can always be used to tell us what needs cleanup.
304
305 rv = tcQdiscAddDevClsact(mNetlinkFd, tracker.ifIndex);
306 if (rv) {
307 ALOGE("tcQdiscAddDevClsact(%d[%s]) failure: %s", tracker.ifIndex, tracker.iface,
308 strerror(-rv));
309 ret = mClatIngressMap.deleteValue(key);
310 if (!isOk(ret)) ALOGE("mClatIngressMap.deleteValue failure: %s", strerror(ret.code()));
311 return;
312 }
313
Maciej Żenczykowskib140a3a2019-12-15 11:53:46 -0800314 rv = tcFilterAddDevIngressBpf(mNetlinkFd, tracker.ifIndex, progFd, isEthernet);
Maciej Żenczykowski1c086e52019-03-29 23:13:49 -0700315 if (rv) {
316 if ((rv == -ENOENT) && (mClatEbpfMode == ClatEbpfMaybe)) {
Maciej Żenczykowskib140a3a2019-12-15 11:53:46 -0800317 ALOGI("tcFilterAddDevIngressBpf(%d[%s], %d): %s", tracker.ifIndex, tracker.iface,
Maciej Żenczykowski1c086e52019-03-29 23:13:49 -0700318 isEthernet, strerror(-rv));
Maciej Żenczykowskib140a3a2019-12-15 11:53:46 -0800319 } else {
320 ALOGE("tcFilterAddDevIngressBpf(%d[%s], %d) failure: %s", tracker.ifIndex,
321 tracker.iface, isEthernet, strerror(-rv));
Maciej Żenczykowski1c086e52019-03-29 23:13:49 -0700322 }
323 rv = tcQdiscDelDevClsact(mNetlinkFd, tracker.ifIndex);
324 if (rv)
325 ALOGE("tcQdiscDelDevClsact(%d[%s]) failure: %s", tracker.ifIndex, tracker.iface,
326 strerror(-rv));
327 ret = mClatIngressMap.deleteValue(key);
328 if (!isOk(ret)) ALOGE("mClatIngressMap.deleteValue failure: %s", strerror(ret.code()));
329 return;
330 }
331
332 // success
333}
334
Lorenzo Colitti91fd5802019-06-28 19:22:01 +0900335void ClatdController::maybeSetIptablesDropRule(bool add, const char* pfx96Str, const char* v6Str) {
336 if (mClatEbpfMode == ClatEbpfDisabled) return;
337
338 std::string cmd = StringPrintf(
339 "*raw\n"
340 "%s %s -s %s/96 -d %s -j DROP\n"
341 "COMMIT\n",
342 (add ? "-A" : "-D"), LOCAL_RAW_PREROUTING, pfx96Str, v6Str);
343
344 iptablesRestoreFunction(V6, cmd);
345}
346
Maciej Żenczykowski1c086e52019-03-29 23:13:49 -0700347void ClatdController::maybeStopBpf(const ClatdTracker& tracker) {
348 if (mClatEbpfMode == ClatEbpfDisabled) return;
349
350 // No need to remove filter, since we remove qdisc it is attached to,
351 // which automatically removes everything attached to the qdisc.
352 int rv = tcQdiscDelDevClsact(mNetlinkFd, tracker.ifIndex);
353 if (rv < 0)
354 ALOGE("tcQdiscDelDevClsact(%d[%s]) failure: %s", tracker.ifIndex, tracker.iface,
355 strerror(-rv));
356
357 // We cleanup map last, so scanning through map can be used to
358 // determine what still needs cleanup.
359
360 ClatIngressKey key = {
361 .iif = tracker.ifIndex,
362 .pfx96 = tracker.pfx96,
363 .local6 = tracker.v6,
364 };
365
366 auto ret = mClatIngressMap.deleteValue(key);
367 if (!isOk(ret)) ALOGE("mClatIngressMap.deleteValue failure: %s", strerror(ret.code()));
368}
369
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900370// Finds the tracker of the clatd running on interface |interface|, or nullptr if clatd has not been
371// started on |interface|.
372ClatdController::ClatdTracker* ClatdController::getClatdTracker(const std::string& interface) {
373 auto it = mClatdTrackers.find(interface);
374 return (it == mClatdTrackers.end() ? nullptr : &it->second);
375}
376
377// Initializes a ClatdTracker for the specified interface.
Maciej Żenczykowskia56b2e62019-04-24 13:17:18 -0700378int ClatdController::ClatdTracker::init(unsigned networkId, const std::string& interface,
Maciej Żenczykowski4657e512019-05-08 06:35:08 -0700379 const std::string& v4interface,
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900380 const std::string& nat64Prefix) {
Maciej Żenczykowskia56b2e62019-04-24 13:17:18 -0700381 netId = networkId;
Lorenzo Colitti32b2e792015-01-07 15:11:30 +0900382
Lorenzo Colitti32b2e792015-01-07 15:11:30 +0900383 fwmark.netId = netId;
384 fwmark.explicitlySelected = true;
385 fwmark.protectedFromVpn = true;
386 fwmark.permission = PERMISSION_SYSTEM;
387
Lorenzo Colitti32b2e792015-01-07 15:11:30 +0900388 snprintf(fwmarkString, sizeof(fwmarkString), "0x%x", fwmark.intValue);
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900389 snprintf(netIdString, sizeof(netIdString), "%u", netId);
390 strlcpy(iface, interface.c_str(), sizeof(iface));
Maciej Żenczykowskif4b44fe2019-04-08 16:18:50 -0700391 ifIndex = if_nametoindex(iface);
Maciej Żenczykowski4657e512019-05-08 06:35:08 -0700392 strlcpy(v4iface, v4interface.c_str(), sizeof(v4iface));
Maciej Żenczykowskif4b44fe2019-04-08 16:18:50 -0700393 v4ifIndex = if_nametoindex(v4iface);
Lorenzo Colitti32b2e792015-01-07 15:11:30 +0900394
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900395 // Pass in everything that clatd needs: interface, a netid to use for DNS lookups, a fwmark for
396 // outgoing packets, the NAT64 prefix, and the IPv4 and IPv6 addresses.
397 // Validate the prefix and strip off the prefix length.
398 uint8_t family;
399 uint8_t prefixLen;
Maciej Żenczykowski1c06f9c2019-03-29 23:19:19 -0700400 int res = parsePrefix(nat64Prefix.c_str(), &family, &pfx96, sizeof(pfx96), &prefixLen);
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900401 // clatd only supports /96 prefixes.
Maciej Żenczykowski1c06f9c2019-03-29 23:19:19 -0700402 if (res != sizeof(pfx96)) return res;
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900403 if (family != AF_INET6) return -EAFNOSUPPORT;
404 if (prefixLen != 96) return -EINVAL;
Maciej Żenczykowski1c06f9c2019-03-29 23:19:19 -0700405 if (!inet_ntop(AF_INET6, &pfx96, pfx96String, sizeof(pfx96String))) return -errno;
Luke Huang6d301232018-08-01 14:05:18 +0800406
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900407 // Pick an IPv4 address.
408 // TODO: this picks the address based on other addresses that are assigned to interfaces, but
409 // the address is only actually assigned to an interface once clatd starts up. So we could end
410 // up with two clatd instances with the same IPv4 address.
411 // Stop doing this and instead pick a free one from the kV4Addr pool.
Maciej Żenczykowski55cacfb2019-03-30 02:01:35 -0700412 v4 = {selectIpv4Address(kV4Addr, kV4AddrLen)};
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900413 if (v4.s_addr == INADDR_NONE) {
414 ALOGE("No free IPv4 address in %s/%d", kV4AddrString, kV4AddrLen);
415 return -EADDRNOTAVAIL;
416 }
417 if (!inet_ntop(AF_INET, &v4, v4Str, sizeof(v4Str))) return -errno;
418
419 // Generate a checksum-neutral IID.
Maciej Żenczykowski1c06f9c2019-03-29 23:19:19 -0700420 if (generateIpv6Address(iface, v4, pfx96, &v6)) {
421 ALOGE("Unable to find global source address on %s for %s", iface, pfx96String);
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900422 return -EADDRNOTAVAIL;
423 }
424 if (!inet_ntop(AF_INET6, &v6, v6Str, sizeof(v6Str))) return -errno;
425
Maciej Żenczykowski1c06f9c2019-03-29 23:19:19 -0700426 ALOGD("starting clatd on %s v4=%s v6=%s pfx96=%s", iface, v4Str, v6Str, pfx96String);
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900427 return 0;
428}
429
430int ClatdController::startClatd(const std::string& interface, const std::string& nat64Prefix,
431 std::string* v6Str) {
Maciej Żenczykowski56280272019-03-30 03:32:51 -0700432 std::lock_guard guard(mutex);
Maciej Żenczykowskif4b44fe2019-04-08 16:18:50 -0700433
434 // 1. fail if pre-existing tracker already exists
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900435 ClatdTracker* existing = getClatdTracker(interface);
436 if (existing != nullptr) {
437 ALOGE("clatd pid=%d already started on %s", existing->pid, interface.c_str());
Maciej Żenczykowskif4b44fe2019-04-08 16:18:50 -0700438 return -EBUSY;
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900439 }
440
Maciej Żenczykowskif4b44fe2019-04-08 16:18:50 -0700441 // 2. get network id associated with this external interface
Maciej Żenczykowskia56b2e62019-04-24 13:17:18 -0700442 unsigned networkId = mNetCtrl->getNetworkForInterface(interface.c_str());
443 if (networkId == NETID_UNSET) {
444 ALOGE("Interface %s not assigned to any netId", interface.c_str());
Maciej Żenczykowskif4b44fe2019-04-08 16:18:50 -0700445 return -ENODEV;
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900446 }
JP Abgrall69261cb2014-06-19 18:35:24 -0700447
Maciej Żenczykowskif4b44fe2019-04-08 16:18:50 -0700448 // 3. open the tun device in non blocking mode as required by clatd
449 int res = open("/dev/tun", O_RDWR | O_NONBLOCK | O_CLOEXEC);
450 if (res == -1) {
451 res = errno;
452 ALOGE("open of tun device failed (%s)", strerror(res));
453 return -res;
454 }
455 unique_fd tmpTunFd(res);
456
457 // 4. create the v4-... tun interface
Maciej Żenczykowski4657e512019-05-08 06:35:08 -0700458 std::string v4interface("v4-");
459 v4interface += interface;
460
Maciej Żenczykowskif4b44fe2019-04-08 16:18:50 -0700461 struct ifreq ifr = {
462 .ifr_flags = IFF_TUN,
463 };
Maciej Żenczykowski4657e512019-05-08 06:35:08 -0700464 strlcpy(ifr.ifr_name, v4interface.c_str(), sizeof(ifr.ifr_name));
Maciej Żenczykowskif4b44fe2019-04-08 16:18:50 -0700465
466 res = ioctl(tmpTunFd, TUNSETIFF, &ifr, sizeof(ifr));
467 if (res == -1) {
468 res = errno;
469 ALOGE("ioctl(TUNSETIFF) failed (%s)", strerror(res));
470 return -res;
471 }
472
Maciej Żenczykowskia1699952019-05-11 17:07:44 -0700473 // disable IPv6 on it - failing to do so is not a critical error
474 res = InterfaceController::setEnableIPv6(v4interface.c_str(), 0);
475 if (res) ALOGE("setEnableIPv6 %s failed (%s)", v4interface.c_str(), strerror(res));
476
Maciej Żenczykowskif4b44fe2019-04-08 16:18:50 -0700477 // 5. initialize tracker object
Maciej Żenczykowskia56b2e62019-04-24 13:17:18 -0700478 ClatdTracker tracker;
Maciej Żenczykowski4657e512019-05-08 06:35:08 -0700479 int ret = tracker.init(networkId, interface, v4interface, nat64Prefix);
Maciej Żenczykowskia56b2e62019-04-24 13:17:18 -0700480 if (ret) return ret;
481
Maciej Żenczykowskif4b44fe2019-04-08 16:18:50 -0700482 // 6. create a throwaway socket to reserve a file descriptor number
483 res = socket(AF_INET6, SOCK_DGRAM | SOCK_CLOEXEC, 0);
484 if (res == -1) {
485 res = errno;
486 ALOGE("socket(ipv6/udp) failed (%s)", strerror(res));
487 return -res;
488 }
489 unique_fd passedTunFd(res);
490
491 // 7. this is the FD we'll pass to clatd on the cli, so need it as a string
492 char passedTunFdStr[INT32_STRLEN];
493 snprintf(passedTunFdStr, sizeof(passedTunFdStr), "%d", passedTunFd.get());
494
495 // 8. we're going to use this as argv[0] to clatd to make ps output more useful
Lorenzo Colittiac7fefc2014-10-20 17:14:13 +0900496 std::string progname("clatd-");
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900497 progname += tracker.iface;
Daniel Drown0da73fc2012-06-20 16:51:39 -0500498
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900499 // clang-format off
Maciej Żenczykowskif4b44fe2019-04-08 16:18:50 -0700500 const char* args[] = {progname.c_str(),
501 "-i", tracker.iface,
502 "-n", tracker.netIdString,
503 "-m", tracker.fwmarkString,
504 "-p", tracker.pfx96String,
505 "-4", tracker.v4Str,
506 "-6", tracker.v6Str,
507 "-t", passedTunFdStr,
508 nullptr};
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900509 // clang-format on
510
Maciej Żenczykowskif4b44fe2019-04-08 16:18:50 -0700511 // 9. register vfork requirement
512 posix_spawnattr_t attr;
513 res = posix_spawnattr_init(&attr);
514 if (res) {
515 ALOGE("posix_spawnattr_init failed (%s)", strerror(res));
516 return -res;
517 }
518 const android::base::ScopeGuard attrGuard = [&] { posix_spawnattr_destroy(&attr); };
519 res = posix_spawnattr_setflags(&attr, POSIX_SPAWN_USEVFORK);
520 if (res) {
521 ALOGE("posix_spawnattr_setflags failed (%s)", strerror(res));
522 return -res;
523 }
524
525 // 10. register dup2() action: this is what 'clears' the CLOEXEC flag
526 // on the tun fd that we want the child clatd process to inherit
527 // (this will happen after the vfork, and before the execve)
528 posix_spawn_file_actions_t fa;
529 res = posix_spawn_file_actions_init(&fa);
530 if (res) {
531 ALOGE("posix_spawn_file_actions_init failed (%s)", strerror(res));
532 return -res;
533 }
534 const android::base::ScopeGuard faGuard = [&] { posix_spawn_file_actions_destroy(&fa); };
535 res = posix_spawn_file_actions_adddup2(&fa, tmpTunFd, passedTunFd);
536 if (res) {
537 ALOGE("posix_spawn_file_actions_adddup2 failed (%s)", strerror(res));
538 return -res;
539 }
540
Lorenzo Colitti91fd5802019-06-28 19:22:01 +0900541 // 11. If necessary, add the drop rule for iptables.
542 maybeSetIptablesDropRule(true, tracker.pfx96String, tracker.v6Str);
543
544 // 12. actually perform vfork/dup2/execve
Maciej Żenczykowskif4b44fe2019-04-08 16:18:50 -0700545 res = posix_spawn(&tracker.pid, kClatdPath, &fa, &attr, (char* const*)args, nullptr);
Luke Huang40962442019-02-26 11:46:10 +0800546 if (res) {
547 ALOGE("posix_spawn failed (%s)", strerror(res));
Luke Huang6d301232018-08-01 14:05:18 +0800548 return -res;
Daniel Drown0da73fc2012-06-20 16:51:39 -0500549 }
550
Lorenzo Colitti91fd5802019-06-28 19:22:01 +0900551 // 13. configure eBPF offload - if possible
Maciej Żenczykowski1c086e52019-03-29 23:13:49 -0700552 maybeStartBpf(tracker);
553
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900554 mClatdTrackers[interface] = tracker;
555 ALOGD("clatd started on %s", interface.c_str());
Daniel Drown0da73fc2012-06-20 16:51:39 -0500556
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900557 *v6Str = tracker.v6Str;
Daniel Drown0da73fc2012-06-20 16:51:39 -0500558 return 0;
559}
560
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900561int ClatdController::stopClatd(const std::string& interface) {
Maciej Żenczykowski56280272019-03-30 03:32:51 -0700562 std::lock_guard guard(mutex);
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900563 ClatdTracker* tracker = getClatdTracker(interface);
Lorenzo Colittiac7fefc2014-10-20 17:14:13 +0900564
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900565 if (tracker == nullptr) {
Daniel Drown0da73fc2012-06-20 16:51:39 -0500566 ALOGE("clatd already stopped");
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900567 return -ENODEV;
Daniel Drown0da73fc2012-06-20 16:51:39 -0500568 }
569
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900570 ALOGD("Stopping clatd pid=%d on %s", tracker->pid, interface.c_str());
Daniel Drown0da73fc2012-06-20 16:51:39 -0500571
Maciej Żenczykowski1c086e52019-03-29 23:13:49 -0700572 maybeStopBpf(*tracker);
573
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900574 kill(tracker->pid, SIGTERM);
575 waitpid(tracker->pid, nullptr, 0);
Lorenzo Colitti91fd5802019-06-28 19:22:01 +0900576
577 maybeSetIptablesDropRule(false, tracker->pfx96String, tracker->v6Str);
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900578 mClatdTrackers.erase(interface);
Daniel Drown0da73fc2012-06-20 16:51:39 -0500579
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900580 ALOGD("clatd on %s stopped", interface.c_str());
Daniel Drown0da73fc2012-06-20 16:51:39 -0500581
582 return 0;
583}
584
Maciej Żenczykowski1afbd992019-12-16 11:44:14 -0800585void ClatdController::dumpEgress(DumpWriter& dw) {
586 int mapFd = getClatEgressMapFd();
587 if (mapFd < 0) return; // if unsupported just don't dump anything
588 BpfMap<ClatEgressKey, ClatEgressValue> configMap(mapFd);
589
590 ScopedIndent bpfIndent(dw);
591 dw.println("BPF egress map: iif(iface) v4Addr -> v6Addr nat64Prefix oif(iface)");
592
593 ScopedIndent bpfDetailIndent(dw);
594 const auto printClatMap = [&dw](const ClatEgressKey& key, const ClatEgressValue& value,
595 const BpfMap<ClatEgressKey, ClatEgressValue>&) {
596 char iifStr[IFNAMSIZ] = "?";
597 char local4Str[INET_ADDRSTRLEN] = "?";
598 char local6Str[INET6_ADDRSTRLEN] = "?";
599 char pfx96Str[INET6_ADDRSTRLEN] = "?";
600 char oifStr[IFNAMSIZ] = "?";
601
602 if_indextoname(key.iif, iifStr);
603 inet_ntop(AF_INET, &key.local4, local4Str, sizeof(local4Str));
604 inet_ntop(AF_INET6, &value.local6, local6Str, sizeof(local6Str));
605 inet_ntop(AF_INET6, &value.pfx96, pfx96Str, sizeof(pfx96Str));
606 if_indextoname(value.oif, oifStr);
607
608 dw.println("%u(%s) %s -> %s %s/96 %u(%s)", key.iif, iifStr, local4Str, local6Str, pfx96Str,
609 value.oif, oifStr);
610 return netdutils::status::ok;
611 };
612 auto res = configMap.iterateWithValue(printClatMap);
613 if (!isOk(res)) {
614 dw.println("Error printing BPF map: %s", res.msg().c_str());
615 }
616}
617
Maciej Żenczykowski7dffa6f2019-12-16 11:20:44 -0800618void ClatdController::dumpIngress(DumpWriter& dw) {
Maciej Żenczykowskiabb2cbf2019-04-01 01:29:29 -0700619 int mapFd = getClatIngressMapFd();
620 if (mapFd < 0) return; // if unsupported just don't dump anything
621 BpfMap<ClatIngressKey, ClatIngressValue> configMap(mapFd);
Maciej Żenczykowski55262712019-03-29 23:44:56 -0700622
623 ScopedIndent bpfIndent(dw);
624 dw.println("BPF ingress map: iif(iface) nat64Prefix v6Addr -> v4Addr oif(iface)");
625
626 ScopedIndent bpfDetailIndent(dw);
Maciej Żenczykowski55262712019-03-29 23:44:56 -0700627 const auto printClatMap = [&dw](const ClatIngressKey& key, const ClatIngressValue& value,
628 const BpfMap<ClatIngressKey, ClatIngressValue>&) {
629 char iifStr[IFNAMSIZ] = "?";
630 char pfx96Str[INET6_ADDRSTRLEN] = "?";
631 char local6Str[INET6_ADDRSTRLEN] = "?";
632 char local4Str[INET_ADDRSTRLEN] = "?";
633 char oifStr[IFNAMSIZ] = "?";
634
635 if_indextoname(key.iif, iifStr);
636 inet_ntop(AF_INET6, &key.pfx96, pfx96Str, sizeof(pfx96Str));
637 inet_ntop(AF_INET6, &key.local6, local6Str, sizeof(local6Str));
638 inet_ntop(AF_INET, &value.local4, local4Str, sizeof(local4Str));
639 if_indextoname(value.oif, oifStr);
640
641 dw.println("%u(%s) %s/96 %s -> %s %u(%s)", key.iif, iifStr, pfx96Str, local6Str, local4Str,
642 value.oif, oifStr);
643 return netdutils::status::ok;
644 };
645 auto res = configMap.iterateWithValue(printClatMap);
646 if (!isOk(res)) {
647 dw.println("Error printing BPF map: %s", res.msg().c_str());
648 }
649}
650
Maciej Żenczykowski4c262172019-12-16 11:31:24 -0800651void ClatdController::dumpTrackers(DumpWriter& dw) {
652 ScopedIndent trackerIndent(dw);
653 dw.println("Trackers: iif[iface] nat64Prefix v6Addr -> v4Addr v4iif[v4iface] [netId]");
654
655 ScopedIndent trackerDetailIndent(dw);
656 for (const auto& pair : mClatdTrackers) {
657 const ClatdTracker& tracker = pair.second;
658 dw.println("%u[%s] %s/96 %s -> %s %u[%s] [%u]", tracker.ifIndex, tracker.iface,
659 tracker.pfx96String, tracker.v6Str, tracker.v4Str, tracker.v4ifIndex,
660 tracker.v4iface, tracker.netId);
661 }
662}
663
Maciej Żenczykowski7dffa6f2019-12-16 11:20:44 -0800664void ClatdController::dump(DumpWriter& dw) {
665 std::lock_guard guard(mutex);
666
667 ScopedIndent clatdIndent(dw);
668 dw.println("ClatdController");
669
Maciej Żenczykowski4c262172019-12-16 11:31:24 -0800670 dumpTrackers(dw);
Maciej Żenczykowski7dffa6f2019-12-16 11:20:44 -0800671 dumpIngress(dw);
Maciej Żenczykowski1afbd992019-12-16 11:44:14 -0800672 dumpEgress(dw);
Maciej Żenczykowski7dffa6f2019-12-16 11:20:44 -0800673}
674
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900675auto ClatdController::isIpv4AddressFreeFunc = isIpv4AddressFree;
Lorenzo Colitti91fd5802019-06-28 19:22:01 +0900676auto ClatdController::iptablesRestoreFunction = execIptablesRestore;
Lorenzo Colitti7ef8c0f2019-01-11 22:34:58 +0900677
Lorenzo Colitti7035f222017-02-13 18:29:00 +0900678} // namespace net
679} // namespace android