blob: be1a42c83c1915959912363122b8e0a13e6aa3a3 [file] [log] [blame]
Daniel Drowna45056e2012-03-23 10:42:54 -05001/*
2 * Copyright 2012 Daniel Drown
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 *
16 * clatd.c - tun interface setup and main event loop
17 */
junyulaic4e591a2018-11-26 22:36:10 +090018#include <arpa/inet.h>
19#include <errno.h>
20#include <fcntl.h>
Daniel Drowna45056e2012-03-23 10:42:54 -050021#include <poll.h>
22#include <signal.h>
Daniel Drowna45056e2012-03-23 10:42:54 -050023#include <stdio.h>
junyulaic4e591a2018-11-26 22:36:10 +090024#include <stdlib.h>
25#include <string.h>
Daniel Drowna45056e2012-03-23 10:42:54 -050026#include <sys/ioctl.h>
Elliott Hughes3afe9ae2014-07-18 17:25:26 -070027#include <sys/prctl.h>
Daniel Drowna45056e2012-03-23 10:42:54 -050028#include <sys/stat.h>
junyulaic4e591a2018-11-26 22:36:10 +090029#include <sys/types.h>
30#include <time.h>
Daniel Drowna45056e2012-03-23 10:42:54 -050031#include <unistd.h>
Daniel Drowna45056e2012-03-23 10:42:54 -050032
Lorenzo Colittif08c5aa2014-06-03 12:56:38 +090033#include <linux/filter.h>
Daniel Drowna45056e2012-03-23 10:42:54 -050034#include <linux/if.h>
Daniel Drowna45056e2012-03-23 10:42:54 -050035#include <linux/if_ether.h>
Lorenzo Colittif08c5aa2014-06-03 12:56:38 +090036#include <linux/if_packet.h>
junyulaic4e591a2018-11-26 22:36:10 +090037#include <linux/if_tun.h>
Lorenzo Colittif08c5aa2014-06-03 12:56:38 +090038#include <net/if.h>
junyulaic4e591a2018-11-26 22:36:10 +090039#include <sys/uio.h>
Daniel Drowna45056e2012-03-23 10:42:54 -050040
Daniel Drowna45056e2012-03-23 10:42:54 -050041#include "clatd.h"
Maciej Żenczykowskif6ec94e2022-07-12 16:17:33 -070042#include "checksum.h"
Daniel Drowna45056e2012-03-23 10:42:54 -050043#include "config.h"
Daniel Drowna45056e2012-03-23 10:42:54 -050044#include "dump.h"
junyulaic4e591a2018-11-26 22:36:10 +090045#include "getaddr.h"
46#include "logging.h"
junyulaic4e591a2018-11-26 22:36:10 +090047#include "translate.h"
Daniel Drowna45056e2012-03-23 10:42:54 -050048
// Process-wide CLAT configuration. In this file it is read by ipv6_address_changed(),
// send_dad() and event_loop() (ipv6_local_subnet, native_ipv6_interface).
struct clat_config Global_Clatd_Config;

/* 40 bytes IPv6 header - 20 bytes IPv4 header + 8 bytes fragment header */
#define MTU_DELTA 28

// Run flag for event_loop(): the loop iterates while this is non-zero. The packet readers
// clear it when read() returns 0.
volatile sig_atomic_t running = 1;
55
Lorenzo Colitti66deecd2019-01-04 12:27:27 +090056int ipv6_address_changed(const char *interface) {
57 union anyip *interface_ip;
58
59 interface_ip = getinterface_ip(interface, AF_INET6);
60 if (!interface_ip) {
61 logmsg(ANDROID_LOG_ERROR, "Unable to find an IPv6 address on interface %s", interface);
62 return 1;
63 }
64
65 if (!ipv6_prefix_equal(&interface_ip->ip6, &Global_Clatd_Config.ipv6_local_subnet)) {
66 char oldstr[INET6_ADDRSTRLEN];
67 char newstr[INET6_ADDRSTRLEN];
68 inet_ntop(AF_INET6, &Global_Clatd_Config.ipv6_local_subnet, oldstr, sizeof(oldstr));
69 inet_ntop(AF_INET6, &interface_ip->ip6, newstr, sizeof(newstr));
70 logmsg(ANDROID_LOG_INFO, "IPv6 prefix on %s changed: %s -> %s", interface, oldstr, newstr);
71 free(interface_ip);
72 return 1;
73 } else {
74 free(interface_ip);
75 return 0;
76 }
77}
78
Maciej Żenczykowskie6e0c002023-01-18 23:57:35 +000079// reads L3 IPv6 packet from AF_PACKET socket, translates to IPv4, writes to tun
80void process_packet_6_to_4(struct tun_data *tunnel) {
81 uint8_t buf[MAXMTU];
82 ssize_t readlen = read(tunnel->read_fd6, buf, MAXMTU);
Daniel Drowna45056e2012-03-23 10:42:54 -050083
junyulaic4e591a2018-11-26 22:36:10 +090084 if (readlen < 0) {
Lorenzo Colitti49454812015-01-31 19:18:47 +090085 if (errno != EAGAIN) {
Maciej Żenczykowskie6e0c002023-01-18 23:57:35 +000086 logmsg(ANDROID_LOG_WARN, "%s: read error: %s", __func__, strerror(errno));
Lorenzo Colitti49454812015-01-31 19:18:47 +090087 }
Daniel Drowna45056e2012-03-23 10:42:54 -050088 return;
junyulaic4e591a2018-11-26 22:36:10 +090089 } else if (readlen == 0) {
Maciej Żenczykowskie6e0c002023-01-18 23:57:35 +000090 logmsg(ANDROID_LOG_WARN, "%s: packet socket removed?", __func__);
Daniel Drowna45056e2012-03-23 10:42:54 -050091 running = 0;
Lorenzo Colittif08c5aa2014-06-03 12:56:38 +090092 return;
Maciej Żenczykowskie6e0c002023-01-18 23:57:35 +000093 } else if (readlen >= MAXMTU) {
94 logmsg(ANDROID_LOG_WARN, "%s: read truncation - ignoring pkt", __func__);
95 return;
Lorenzo Colittif08c5aa2014-06-03 12:56:38 +090096 }
97
Maciej Żenczykowskie6e0c002023-01-18 23:57:35 +000098 translate_packet(tunnel->fd4, 0 /* to_ipv6 */, buf, readlen);
99}
100
101// reads TUN_PI + L3 IPv4 packet from tun, translates to IPv6, writes to AF_INET6/RAW socket
102void process_packet_4_to_6(struct tun_data *tunnel) {
103 uint8_t buf[PACKETLEN];
104 ssize_t readlen = read(tunnel->fd4, buf, PACKETLEN);
105
106 if (readlen < 0) {
107 if (errno != EAGAIN) {
108 logmsg(ANDROID_LOG_WARN, "%s: read error: %s", __func__, strerror(errno));
109 }
110 return;
111 } else if (readlen == 0) {
112 logmsg(ANDROID_LOG_WARN, "%s: tun interface removed", __func__);
113 running = 0;
114 return;
115 } else if (readlen >= PACKETLEN) {
116 logmsg(ANDROID_LOG_WARN, "%s: read truncation - ignoring pkt", __func__);
Maciej Żenczykowski50303532020-06-02 14:46:45 -0700117 return;
118 }
119
junyulaic4e591a2018-11-26 22:36:10 +0900120 struct tun_pi *tun_header = (struct tun_pi *)buf;
121 if (readlen < (ssize_t)sizeof(*tun_header)) {
Maciej Żenczykowskie6e0c002023-01-18 23:57:35 +0000122 logmsg(ANDROID_LOG_WARN, "%s: short read: got %ld bytes", __func__, readlen);
Lorenzo Colitti9353be22014-12-03 15:18:29 +0900123 return;
Daniel Drowna45056e2012-03-23 10:42:54 -0500124 }
Lorenzo Colittif08c5aa2014-06-03 12:56:38 +0900125
Lorenzo Colitti9353be22014-12-03 15:18:29 +0900126 uint16_t proto = ntohs(tun_header->proto);
127 if (proto != ETH_P_IP) {
128 logmsg(ANDROID_LOG_WARN, "%s: unknown packet type = 0x%x", __func__, proto);
129 return;
130 }
131
junyulaic4e591a2018-11-26 22:36:10 +0900132 if (tun_header->flags != 0) {
Lorenzo Colitti9353be22014-12-03 15:18:29 +0900133 logmsg(ANDROID_LOG_WARN, "%s: unexpected flags = %d", __func__, tun_header->flags);
134 }
135
Maciej Żenczykowski50303532020-06-02 14:46:45 -0700136 uint8_t *packet = (uint8_t *)(tun_header + 1);
Lorenzo Colitti9353be22014-12-03 15:18:29 +0900137 readlen -= sizeof(*tun_header);
Maciej Żenczykowskie6e0c002023-01-18 23:57:35 +0000138 translate_packet(tunnel->write_fd6, 1 /* to_ipv6 */, packet, readlen);
Daniel Drowna45056e2012-03-23 10:42:54 -0500139}
140
Maciej Żenczykowskif6ec94e2022-07-12 16:17:33 -0700141// IPv6 DAD packet format:
142// Ethernet header (if needed) will be added by the kernel:
143// u8[6] src_mac; u8[6] dst_mac '33:33:ff:XX:XX:XX'; be16 ethertype '0x86DD'
144// IPv6 header:
145// be32 0x60000000 - ipv6, tclass 0, flowlabel 0
146// be16 payload_length '32'; u8 nxt_hdr ICMPv6 '58'; u8 hop limit '255'
147// u128 src_ip6 '::'
148// u128 dst_ip6 'ff02::1:ffXX:XXXX'
149// ICMPv6 header:
150// u8 type '135'; u8 code '0'; u16 icmp6 checksum; u32 reserved '0'
151// ICMPv6 neighbour solicitation payload:
152// u128 tgt_ip6
153// ICMPv6 ND options:
154// u8 opt nr '14'; u8 length '1'; u8[6] nonce '6 random bytes'
Maciej Żenczykowskia1cb0f32022-07-19 09:22:58 -0700155void send_dad(int fd, const struct in6_addr* tgt) {
Maciej Żenczykowskif6ec94e2022-07-12 16:17:33 -0700156 struct {
157 struct ip6_hdr ip6h;
158 struct nd_neighbor_solicit ns;
159 uint8_t ns_opt_nr;
160 uint8_t ns_opt_len;
161 uint8_t ns_opt_nonce[6];
162 } dad_pkt = {
163 .ip6h = {
164 .ip6_flow = htonl(6 << 28), // v6, 0 tclass, 0 flowlabel
165 .ip6_plen = htons(sizeof(dad_pkt) - sizeof(struct ip6_hdr)), // payload length, ie. 32
166 .ip6_nxt = IPPROTO_ICMPV6, // 58
167 .ip6_hlim = 255,
168 .ip6_src = {}, // ::
169 .ip6_dst.s6_addr = {
170 0xFF, 0x02, 0, 0,
171 0, 0, 0, 0,
172 0, 0, 0, 1,
173 0xFF, tgt->s6_addr[13], tgt->s6_addr[14], tgt->s6_addr[15],
174 }, // ff02::1:ffXX:XXXX - multicast group address derived from bottom 24-bits of tgt
175 },
176 .ns = {
177 .nd_ns_type = ND_NEIGHBOR_SOLICIT, // 135
178 .nd_ns_code = 0,
179 .nd_ns_cksum = 0, // will be calculated later
180 .nd_ns_reserved = 0,
181 .nd_ns_target = *tgt,
182 },
183 .ns_opt_nr = 14, // icmp6 option 'nonce' from RFC3971
184 .ns_opt_len = 1, // in units of 8 bytes, including option nr and len
Maciej Żenczykowskia1cb0f32022-07-19 09:22:58 -0700185 .ns_opt_nonce = {}, // opt_len *8 - sizeof u8(opt_nr) - sizeof u8(opt_len) = 6 ranodmized bytes
Maciej Żenczykowskif6ec94e2022-07-12 16:17:33 -0700186 };
Maciej Żenczykowskia1cb0f32022-07-19 09:22:58 -0700187 arc4random_buf(&dad_pkt.ns_opt_nonce, sizeof(dad_pkt.ns_opt_nonce));
Maciej Żenczykowskif6ec94e2022-07-12 16:17:33 -0700188
189 // 40 byte IPv6 header + 8 byte ICMPv6 header + 16 byte ipv6 target address + 8 byte nonce option
190 _Static_assert(sizeof(dad_pkt) == 40 + 8 + 16 + 8, "sizeof dad packet != 72");
191
192 // IPv6 header checksum is standard negated 16-bit one's complement sum over the icmpv6 pseudo
193 // header (which includes payload length, nextheader, and src/dst ip) and the icmpv6 payload.
194 //
195 // Src/dst ip immediately prefix the icmpv6 header itself, so can be handled along
196 // with the payload. We thus only need to manually account for payload len & next header.
197 //
198 // The magic '8' is simply the offset of the ip6_src field in the ipv6 header,
199 // ie. we're skipping over the ipv6 version, tclass, flowlabel, payload length, next header
200 // and hop limit fields, because they're not quite where we want them to be.
201 //
202 // ip6_plen is already in network order, while ip6_nxt is a single byte and thus needs htons().
203 uint32_t csum = dad_pkt.ip6h.ip6_plen + htons(dad_pkt.ip6h.ip6_nxt);
204 csum = ip_checksum_add(csum, &dad_pkt.ip6h.ip6_src, sizeof(dad_pkt) - 8);
205 dad_pkt.ns.nd_ns_cksum = ip_checksum_finish(csum);
206
207 const struct sockaddr_in6 dst = {
208 .sin6_family = AF_INET6,
209 .sin6_addr = dad_pkt.ip6h.ip6_dst,
210 .sin6_scope_id = if_nametoindex(Global_Clatd_Config.native_ipv6_interface),
211 };
212
Maciej Żenczykowskia1cb0f32022-07-19 09:22:58 -0700213 sendto(fd, &dad_pkt, sizeof(dad_pkt), 0 /*flags*/, (const struct sockaddr *)&dst, sizeof(dst));
Maciej Żenczykowskif6ec94e2022-07-12 16:17:33 -0700214}
215
Daniel Drowna45056e2012-03-23 10:42:54 -0500216/* function: event_loop
217 * reads packets from the tun network interface and passes them down the stack
junyulaic4e591a2018-11-26 22:36:10 +0900218 * tunnel - tun device data
Daniel Drowna45056e2012-03-23 10:42:54 -0500219 */
Lorenzo Colitti9353be22014-12-03 15:18:29 +0900220void event_loop(struct tun_data *tunnel) {
Maciej Żenczykowskif6ec94e2022-07-12 16:17:33 -0700221 // Apparently some network gear will refuse to perform NS for IPs that aren't DAD'ed,
222 // this would then result in an ipv6-only network with working native ipv6, working
223 // IPv4 via DNS64, but non-functioning IPv4 via CLAT (ie. IPv4 literals + IPv4 only apps).
224 // The kernel itself doesn't do DAD for anycast ips (but does handle IPV6 MLD and handle ND).
225 // So we'll spoof dad here, and yeah, we really should check for a response and in
226 // case of failure pick a different IP. Seeing as 48-bits of the IP are utterly random
227 // (with the other 16 chosen to guarantee checksum neutrality) this seems like a remote
228 // concern...
229 // TODO: actually perform true DAD
Maciej Żenczykowskia1cb0f32022-07-19 09:22:58 -0700230 send_dad(tunnel->write_fd6, &Global_Clatd_Config.ipv6_local_subnet);
Maciej Żenczykowskif6ec94e2022-07-12 16:17:33 -0700231
Daniel Drowna45056e2012-03-23 10:42:54 -0500232 time_t last_interface_poll;
Lorenzo Colittidce3ddf2014-08-25 16:07:12 -0700233 struct pollfd wait_fd[] = {
234 { tunnel->read_fd6, POLLIN, 0 },
235 { tunnel->fd4, POLLIN, 0 },
236 };
Daniel Drowna45056e2012-03-23 10:42:54 -0500237
238 // start the poll timer
239 last_interface_poll = time(NULL);
240
junyulaic4e591a2018-11-26 22:36:10 +0900241 while (running) {
242 if (poll(wait_fd, ARRAY_SIZE(wait_fd), NO_TRAFFIC_INTERFACE_POLL_FREQUENCY * 1000) == -1) {
Bernie Innocenti69dc60d2018-05-14 20:40:49 +0900243 if (errno != EINTR) {
junyulaic4e591a2018-11-26 22:36:10 +0900244 logmsg(ANDROID_LOG_WARN, "event_loop/poll returned an error: %s", strerror(errno));
Daniel Drowna45056e2012-03-23 10:42:54 -0500245 }
246 } else {
Maciej Żenczykowskie6e0c002023-01-18 23:57:35 +0000247 // Call process_packet if the socket has data to be read, but also if an
Lorenzo Colitti9353be22014-12-03 15:18:29 +0900248 // error is waiting. If we don't call read() after getting POLLERR, a
249 // subsequent poll() will return immediately with POLLERR again,
250 // causing this code to spin in a loop. Calling read() will clear the
251 // socket error flag instead.
Maciej Żenczykowskie6e0c002023-01-18 23:57:35 +0000252 if (wait_fd[0].revents) process_packet_6_to_4(tunnel);
253 if (wait_fd[1].revents) process_packet_4_to_6(tunnel);
Daniel Drowna45056e2012-03-23 10:42:54 -0500254 }
255
256 time_t now = time(NULL);
Rocco Yuee4b7da62020-09-02 15:21:41 +0800257 if (now >= (last_interface_poll + INTERFACE_POLL_FREQUENCY)) {
258 last_interface_poll = now;
Maciej Żenczykowskiba667df2020-06-02 01:41:54 -0700259 if (ipv6_address_changed(Global_Clatd_Config.native_ipv6_interface)) {
Lorenzo Colitti66deecd2019-01-04 12:27:27 +0900260 break;
261 }
Daniel Drowna45056e2012-03-23 10:42:54 -0500262 }
263 }
264}