Tyler Wear | 7238821 | 2021-09-09 14:49:02 -0700 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (C) 2021 The Android Open Source Project |
| 3 | * |
| 4 | * Licensed under the Apache License, Version 2.0 (the "License"); |
| 5 | * you may not use this file except in compliance with the License. |
| 6 | * You may obtain a copy of the License at |
| 7 | * |
| 8 | * http://www.apache.org/licenses/LICENSE-2.0 |
| 9 | * |
| 10 | * Unless required by applicable law or agreed to in writing, software |
| 11 | * distributed under the License is distributed on an "AS IS" BASIS, |
| 12 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 13 | * See the License for the specific language governing permissions and |
| 14 | * limitations under the License. |
| 15 | */ |
| 16 | |
Maciej Żenczykowski | 11141da | 2024-03-15 18:21:33 -0700 | [diff] [blame] | 17 | // The resulting .o needs to load on Android T+ |
Maciej Żenczykowski | 4e4f872 | 2024-06-15 06:38:08 -0700 | [diff] [blame] | 18 | #define BPFLOADER_MIN_VER BPFLOADER_MAINLINE_T_VERSION |
Maciej Żenczykowski | acebffb | 2022-05-16 16:05:15 -0700 | [diff] [blame] | 19 | |
Maciej Żenczykowski | 85c9c99 | 2024-08-16 17:57:36 -0700 | [diff] [blame] | 20 | #include "bpf_net_helpers.h" |
Ken Chen | 74ff3ee | 2022-07-14 16:46:39 +0800 | [diff] [blame] | 21 | #include "dscpPolicy.h" |
Tyler Wear | 7238821 | 2021-09-09 14:49:02 -0700 | [diff] [blame] | 22 | |
// Low two bits of the IPv4 TOS byte (the ECN field).
#define ECN_MASK 3
// Builds a TOS byte from a DSCP value (placed in the upper six bits) and the ECN bits of an
// existing TOS byte. The whole expansion is parenthesized so the macro can be embedded in a
// larger expression without operator-precedence surprises.
#define UPDATE_TOS(dscp, tos) (((dscp) << 2) | ((tos) & ECN_MASK))
Tyler Wear | 11f494f | 2022-06-14 16:04:49 -0700 | [diff] [blame] | 25 | |
// Cache of the most recent policy decision per socket, keyed by the 64-bit socket cookie.
// match_policy() consults it before scanning the policy tables and writes the scan result back.
DEFINE_BPF_MAP_GRW(socket_policy_cache_map, HASH, uint64_t, RuleEntry, CACHE_MAP_SIZE, AID_SYSTEM)

// Policy tables scanned by match_policy(), one per IP family, indexed 0..MAX_POLICIES-1.
// NOTE(review): presumably filled in from userspace; this file only reads them — confirm.
DEFINE_BPF_MAP_GRW(ipv4_dscp_policies_map, ARRAY, uint32_t, DscpPolicy, MAX_POLICIES, AID_SYSTEM)
DEFINE_BPF_MAP_GRW(ipv6_dscp_policies_map, ARRAY, uint32_t, DscpPolicy, MAX_POLICIES, AID_SYSTEM)
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 30 | |
Patrick Rohr | 7f325cc | 2022-07-25 10:15:02 -0700 | [diff] [blame] | 31 | static inline __always_inline void match_policy(struct __sk_buff* skb, bool ipv4) { |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 32 | void* data = (void*)(long)skb->data; |
| 33 | const void* data_end = (void*)(long)skb->data_end; |
| 34 | |
Patrick Rohr | 7f325cc | 2022-07-25 10:15:02 -0700 | [diff] [blame] | 35 | const int l2_header_size = sizeof(struct ethhdr); |
| 36 | struct ethhdr* eth = data; |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 37 | |
| 38 | if (data + l2_header_size > data_end) return; |
| 39 | |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 40 | int hdr_size = 0; |
Tyler Wear | 7238821 | 2021-09-09 14:49:02 -0700 | [diff] [blame] | 41 | |
| 42 | // used for map lookup |
| 43 | uint64_t cookie = bpf_get_socket_cookie(skb); |
Tyler Wear | 11f494f | 2022-06-14 16:04:49 -0700 | [diff] [blame] | 44 | if (!cookie) return; |
Tyler Wear | 7238821 | 2021-09-09 14:49:02 -0700 | [diff] [blame] | 45 | |
Maciej Żenczykowski | 640752b | 2022-08-09 23:02:57 +0000 | [diff] [blame] | 46 | __be16 sport = 0; |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 47 | uint16_t dport = 0; |
Tyler Wear | 11f494f | 2022-06-14 16:04:49 -0700 | [diff] [blame] | 48 | uint8_t protocol = 0; // TODO: Use are reserved value? Or int (-1) and cast to uint below? |
Tyler Wear | 9228105 | 2022-06-22 15:32:14 -0700 | [diff] [blame] | 49 | struct in6_addr src_ip = {}; |
| 50 | struct in6_addr dst_ip = {}; |
Maciej Żenczykowski | 242af39 | 2022-08-22 09:11:10 +0000 | [diff] [blame] | 51 | uint8_t tos = 0; // Only used for IPv4 |
| 52 | __be32 old_first_be32 = 0; // Only used for IPv6 |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 53 | if (ipv4) { |
Patrick Rohr | 7f325cc | 2022-07-25 10:15:02 -0700 | [diff] [blame] | 54 | const struct iphdr* const iph = (void*)(eth + 1); |
Tyler Wear | 11f494f | 2022-06-14 16:04:49 -0700 | [diff] [blame] | 55 | hdr_size = l2_header_size + sizeof(struct iphdr); |
Tyler Wear | 7238821 | 2021-09-09 14:49:02 -0700 | [diff] [blame] | 56 | // Must have ipv4 header |
Tyler Wear | 11f494f | 2022-06-14 16:04:49 -0700 | [diff] [blame] | 57 | if (data + hdr_size > data_end) return; |
Tyler Wear | 7238821 | 2021-09-09 14:49:02 -0700 | [diff] [blame] | 58 | |
| 59 | // IP version must be 4 |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 60 | if (iph->version != 4) return; |
Tyler Wear | 7238821 | 2021-09-09 14:49:02 -0700 | [diff] [blame] | 61 | |
| 62 | // We cannot handle IP options, just standard 20 byte == 5 dword minimal IPv4 header |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 63 | if (iph->ihl != 5) return; |
Tyler Wear | 7238821 | 2021-09-09 14:49:02 -0700 | [diff] [blame] | 64 | |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 65 | // V4 mapped address in in6_addr sets 10/11 position to 0xff. |
Tyler Wear | 9228105 | 2022-06-22 15:32:14 -0700 | [diff] [blame] | 66 | src_ip.s6_addr32[2] = htonl(0x0000ffff); |
| 67 | dst_ip.s6_addr32[2] = htonl(0x0000ffff); |
Tyler Wear | 7238821 | 2021-09-09 14:49:02 -0700 | [diff] [blame] | 68 | |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 69 | // Copy IPv4 address into in6_addr for easy comparison below. |
Tyler Wear | 9228105 | 2022-06-22 15:32:14 -0700 | [diff] [blame] | 70 | src_ip.s6_addr32[3] = iph->saddr; |
| 71 | dst_ip.s6_addr32[3] = iph->daddr; |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 72 | protocol = iph->protocol; |
| 73 | tos = iph->tos; |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 74 | } else { |
Patrick Rohr | 7f325cc | 2022-07-25 10:15:02 -0700 | [diff] [blame] | 75 | struct ipv6hdr* ip6h = (void*)(eth + 1); |
Tyler Wear | 11f494f | 2022-06-14 16:04:49 -0700 | [diff] [blame] | 76 | hdr_size = l2_header_size + sizeof(struct ipv6hdr); |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 77 | // Must have ipv6 header |
Tyler Wear | 11f494f | 2022-06-14 16:04:49 -0700 | [diff] [blame] | 78 | if (data + hdr_size > data_end) return; |
Tyler Wear | 7238821 | 2021-09-09 14:49:02 -0700 | [diff] [blame] | 79 | |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 80 | if (ip6h->version != 6) return; |
Tyler Wear | 7238821 | 2021-09-09 14:49:02 -0700 | [diff] [blame] | 81 | |
Tyler Wear | 9228105 | 2022-06-22 15:32:14 -0700 | [diff] [blame] | 82 | src_ip = ip6h->saddr; |
| 83 | dst_ip = ip6h->daddr; |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 84 | protocol = ip6h->nexthdr; |
Maciej Żenczykowski | 242af39 | 2022-08-22 09:11:10 +0000 | [diff] [blame] | 85 | old_first_be32 = *(__be32*)ip6h; |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 86 | } |
Tyler Wear | 7238821 | 2021-09-09 14:49:02 -0700 | [diff] [blame] | 87 | |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 88 | switch (protocol) { |
| 89 | case IPPROTO_UDP: |
Tyler Wear | 11f494f | 2022-06-14 16:04:49 -0700 | [diff] [blame] | 90 | case IPPROTO_UDPLITE: { |
| 91 | struct udphdr* udp; |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 92 | udp = data + hdr_size; |
| 93 | if ((void*)(udp + 1) > data_end) return; |
| 94 | sport = udp->source; |
Maciej Żenczykowski | 640752b | 2022-08-09 23:02:57 +0000 | [diff] [blame] | 95 | dport = ntohs(udp->dest); |
Tyler Wear | 11f494f | 2022-06-14 16:04:49 -0700 | [diff] [blame] | 96 | } break; |
| 97 | case IPPROTO_TCP: { |
| 98 | struct tcphdr* tcp; |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 99 | tcp = data + hdr_size; |
| 100 | if ((void*)(tcp + 1) > data_end) return; |
| 101 | sport = tcp->source; |
Maciej Żenczykowski | 640752b | 2022-08-09 23:02:57 +0000 | [diff] [blame] | 102 | dport = ntohs(tcp->dest); |
Tyler Wear | 11f494f | 2022-06-14 16:04:49 -0700 | [diff] [blame] | 103 | } break; |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 104 | default: |
| 105 | return; |
| 106 | } |
| 107 | |
Maciej Żenczykowski | f75b7e1 | 2022-07-27 12:56:01 +0000 | [diff] [blame] | 108 | RuleEntry* existing_rule = bpf_socket_policy_cache_map_lookup_elem(&cookie); |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 109 | |
Maciej Żenczykowski | 1feaa43 | 2022-07-29 21:17:07 +0000 | [diff] [blame] | 110 | if (existing_rule && |
| 111 | v6_equal(src_ip, existing_rule->src_ip) && |
| 112 | v6_equal(dst_ip, existing_rule->dst_ip) && |
| 113 | skb->ifindex == existing_rule->ifindex && |
| 114 | sport == existing_rule->src_port && |
| 115 | dport == existing_rule->dst_port && |
| 116 | protocol == existing_rule->proto) { |
Maciej Żenczykowski | d7b92c0 | 2022-07-27 19:57:15 +0000 | [diff] [blame] | 117 | if (existing_rule->dscp_val < 0) return; |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 118 | if (ipv4) { |
Tyler Wear | 9228105 | 2022-06-22 15:32:14 -0700 | [diff] [blame] | 119 | uint8_t newTos = UPDATE_TOS(existing_rule->dscp_val, tos); |
Maciej Żenczykowski | 85c9c99 | 2024-08-16 17:57:36 -0700 | [diff] [blame] | 120 | bpf_l3_csum_replace(skb, l2_header_size + IP4_OFFSET(check), htons(tos), htons(newTos), |
Tyler Wear | 11f494f | 2022-06-14 16:04:49 -0700 | [diff] [blame] | 121 | sizeof(uint16_t)); |
Maciej Żenczykowski | 85c9c99 | 2024-08-16 17:57:36 -0700 | [diff] [blame] | 122 | bpf_skb_store_bytes(skb, l2_header_size + IP4_OFFSET(tos), &newTos, sizeof(newTos), 0); |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 123 | } else { |
Maciej Żenczykowski | 242af39 | 2022-08-22 09:11:10 +0000 | [diff] [blame] | 124 | __be32 new_first_be32 = |
| 125 | htonl(ntohl(old_first_be32) & 0xF03FFFFF | (existing_rule->dscp_val << 22)); |
| 126 | bpf_skb_store_bytes(skb, l2_header_size, &new_first_be32, sizeof(__be32), |
Tyler Wear | 4e8949b | 2022-06-23 14:15:58 -0700 | [diff] [blame] | 127 | BPF_F_RECOMPUTE_CSUM); |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 128 | } |
| 129 | return; |
| 130 | } |
| 131 | |
| 132 | // Linear scan ipv4_dscp_policies_map since no stored params match skb. |
Maciej Żenczykowski | d7b92c0 | 2022-07-27 19:57:15 +0000 | [diff] [blame] | 133 | int best_score = 0; |
| 134 | int8_t new_dscp = -1; |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 135 | |
| 136 | for (register uint64_t i = 0; i < MAX_POLICIES; i++) { |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 137 | // Using a uint64 in for loop prevents infinite loop during BPF load, |
| 138 | // but the key is uint32, so convert back. |
| 139 | uint32_t key = i; |
| 140 | |
| 141 | DscpPolicy* policy; |
| 142 | if (ipv4) { |
| 143 | policy = bpf_ipv4_dscp_policies_map_lookup_elem(&key); |
| 144 | } else { |
| 145 | policy = bpf_ipv6_dscp_policies_map_lookup_elem(&key); |
Tyler Wear | 7238821 | 2021-09-09 14:49:02 -0700 | [diff] [blame] | 146 | } |
| 147 | |
Maciej Żenczykowski | 1feaa43 | 2022-07-29 21:17:07 +0000 | [diff] [blame] | 148 | // If the policy lookup failed, just continue (this should not ever happen) |
| 149 | if (!policy) continue; |
Tyler Wear | 7238821 | 2021-09-09 14:49:02 -0700 | [diff] [blame] | 150 | |
Maciej Żenczykowski | 1feaa43 | 2022-07-29 21:17:07 +0000 | [diff] [blame] | 151 | // If policy iface index does not match skb, then skip to next policy. |
| 152 | if (policy->ifindex != skb->ifindex) continue; |
Tyler Wear | 7238821 | 2021-09-09 14:49:02 -0700 | [diff] [blame] | 153 | |
Maciej Żenczykowski | 1feaa43 | 2022-07-29 21:17:07 +0000 | [diff] [blame] | 154 | int score = 0; |
| 155 | |
| 156 | if (policy->present_fields & PROTO_MASK_FLAG) { |
| 157 | if (protocol != policy->proto) continue; |
| 158 | score += 0xFFFF; |
| 159 | } |
| 160 | if (policy->present_fields & SRC_IP_MASK_FLAG) { |
| 161 | if (v6_not_equal(src_ip, policy->src_ip)) continue; |
| 162 | score += 0xFFFF; |
| 163 | } |
| 164 | if (policy->present_fields & DST_IP_MASK_FLAG) { |
| 165 | if (v6_not_equal(dst_ip, policy->dst_ip)) continue; |
| 166 | score += 0xFFFF; |
| 167 | } |
| 168 | if (policy->present_fields & SRC_PORT_MASK_FLAG) { |
| 169 | if (sport != policy->src_port) continue; |
| 170 | score += 0xFFFF; |
| 171 | } |
Maciej Żenczykowski | 640752b | 2022-08-09 23:02:57 +0000 | [diff] [blame] | 172 | if (dport < policy->dst_port_start) continue; |
| 173 | if (dport > policy->dst_port_end) continue; |
Maciej Żenczykowski | a44510b | 2022-08-09 14:59:25 +0000 | [diff] [blame] | 174 | score += 0xFFFF + policy->dst_port_start - policy->dst_port_end; |
Maciej Żenczykowski | 1feaa43 | 2022-07-29 21:17:07 +0000 | [diff] [blame] | 175 | |
| 176 | if (score > best_score) { |
Tyler Wear | 9228105 | 2022-06-22 15:32:14 -0700 | [diff] [blame] | 177 | best_score = score; |
Tyler Wear | 9228105 | 2022-06-22 15:32:14 -0700 | [diff] [blame] | 178 | new_dscp = policy->dscp_val; |
Tyler Wear | 7238821 | 2021-09-09 14:49:02 -0700 | [diff] [blame] | 179 | } |
Maciej Żenczykowski | d7b92c0 | 2022-07-27 19:57:15 +0000 | [diff] [blame] | 180 | } |
Tyler Wear | 7238821 | 2021-09-09 14:49:02 -0700 | [diff] [blame] | 181 | |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 182 | RuleEntry value = { |
Tyler Wear | 9228105 | 2022-06-22 15:32:14 -0700 | [diff] [blame] | 183 | .src_ip = src_ip, |
| 184 | .dst_ip = dst_ip, |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 185 | .ifindex = skb->ifindex, |
Tyler Wear | 9228105 | 2022-06-22 15:32:14 -0700 | [diff] [blame] | 186 | .src_port = sport, |
| 187 | .dst_port = dport, |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 188 | .proto = protocol, |
Tyler Wear | 9228105 | 2022-06-22 15:32:14 -0700 | [diff] [blame] | 189 | .dscp_val = new_dscp, |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 190 | }; |
Tyler Wear | 7238821 | 2021-09-09 14:49:02 -0700 | [diff] [blame] | 191 | |
Maciej Żenczykowski | d7b92c0 | 2022-07-27 19:57:15 +0000 | [diff] [blame] | 192 | // Update cache with found policy. |
Maciej Żenczykowski | f75b7e1 | 2022-07-27 12:56:01 +0000 | [diff] [blame] | 193 | bpf_socket_policy_cache_map_update_elem(&cookie, &value, BPF_ANY); |
Tyler Wear | 7238821 | 2021-09-09 14:49:02 -0700 | [diff] [blame] | 194 | |
Maciej Żenczykowski | d7b92c0 | 2022-07-27 19:57:15 +0000 | [diff] [blame] | 195 | if (new_dscp < 0) return; |
| 196 | |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 197 | // Need to store bytes after updating map or program will not load. |
Tyler Wear | 4e8949b | 2022-06-23 14:15:58 -0700 | [diff] [blame] | 198 | if (ipv4) { |
| 199 | uint8_t new_tos = UPDATE_TOS(new_dscp, tos); |
Maciej Żenczykowski | 85c9c99 | 2024-08-16 17:57:36 -0700 | [diff] [blame] | 200 | bpf_l3_csum_replace(skb, l2_header_size + IP4_OFFSET(check), htons(tos), htons(new_tos), 2); |
| 201 | bpf_skb_store_bytes(skb, l2_header_size + IP4_OFFSET(tos), &new_tos, sizeof(new_tos), 0); |
Tyler Wear | 4e8949b | 2022-06-23 14:15:58 -0700 | [diff] [blame] | 202 | } else { |
Maciej Żenczykowski | 242af39 | 2022-08-22 09:11:10 +0000 | [diff] [blame] | 203 | __be32 new_first_be32 = htonl(ntohl(old_first_be32) & 0xF03FFFFF | (new_dscp << 22)); |
| 204 | bpf_skb_store_bytes(skb, l2_header_size, &new_first_be32, sizeof(__be32), |
Tyler Wear | 4e8949b | 2022-06-23 14:15:58 -0700 | [diff] [blame] | 205 | BPF_F_RECOMPUTE_CSUM); |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 206 | } |
| 207 | return; |
| 208 | } |
Tyler Wear | 7238821 | 2021-09-09 14:49:02 -0700 | [diff] [blame] | 209 | |
Tyler Wear | 4e8949b | 2022-06-23 14:15:58 -0700 | [diff] [blame] | 210 | DEFINE_BPF_PROG_KVER("schedcls/set_dscp_ether", AID_ROOT, AID_SYSTEM, schedcls_set_dscp_ether, |
Maciej Żenczykowski | 901c710 | 2023-10-06 15:47:46 -0700 | [diff] [blame] | 211 | KVER_5_15) |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 212 | (struct __sk_buff* skb) { |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 213 | if (skb->pkt_type != PACKET_HOST) return TC_ACT_PIPE; |
| 214 | |
| 215 | if (skb->protocol == htons(ETH_P_IP)) { |
Patrick Rohr | 7f325cc | 2022-07-25 10:15:02 -0700 | [diff] [blame] | 216 | match_policy(skb, true); |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 217 | } else if (skb->protocol == htons(ETH_P_IPV6)) { |
Patrick Rohr | 7f325cc | 2022-07-25 10:15:02 -0700 | [diff] [blame] | 218 | match_policy(skb, false); |
Tyler Wear | 3ad8089 | 2022-02-03 15:14:44 -0800 | [diff] [blame] | 219 | } |
| 220 | |
| 221 | // Always return TC_ACT_PIPE |
| 222 | return TC_ACT_PIPE; |
| 223 | } |
| 224 | |
// License string and criticality tag attached to this BPF object.
// NOTE(review): both macros are defined outside this file; CRITICAL presumably marks the
// object as required for "Connectivity" — confirm against the BPF loader documentation.
LICENSE("Apache 2.0");
CRITICAL("Connectivity");