1 /* SPDX-License-Identifier: GPL-2.0 */ 2 #ifndef __LINUX_NETFILTER_H 3 #define __LINUX_NETFILTER_H 4 5 #include <linux/init.h> 6 #include <linux/skbuff.h> 7 #include <linux/net.h> 8 #include <linux/if.h> 9 #include <linux/in.h> 10 #include <linux/in6.h> 11 #include <linux/wait.h> 12 #include <linux/list.h> 13 #include <linux/static_key.h> 14 #include <linux/netfilter_defs.h> 15 #include <linux/netdevice.h> 16 #include <linux/sockptr.h> 17 #include <net/net_namespace.h> 18 19 static inline int NF_DROP_GETERR(int verdict) 20 { 21 return -(verdict >> NF_VERDICT_QBITS); 22 } 23 24 static inline int nf_inet_addr_cmp(const union nf_inet_addr *a1, 25 const union nf_inet_addr *a2) 26 { 27 #if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64 28 const unsigned long *ul1 = (const unsigned long *)a1; 29 const unsigned long *ul2 = (const unsigned long *)a2; 30 31 return ((ul1[0] ^ ul2[0]) | (ul1[1] ^ ul2[1])) == 0UL; 32 #else 33 return a1->all[0] == a2->all[0] && 34 a1->all[1] == a2->all[1] && 35 a1->all[2] == a2->all[2] && 36 a1->all[3] == a2->all[3]; 37 #endif 38 } 39 40 static inline void nf_inet_addr_mask(const union nf_inet_addr *a1, 41 union nf_inet_addr *result, 42 const union nf_inet_addr *mask) 43 { 44 #if defined(CONFIG_HAVE_EFFICIENT_UNALIGNED_ACCESS) && BITS_PER_LONG == 64 45 const unsigned long *ua = (const unsigned long *)a1; 46 unsigned long *ur = (unsigned long *)result; 47 const unsigned long *um = (const unsigned long *)mask; 48 49 ur[0] = ua[0] & um[0]; 50 ur[1] = ua[1] & um[1]; 51 #else 52 result->all[0] = a1->all[0] & mask->all[0]; 53 result->all[1] = a1->all[1] & mask->all[1]; 54 result->all[2] = a1->all[2] & mask->all[2]; 55 result->all[3] = a1->all[3] & mask->all[3]; 56 #endif 57 } 58 59 int netfilter_init(void); 60 61 struct sk_buff; 62 63 struct nf_hook_ops; 64 65 struct sock; 66 67 struct nf_hook_state { 68 u8 hook; 69 u8 pf; 70 struct net_device *in; 71 struct net_device *out; 72 struct sock *sk; 73 struct net *net; 74 int (*okfn)(struct net *, struct sock *, struct sk_buff *); 75 }; 76 77 typedef unsigned int nf_hookfn(void *priv, 78 struct sk_buff *skb, 79 const struct nf_hook_state *state); 80 enum nf_hook_ops_type { 81 NF_HOOK_OP_UNDEFINED, 82 NF_HOOK_OP_NF_TABLES, 83 NF_HOOK_OP_BPF, 84 }; 85 86 struct nf_hook_ops { 87 /* User fills in from here down. */ 88 nf_hookfn *hook; 89 struct net_device *dev; 90 void *priv; 91 u8 pf; 92 enum nf_hook_ops_type hook_ops_type:8; 93 unsigned int hooknum; 94 /* Hooks are ordered in ascending priority. */ 95 int priority; 96 }; 97 98 struct nf_hook_entry { 99 nf_hookfn *hook; 100 void *priv; 101 }; 102 103 struct nf_hook_entries_rcu_head { 104 struct rcu_head head; 105 void *allocation; 106 }; 107 108 struct nf_hook_entries { 109 u16 num_hook_entries; 110 /* padding */ 111 struct nf_hook_entry hooks[]; 112 113 /* trailer: pointers to original orig_ops of each hook, 114 * followed by rcu_head and scratch space used for freeing 115 * the structure via call_rcu. 116 * 117 * This is not part of struct nf_hook_entry since its only 118 * needed in slow path (hook register/unregister): 119 * const struct nf_hook_ops *orig_ops[] 120 * 121 * For the same reason, we store this at end -- its 122 * only needed when a hook is deleted, not during 123 * packet path processing: 124 * struct nf_hook_entries_rcu_head head 125 */ 126 }; 127 128 #ifdef CONFIG_NETFILTER 129 static inline struct nf_hook_ops **nf_hook_entries_get_hook_ops(const struct nf_hook_entries *e) 130 { 131 unsigned int n = e->num_hook_entries; 132 const void *hook_end; 133 134 hook_end = &e->hooks[n]; /* this is *past* ->hooks[]! */ 135 136 return (struct nf_hook_ops **)hook_end; 137 } 138 139 static inline int 140 nf_hook_entry_hookfn(const struct nf_hook_entry *entry, struct sk_buff *skb, 141 struct nf_hook_state *state) 142 { 143 return entry->hook(entry->priv, skb, state); 144 } 145 146 static inline void nf_hook_state_init(struct nf_hook_state *p, 147 unsigned int hook, 148 u_int8_t pf, 149 struct net_device *indev, 150 struct net_device *outdev, 151 struct sock *sk, 152 struct net *net, 153 int (*okfn)(struct net *, struct sock *, struct sk_buff *)) 154 { 155 p->hook = hook; 156 p->pf = pf; 157 p->in = indev; 158 p->out = outdev; 159 p->sk = sk; 160 p->net = net; 161 p->okfn = okfn; 162 } 163 164 165 166 struct nf_sockopt_ops { 167 struct list_head list; 168 169 u_int8_t pf; 170 171 /* Non-inclusive ranges: use 0/0/NULL to never get called. */ 172 int set_optmin; 173 int set_optmax; 174 int (*set)(struct sock *sk, int optval, sockptr_t arg, 175 unsigned int len); 176 int get_optmin; 177 int get_optmax; 178 int (*get)(struct sock *sk, int optval, void __user *user, int *len); 179 /* Use the module struct to lock set/get code in place */ 180 struct module *owner; 181 }; 182 183 /* Function to register/unregister hook points. */ 184 int nf_register_net_hook(struct net *net, const struct nf_hook_ops *ops); 185 void nf_unregister_net_hook(struct net *net, const struct nf_hook_ops *ops); 186 int nf_register_net_hooks(struct net *net, const struct nf_hook_ops *reg, 187 unsigned int n); 188 void nf_unregister_net_hooks(struct net *net, const struct nf_hook_ops *reg, 189 unsigned int n); 190 191 /* Functions to register get/setsockopt ranges (non-inclusive). You 192 need to check permissions yourself! */ 193 int nf_register_sockopt(struct nf_sockopt_ops *reg); 194 void nf_unregister_sockopt(struct nf_sockopt_ops *reg); 195 196 #ifdef CONFIG_JUMP_LABEL 197 extern struct static_key nf_hooks_needed[NFPROTO_NUMPROTO][NF_MAX_HOOKS]; 198 #endif 199 200 int nf_hook_slow(struct sk_buff *skb, struct nf_hook_state *state, 201 const struct nf_hook_entries *e, unsigned int i); 202 203 void nf_hook_slow_list(struct list_head *head, struct nf_hook_state *state, 204 const struct nf_hook_entries *e); 205 /** 206 * nf_hook - call a netfilter hook 207 * 208 * Returns 1 if the hook has allowed the packet to pass. The function 209 * okfn must be invoked by the caller in this case. Any other return 210 * value indicates the packet has been consumed by the hook. 211 */ 212 static inline int nf_hook(u_int8_t pf, unsigned int hook, struct net *net, 213 struct sock *sk, struct sk_buff *skb, 214 struct net_device *indev, struct net_device *outdev, 215 int (*okfn)(struct net *, struct sock *, struct sk_buff *)) 216 { 217 struct nf_hook_entries *hook_head = NULL; 218 int ret = 1; 219 220 #ifdef CONFIG_JUMP_LABEL 221 if (__builtin_constant_p(pf) && 222 __builtin_constant_p(hook) && 223 !static_key_false(&nf_hooks_needed[pf][hook])) 224 return 1; 225 #endif 226 227 rcu_read_lock(); 228 switch (pf) { 229 case NFPROTO_IPV4: 230 hook_head = rcu_dereference(net->nf.hooks_ipv4[hook]); 231 break; 232 case NFPROTO_IPV6: 233 hook_head = rcu_dereference(net->nf.hooks_ipv6[hook]); 234 break; 235 case NFPROTO_ARP: 236 #ifdef CONFIG_NETFILTER_FAMILY_ARP 237 if (WARN_ON_ONCE(hook >= ARRAY_SIZE(net->nf.hooks_arp))) 238 break; 239 hook_head = rcu_dereference(net->nf.hooks_arp[hook]); 240 #endif 241 break; 242 case NFPROTO_BRIDGE: 243 #ifdef CONFIG_NETFILTER_FAMILY_BRIDGE 244 hook_head = rcu_dereference(net->nf.hooks_bridge[hook]); 245 #endif 246 break; 247 default: 248 WARN_ON_ONCE(1); 249 break; 250 } 251 252 if (hook_head) { 253 struct nf_hook_state state; 254 255 nf_hook_state_init(&state, hook, pf, indev, outdev, 256 sk, net, okfn); 257 258 ret = nf_hook_slow(skb, &state, hook_head, 0); 259 } 260 rcu_read_unlock(); 261 262 return ret; 263 } 264 265 /* Activate hook; either okfn or kfree_skb called, unless a hook 266 returns NF_STOLEN (in which case, it's up to the hook to deal with 267 the consequences). 268 269 Returns -ERRNO if packet dropped. Zero means queued, stolen or 270 accepted. 271 */ 272 273 /* RR: 274 > I don't want nf_hook to return anything because people might forget 275 > about async and trust the return value to mean "packet was ok". 276 277 AK: 278 Just document it clearly, then you can expect some sense from kernel 279 coders :) 280 */ 281 282 static inline int 283 NF_HOOK_COND(uint8_t pf, unsigned int hook, struct net *net, struct sock *sk, 284 struct sk_buff *skb, struct net_device *in, struct net_device *out, 285 int (*okfn)(struct net *, struct sock *, struct sk_buff *), 286 bool cond) 287 { 288 int ret; 289 290 if (!cond || 291 ((ret = nf_hook(pf, hook, net, sk, skb, in, out, okfn)) == 1)) 292 ret = okfn(net, sk, skb); 293 return ret; 294 } 295 296 static inline int 297 NF_HOOK(uint8_t pf, unsigned int hook, struct net *net, struct sock *sk, struct sk_buff *skb, 298 struct net_device *in, struct net_device *out, 299 int (*okfn)(struct net *, struct sock *, struct sk_buff *)) 300 { 301 int ret = nf_hook(pf, hook, net, sk, skb, in, out, okfn); 302 if (ret == 1) 303 ret = okfn(net, sk, skb); 304 return ret; 305 } 306 307 static inline void 308 NF_HOOK_LIST(uint8_t pf, unsigned int hook, struct net *net, struct sock *sk, 309 struct list_head *head, struct net_device *in, struct net_device *out, 310 int (*okfn)(struct net *, struct sock *, struct sk_buff *)) 311 { 312 struct nf_hook_entries *hook_head = NULL; 313 314 #ifdef CONFIG_JUMP_LABEL 315 if (__builtin_constant_p(pf) && 316 __builtin_constant_p(hook) && 317 !static_key_false(&nf_hooks_needed[pf][hook])) 318 return; 319 #endif 320 321 rcu_read_lock(); 322 switch (pf) { 323 case NFPROTO_IPV4: 324 hook_head = rcu_dereference(net->nf.hooks_ipv4[hook]); 325 break; 326 case NFPROTO_IPV6: 327 hook_head = rcu_dereference(net->nf.hooks_ipv6[hook]); 328 break; 329 default: 330 WARN_ON_ONCE(1); 331 break; 332 } 333 334 if (hook_head) { 335 struct nf_hook_state state; 336 337 nf_hook_state_init(&state, hook, pf, in, out, sk, net, okfn); 338 339 nf_hook_slow_list(head, &state, hook_head); 340 } 341 rcu_read_unlock(); 342 } 343 344 /* Call setsockopt() */ 345 int nf_setsockopt(struct sock *sk, u_int8_t pf, int optval, sockptr_t opt, 346 unsigned int len); 347 int nf_getsockopt(struct sock *sk, u_int8_t pf, int optval, char __user *opt, 348 int *len); 349 350 struct flowi; 351 struct nf_queue_entry; 352 353 __sum16 nf_checksum(struct sk_buff *skb, unsigned int hook, 354 unsigned int dataoff, u_int8_t protocol, 355 unsigned short family); 356 357 __sum16 nf_checksum_partial(struct sk_buff *skb, unsigned int hook, 358 unsigned int dataoff, unsigned int len, 359 u_int8_t protocol, unsigned short family); 360 int nf_route(struct net *net, struct dst_entry **dst, struct flowi *fl, 361 bool strict, unsigned short family); 362 int nf_reroute(struct sk_buff *skb, struct nf_queue_entry *entry); 363 364 #include <net/flow.h> 365 366 struct nf_conn; 367 enum nf_nat_manip_type; 368 struct nlattr; 369 enum ip_conntrack_dir; 370 371 struct nf_nat_hook { 372 int (*parse_nat_setup)(struct nf_conn *ct, enum nf_nat_manip_type manip, 373 const struct nlattr *attr); 374 void (*decode_session)(struct sk_buff *skb, struct flowi *fl); 375 unsigned int (*manip_pkt)(struct sk_buff *skb, struct nf_conn *ct, 376 enum nf_nat_manip_type mtype, 377 enum ip_conntrack_dir dir); 378 void (*remove_nat_bysrc)(struct nf_conn *ct); 379 }; 380 381 extern const struct nf_nat_hook __rcu *nf_nat_hook; 382 383 static inline void 384 nf_nat_decode_session(struct sk_buff *skb, struct flowi *fl, u_int8_t family) 385 { 386 #if IS_ENABLED(CONFIG_NF_NAT) 387 const struct nf_nat_hook *nat_hook; 388 389 rcu_read_lock(); 390 nat_hook = rcu_dereference(nf_nat_hook); 391 if (nat_hook && nat_hook->decode_session) 392 nat_hook->decode_session(skb, fl); 393 rcu_read_unlock(); 394 #endif 395 } 396 397 #else /* !CONFIG_NETFILTER */ 398 static inline int 399 NF_HOOK_COND(uint8_t pf, unsigned int hook, struct net *net, struct sock *sk, 400 struct sk_buff *skb, struct net_device *in, struct net_device *out, 401 int (*okfn)(struct net *, struct sock *, struct sk_buff *), 402 bool cond) 403 { 404 return okfn(net, sk, skb); 405 } 406 407 static inline int 408 NF_HOOK(uint8_t pf, unsigned int hook, struct net *net, struct sock *sk, 409 struct sk_buff *skb, struct net_device *in, struct net_device *out, 410 int (*okfn)(struct net *, struct sock *, struct sk_buff *)) 411 { 412 return okfn(net, sk, skb); 413 } 414 415 static inline void 416 NF_HOOK_LIST(uint8_t pf, unsigned int hook, struct net *net, struct sock *sk, 417 struct list_head *head, struct net_device *in, struct net_device *out, 418 int (*okfn)(struct net *, struct sock *, struct sk_buff *)) 419 { 420 /* nothing to do */ 421 } 422 423 static inline int nf_hook(u_int8_t pf, unsigned int hook, struct net *net, 424 struct sock *sk, struct sk_buff *skb, 425 struct net_device *indev, struct net_device *outdev, 426 int (*okfn)(struct net *, struct sock *, struct sk_buff *)) 427 { 428 return 1; 429 } 430 struct flowi; 431 static inline void 432 nf_nat_decode_session(struct sk_buff *skb, struct flowi *fl, u_int8_t family) 433 { 434 } 435 #endif /*CONFIG_NETFILTER*/ 436 437 #if IS_ENABLED(CONFIG_NF_CONNTRACK) 438 #include <linux/netfilter/nf_conntrack_zones_common.h> 439 440 void nf_ct_attach(struct sk_buff *, const struct sk_buff *); 441 void nf_ct_set_closing(struct nf_conntrack *nfct); 442 struct nf_conntrack_tuple; 443 bool nf_ct_get_tuple_skb(struct nf_conntrack_tuple *dst_tuple, 444 const struct sk_buff *skb); 445 #else 446 static inline void nf_ct_attach(struct sk_buff *new, struct sk_buff *skb) {} 447 static inline void nf_ct_set_closing(struct nf_conntrack *nfct) {} 448 struct nf_conntrack_tuple; 449 static inline bool nf_ct_get_tuple_skb(struct nf_conntrack_tuple *dst_tuple, 450 const struct sk_buff *skb) 451 { 452 return false; 453 } 454 #endif 455 456 struct nf_conn; 457 enum ip_conntrack_info; 458 459 struct nf_ct_hook { 460 int (*update)(struct net *net, struct sk_buff *skb); 461 void (*destroy)(struct nf_conntrack *); 462 bool (*get_tuple_skb)(struct nf_conntrack_tuple *, 463 const struct sk_buff *); 464 void (*attach)(struct sk_buff *nskb, const struct sk_buff *skb); 465 void (*set_closing)(struct nf_conntrack *nfct); 466 }; 467 extern const struct nf_ct_hook __rcu *nf_ct_hook; 468 469 struct nlattr; 470 471 struct nfnl_ct_hook { 472 size_t (*build_size)(const struct nf_conn *ct); 473 int (*build)(struct sk_buff *skb, struct nf_conn *ct, 474 enum ip_conntrack_info ctinfo, 475 u_int16_t ct_attr, u_int16_t ct_info_attr); 476 int (*parse)(const struct nlattr *attr, struct nf_conn *ct); 477 int (*attach_expect)(const struct nlattr *attr, struct nf_conn *ct, 478 u32 portid, u32 report); 479 void (*seq_adjust)(struct sk_buff *skb, struct nf_conn *ct, 480 enum ip_conntrack_info ctinfo, s32 off); 481 }; 482 extern const struct nfnl_ct_hook __rcu *nfnl_ct_hook; 483 484 /* 485 * nf_skb_duplicated - TEE target has sent a packet 486 * 487 * When a xtables target sends a packet, the OUTPUT and POSTROUTING 488 * hooks are traversed again, i.e. nft and xtables are invoked recursively. 489 * 490 * This is used by xtables TEE target to prevent the duplicated skb from 491 * being duplicated again. 492 */ 493 DECLARE_PER_CPU(bool, nf_skb_duplicated); 494 495 /* 496 * Contains bitmask of ctnetlink event subscribers, if any. 497 * Can't be pernet due to NETLINK_LISTEN_ALL_NSID setsockopt flag. 498 */ 499 extern u8 nf_ctnetlink_has_listener; 500 #endif /*__LINUX_NETFILTER_H*/ 501