2647b895f4b04946a9f7110831189070991753a3
[platform/kernel/linux-rpi.git] / net / netfilter / nft_ct.c
1 /*
2  * Copyright (c) 2008-2009 Patrick McHardy <kaber@trash.net>
3  * Copyright (c) 2016 Pablo Neira Ayuso <pablo@netfilter.org>
4  *
5  * This program is free software; you can redistribute it and/or modify
6  * it under the terms of the GNU General Public License version 2 as
7  * published by the Free Software Foundation.
8  *
9  * Development of this code funded by Astaro AG (http://www.astaro.com/)
10  */
11
12 #include <linux/kernel.h>
13 #include <linux/init.h>
14 #include <linux/module.h>
15 #include <linux/netlink.h>
16 #include <linux/netfilter.h>
17 #include <linux/netfilter/nf_tables.h>
18 #include <net/netfilter/nf_tables.h>
19 #include <net/netfilter/nf_conntrack.h>
20 #include <net/netfilter/nf_conntrack_acct.h>
21 #include <net/netfilter/nf_conntrack_tuple.h>
22 #include <net/netfilter/nf_conntrack_helper.h>
23 #include <net/netfilter/nf_conntrack_ecache.h>
24 #include <net/netfilter/nf_conntrack_labels.h>
25
/* Private data of one "ct" expression instance. */
struct nft_ct {
	enum nft_ct_keys	key:8;	/* conntrack key to read or write */
	enum ip_conntrack_dir	dir:8;	/* tuple direction; IP_CT_DIR_MAX when none was given */
	union {
		enum nft_registers	dreg:8;	/* destination register (get ops) */
		enum nft_registers	sreg:8;	/* source register (set ops) */
	};
};
34
/* Private data of a ct helper object. */
struct nft_ct_helper_obj  {
	struct nf_conntrack_helper *helper4;	/* helper assigned to IPv4 conntracks, may be NULL */
	struct nf_conntrack_helper *helper6;	/* helper assigned to IPv6 conntracks, may be NULL */
	u8 l4proto;				/* conntrack protocol number the helper is restricted to */
};
40
#ifdef CONFIG_NF_CONNTRACK_ZONES
/* Per-cpu conntrack template that nft_ct_set_zone_eval() attaches to skbs. */
static DEFINE_PER_CPU(struct nf_conn *, nft_ct_pcpu_template);
/* Number of zone-setting expressions currently relying on the templates. */
static unsigned int nft_ct_pcpu_template_refcnt __read_mostly;
#endif
45
46 static u64 nft_ct_get_eval_counter(const struct nf_conn_counter *c,
47                                    enum nft_ct_keys k,
48                                    enum ip_conntrack_dir d)
49 {
50         if (d < IP_CT_DIR_MAX)
51                 return k == NFT_CT_BYTES ? atomic64_read(&c[d].bytes) :
52                                            atomic64_read(&c[d].packets);
53
54         return nft_ct_get_eval_counter(c, k, IP_CT_DIR_ORIGINAL) +
55                nft_ct_get_eval_counter(c, k, IP_CT_DIR_REPLY);
56 }
57
58 static void nft_ct_get_eval(const struct nft_expr *expr,
59                             struct nft_regs *regs,
60                             const struct nft_pktinfo *pkt)
61 {
62         const struct nft_ct *priv = nft_expr_priv(expr);
63         u32 *dest = &regs->data[priv->dreg];
64         enum ip_conntrack_info ctinfo;
65         const struct nf_conn *ct;
66         const struct nf_conn_help *help;
67         const struct nf_conntrack_tuple *tuple;
68         const struct nf_conntrack_helper *helper;
69         unsigned int state;
70
71         ct = nf_ct_get(pkt->skb, &ctinfo);
72
73         switch (priv->key) {
74         case NFT_CT_STATE:
75                 if (ct)
76                         state = NF_CT_STATE_BIT(ctinfo);
77                 else if (ctinfo == IP_CT_UNTRACKED)
78                         state = NF_CT_STATE_UNTRACKED_BIT;
79                 else
80                         state = NF_CT_STATE_INVALID_BIT;
81                 *dest = state;
82                 return;
83         default:
84                 break;
85         }
86
87         if (ct == NULL)
88                 goto err;
89
90         switch (priv->key) {
91         case NFT_CT_DIRECTION:
92                 nft_reg_store8(dest, CTINFO2DIR(ctinfo));
93                 return;
94         case NFT_CT_STATUS:
95                 *dest = ct->status;
96                 return;
97 #ifdef CONFIG_NF_CONNTRACK_MARK
98         case NFT_CT_MARK:
99                 *dest = ct->mark;
100                 return;
101 #endif
102 #ifdef CONFIG_NF_CONNTRACK_SECMARK
103         case NFT_CT_SECMARK:
104                 *dest = ct->secmark;
105                 return;
106 #endif
107         case NFT_CT_EXPIRATION:
108                 *dest = jiffies_to_msecs(nf_ct_expires(ct));
109                 return;
110         case NFT_CT_HELPER:
111                 if (ct->master == NULL)
112                         goto err;
113                 help = nfct_help(ct->master);
114                 if (help == NULL)
115                         goto err;
116                 helper = rcu_dereference(help->helper);
117                 if (helper == NULL)
118                         goto err;
119                 strncpy((char *)dest, helper->name, NF_CT_HELPER_NAME_LEN);
120                 return;
121 #ifdef CONFIG_NF_CONNTRACK_LABELS
122         case NFT_CT_LABELS: {
123                 struct nf_conn_labels *labels = nf_ct_labels_find(ct);
124
125                 if (labels)
126                         memcpy(dest, labels->bits, NF_CT_LABELS_MAX_SIZE);
127                 else
128                         memset(dest, 0, NF_CT_LABELS_MAX_SIZE);
129                 return;
130         }
131 #endif
132         case NFT_CT_BYTES: /* fallthrough */
133         case NFT_CT_PKTS: {
134                 const struct nf_conn_acct *acct = nf_conn_acct_find(ct);
135                 u64 count = 0;
136
137                 if (acct)
138                         count = nft_ct_get_eval_counter(acct->counter,
139                                                         priv->key, priv->dir);
140                 memcpy(dest, &count, sizeof(count));
141                 return;
142         }
143         case NFT_CT_AVGPKT: {
144                 const struct nf_conn_acct *acct = nf_conn_acct_find(ct);
145                 u64 avgcnt = 0, bcnt = 0, pcnt = 0;
146
147                 if (acct) {
148                         pcnt = nft_ct_get_eval_counter(acct->counter,
149                                                        NFT_CT_PKTS, priv->dir);
150                         bcnt = nft_ct_get_eval_counter(acct->counter,
151                                                        NFT_CT_BYTES, priv->dir);
152                         if (pcnt != 0)
153                                 avgcnt = div64_u64(bcnt, pcnt);
154                 }
155
156                 memcpy(dest, &avgcnt, sizeof(avgcnt));
157                 return;
158         }
159         case NFT_CT_L3PROTOCOL:
160                 nft_reg_store8(dest, nf_ct_l3num(ct));
161                 return;
162         case NFT_CT_PROTOCOL:
163                 nft_reg_store8(dest, nf_ct_protonum(ct));
164                 return;
165 #ifdef CONFIG_NF_CONNTRACK_ZONES
166         case NFT_CT_ZONE: {
167                 const struct nf_conntrack_zone *zone = nf_ct_zone(ct);
168                 u16 zoneid;
169
170                 if (priv->dir < IP_CT_DIR_MAX)
171                         zoneid = nf_ct_zone_id(zone, priv->dir);
172                 else
173                         zoneid = zone->id;
174
175                 nft_reg_store16(dest, zoneid);
176                 return;
177         }
178 #endif
179         default:
180                 break;
181         }
182
183         tuple = &ct->tuplehash[priv->dir].tuple;
184         switch (priv->key) {
185         case NFT_CT_SRC:
186                 memcpy(dest, tuple->src.u3.all,
187                        nf_ct_l3num(ct) == NFPROTO_IPV4 ? 4 : 16);
188                 return;
189         case NFT_CT_DST:
190                 memcpy(dest, tuple->dst.u3.all,
191                        nf_ct_l3num(ct) == NFPROTO_IPV4 ? 4 : 16);
192                 return;
193         case NFT_CT_PROTO_SRC:
194                 nft_reg_store16(dest, (__force u16)tuple->src.u.all);
195                 return;
196         case NFT_CT_PROTO_DST:
197                 nft_reg_store16(dest, (__force u16)tuple->dst.u.all);
198                 return;
199         default:
200                 break;
201         }
202         return;
203 err:
204         regs->verdict.code = NFT_BREAK;
205 }
206
207 #ifdef CONFIG_NF_CONNTRACK_ZONES
208 static void nft_ct_set_zone_eval(const struct nft_expr *expr,
209                                  struct nft_regs *regs,
210                                  const struct nft_pktinfo *pkt)
211 {
212         struct nf_conntrack_zone zone = { .dir = NF_CT_DEFAULT_ZONE_DIR };
213         const struct nft_ct *priv = nft_expr_priv(expr);
214         struct sk_buff *skb = pkt->skb;
215         enum ip_conntrack_info ctinfo;
216         u16 value = nft_reg_load16(&regs->data[priv->sreg]);
217         struct nf_conn *ct;
218
219         ct = nf_ct_get(skb, &ctinfo);
220         if (ct) /* already tracked */
221                 return;
222
223         zone.id = value;
224
225         switch (priv->dir) {
226         case IP_CT_DIR_ORIGINAL:
227                 zone.dir = NF_CT_ZONE_DIR_ORIG;
228                 break;
229         case IP_CT_DIR_REPLY:
230                 zone.dir = NF_CT_ZONE_DIR_REPL;
231                 break;
232         default:
233                 break;
234         }
235
236         ct = this_cpu_read(nft_ct_pcpu_template);
237
238         if (likely(atomic_read(&ct->ct_general.use) == 1)) {
239                 nf_ct_zone_add(ct, &zone);
240         } else {
241                 /* previous skb got queued to userspace */
242                 ct = nf_ct_tmpl_alloc(nft_net(pkt), &zone, GFP_ATOMIC);
243                 if (!ct) {
244                         regs->verdict.code = NF_DROP;
245                         return;
246                 }
247         }
248
249         atomic_inc(&ct->ct_general.use);
250         nf_ct_set(skb, ct, IP_CT_NEW);
251 }
252 #endif
253
254 static void nft_ct_set_eval(const struct nft_expr *expr,
255                             struct nft_regs *regs,
256                             const struct nft_pktinfo *pkt)
257 {
258         const struct nft_ct *priv = nft_expr_priv(expr);
259         struct sk_buff *skb = pkt->skb;
260 #ifdef CONFIG_NF_CONNTRACK_MARK
261         u32 value = regs->data[priv->sreg];
262 #endif
263         enum ip_conntrack_info ctinfo;
264         struct nf_conn *ct;
265
266         ct = nf_ct_get(skb, &ctinfo);
267         if (ct == NULL || nf_ct_is_template(ct))
268                 return;
269
270         switch (priv->key) {
271 #ifdef CONFIG_NF_CONNTRACK_MARK
272         case NFT_CT_MARK:
273                 if (ct->mark != value) {
274                         ct->mark = value;
275                         nf_conntrack_event_cache(IPCT_MARK, ct);
276                 }
277                 break;
278 #endif
279 #ifdef CONFIG_NF_CONNTRACK_LABELS
280         case NFT_CT_LABELS:
281                 nf_connlabels_replace(ct,
282                                       &regs->data[priv->sreg],
283                                       &regs->data[priv->sreg],
284                                       NF_CT_LABELS_MAX_SIZE / sizeof(u32));
285                 break;
286 #endif
287 #ifdef CONFIG_NF_CONNTRACK_EVENTS
288         case NFT_CT_EVENTMASK: {
289                 struct nf_conntrack_ecache *e = nf_ct_ecache_find(ct);
290                 u32 ctmask = regs->data[priv->sreg];
291
292                 if (e) {
293                         if (e->ctmask != ctmask)
294                                 e->ctmask = ctmask;
295                         break;
296                 }
297
298                 if (ctmask && !nf_ct_is_confirmed(ct))
299                         nf_ct_ecache_ext_add(ct, ctmask, 0, GFP_ATOMIC);
300                 break;
301         }
302 #endif
303         default:
304                 break;
305         }
306 }
307
/* Netlink attribute policy of the "ct" expression. */
static const struct nla_policy nft_ct_policy[NFTA_CT_MAX + 1] = {
	[NFTA_CT_DREG]		= { .type = NLA_U32 },	/* destination register (get) */
	[NFTA_CT_KEY]		= { .type = NLA_U32 },	/* conntrack key */
	[NFTA_CT_DIRECTION]	= { .type = NLA_U8 },	/* tuple direction */
	[NFTA_CT_SREG]		= { .type = NLA_U32 },	/* source register (set) */
};
314
315 #ifdef CONFIG_NF_CONNTRACK_ZONES
316 static void nft_ct_tmpl_put_pcpu(void)
317 {
318         struct nf_conn *ct;
319         int cpu;
320
321         for_each_possible_cpu(cpu) {
322                 ct = per_cpu(nft_ct_pcpu_template, cpu);
323                 if (!ct)
324                         break;
325                 nf_ct_put(ct);
326                 per_cpu(nft_ct_pcpu_template, cpu) = NULL;
327         }
328 }
329
330 static bool nft_ct_tmpl_alloc_pcpu(void)
331 {
332         struct nf_conntrack_zone zone = { .id = 0 };
333         struct nf_conn *tmp;
334         int cpu;
335
336         if (nft_ct_pcpu_template_refcnt)
337                 return true;
338
339         for_each_possible_cpu(cpu) {
340                 tmp = nf_ct_tmpl_alloc(&init_net, &zone, GFP_KERNEL);
341                 if (!tmp) {
342                         nft_ct_tmpl_put_pcpu();
343                         return false;
344                 }
345
346                 atomic_set(&tmp->ct_general.use, 1);
347                 per_cpu(nft_ct_pcpu_template, cpu) = tmp;
348         }
349
350         return true;
351 }
352 #endif
353
354 static int nft_ct_get_init(const struct nft_ctx *ctx,
355                            const struct nft_expr *expr,
356                            const struct nlattr * const tb[])
357 {
358         struct nft_ct *priv = nft_expr_priv(expr);
359         unsigned int len;
360         int err;
361
362         priv->key = ntohl(nla_get_be32(tb[NFTA_CT_KEY]));
363         priv->dir = IP_CT_DIR_MAX;
364         switch (priv->key) {
365         case NFT_CT_DIRECTION:
366                 if (tb[NFTA_CT_DIRECTION] != NULL)
367                         return -EINVAL;
368                 len = sizeof(u8);
369                 break;
370         case NFT_CT_STATE:
371         case NFT_CT_STATUS:
372 #ifdef CONFIG_NF_CONNTRACK_MARK
373         case NFT_CT_MARK:
374 #endif
375 #ifdef CONFIG_NF_CONNTRACK_SECMARK
376         case NFT_CT_SECMARK:
377 #endif
378         case NFT_CT_EXPIRATION:
379                 if (tb[NFTA_CT_DIRECTION] != NULL)
380                         return -EINVAL;
381                 len = sizeof(u32);
382                 break;
383 #ifdef CONFIG_NF_CONNTRACK_LABELS
384         case NFT_CT_LABELS:
385                 if (tb[NFTA_CT_DIRECTION] != NULL)
386                         return -EINVAL;
387                 len = NF_CT_LABELS_MAX_SIZE;
388                 break;
389 #endif
390         case NFT_CT_HELPER:
391                 if (tb[NFTA_CT_DIRECTION] != NULL)
392                         return -EINVAL;
393                 len = NF_CT_HELPER_NAME_LEN;
394                 break;
395
396         case NFT_CT_L3PROTOCOL:
397         case NFT_CT_PROTOCOL:
398                 /* For compatibility, do not report error if NFTA_CT_DIRECTION
399                  * attribute is specified.
400                  */
401                 len = sizeof(u8);
402                 break;
403         case NFT_CT_SRC:
404         case NFT_CT_DST:
405                 if (tb[NFTA_CT_DIRECTION] == NULL)
406                         return -EINVAL;
407
408                 switch (ctx->afi->family) {
409                 case NFPROTO_IPV4:
410                         len = FIELD_SIZEOF(struct nf_conntrack_tuple,
411                                            src.u3.ip);
412                         break;
413                 case NFPROTO_IPV6:
414                 case NFPROTO_INET:
415                         len = FIELD_SIZEOF(struct nf_conntrack_tuple,
416                                            src.u3.ip6);
417                         break;
418                 default:
419                         return -EAFNOSUPPORT;
420                 }
421                 break;
422         case NFT_CT_PROTO_SRC:
423         case NFT_CT_PROTO_DST:
424                 if (tb[NFTA_CT_DIRECTION] == NULL)
425                         return -EINVAL;
426                 len = FIELD_SIZEOF(struct nf_conntrack_tuple, src.u.all);
427                 break;
428         case NFT_CT_BYTES:
429         case NFT_CT_PKTS:
430         case NFT_CT_AVGPKT:
431                 len = sizeof(u64);
432                 break;
433 #ifdef CONFIG_NF_CONNTRACK_ZONES
434         case NFT_CT_ZONE:
435                 len = sizeof(u16);
436                 break;
437 #endif
438         default:
439                 return -EOPNOTSUPP;
440         }
441
442         if (tb[NFTA_CT_DIRECTION] != NULL) {
443                 priv->dir = nla_get_u8(tb[NFTA_CT_DIRECTION]);
444                 switch (priv->dir) {
445                 case IP_CT_DIR_ORIGINAL:
446                 case IP_CT_DIR_REPLY:
447                         break;
448                 default:
449                         return -EINVAL;
450                 }
451         }
452
453         priv->dreg = nft_parse_register(tb[NFTA_CT_DREG]);
454         err = nft_validate_register_store(ctx, priv->dreg, NULL,
455                                           NFT_DATA_VALUE, len);
456         if (err < 0)
457                 return err;
458
459         err = nf_ct_netns_get(ctx->net, ctx->afi->family);
460         if (err < 0)
461                 return err;
462
463         if (priv->key == NFT_CT_BYTES ||
464             priv->key == NFT_CT_PKTS  ||
465             priv->key == NFT_CT_AVGPKT)
466                 nf_ct_set_acct(ctx->net, true);
467
468         return 0;
469 }
470
471 static void __nft_ct_set_destroy(const struct nft_ctx *ctx, struct nft_ct *priv)
472 {
473         switch (priv->key) {
474 #ifdef CONFIG_NF_CONNTRACK_LABELS
475         case NFT_CT_LABELS:
476                 nf_connlabels_put(ctx->net);
477                 break;
478 #endif
479 #ifdef CONFIG_NF_CONNTRACK_ZONES
480         case NFT_CT_ZONE:
481                 if (--nft_ct_pcpu_template_refcnt == 0)
482                         nft_ct_tmpl_put_pcpu();
483 #endif
484         default:
485                 break;
486         }
487 }
488
489 static int nft_ct_set_init(const struct nft_ctx *ctx,
490                            const struct nft_expr *expr,
491                            const struct nlattr * const tb[])
492 {
493         struct nft_ct *priv = nft_expr_priv(expr);
494         unsigned int len;
495         int err;
496
497         priv->dir = IP_CT_DIR_MAX;
498         priv->key = ntohl(nla_get_be32(tb[NFTA_CT_KEY]));
499         switch (priv->key) {
500 #ifdef CONFIG_NF_CONNTRACK_MARK
501         case NFT_CT_MARK:
502                 if (tb[NFTA_CT_DIRECTION])
503                         return -EINVAL;
504                 len = FIELD_SIZEOF(struct nf_conn, mark);
505                 break;
506 #endif
507 #ifdef CONFIG_NF_CONNTRACK_LABELS
508         case NFT_CT_LABELS:
509                 if (tb[NFTA_CT_DIRECTION])
510                         return -EINVAL;
511                 len = NF_CT_LABELS_MAX_SIZE;
512                 err = nf_connlabels_get(ctx->net, (len * BITS_PER_BYTE) - 1);
513                 if (err)
514                         return err;
515                 break;
516 #endif
517 #ifdef CONFIG_NF_CONNTRACK_ZONES
518         case NFT_CT_ZONE:
519                 if (!nft_ct_tmpl_alloc_pcpu())
520                         return -ENOMEM;
521                 nft_ct_pcpu_template_refcnt++;
522                 len = sizeof(u16);
523                 break;
524 #endif
525 #ifdef CONFIG_NF_CONNTRACK_EVENTS
526         case NFT_CT_EVENTMASK:
527                 if (tb[NFTA_CT_DIRECTION])
528                         return -EINVAL;
529                 len = sizeof(u32);
530                 break;
531 #endif
532         default:
533                 return -EOPNOTSUPP;
534         }
535
536         if (tb[NFTA_CT_DIRECTION]) {
537                 priv->dir = nla_get_u8(tb[NFTA_CT_DIRECTION]);
538                 switch (priv->dir) {
539                 case IP_CT_DIR_ORIGINAL:
540                 case IP_CT_DIR_REPLY:
541                         break;
542                 default:
543                         err = -EINVAL;
544                         goto err1;
545                 }
546         }
547
548         priv->sreg = nft_parse_register(tb[NFTA_CT_SREG]);
549         err = nft_validate_register_load(priv->sreg, len);
550         if (err < 0)
551                 goto err1;
552
553         err = nf_ct_netns_get(ctx->net, ctx->afi->family);
554         if (err < 0)
555                 goto err1;
556
557         return 0;
558
559 err1:
560         __nft_ct_set_destroy(ctx, priv);
561         return err;
562 }
563
564 static void nft_ct_get_destroy(const struct nft_ctx *ctx,
565                                const struct nft_expr *expr)
566 {
567         nf_ct_netns_put(ctx->net, ctx->afi->family);
568 }
569
570 static void nft_ct_set_destroy(const struct nft_ctx *ctx,
571                                const struct nft_expr *expr)
572 {
573         struct nft_ct *priv = nft_expr_priv(expr);
574
575         __nft_ct_set_destroy(ctx, priv);
576         nf_ct_netns_put(ctx->net, ctx->afi->family);
577 }
578
579 static int nft_ct_get_dump(struct sk_buff *skb, const struct nft_expr *expr)
580 {
581         const struct nft_ct *priv = nft_expr_priv(expr);
582
583         if (nft_dump_register(skb, NFTA_CT_DREG, priv->dreg))
584                 goto nla_put_failure;
585         if (nla_put_be32(skb, NFTA_CT_KEY, htonl(priv->key)))
586                 goto nla_put_failure;
587
588         switch (priv->key) {
589         case NFT_CT_SRC:
590         case NFT_CT_DST:
591         case NFT_CT_PROTO_SRC:
592         case NFT_CT_PROTO_DST:
593                 if (nla_put_u8(skb, NFTA_CT_DIRECTION, priv->dir))
594                         goto nla_put_failure;
595                 break;
596         case NFT_CT_BYTES:
597         case NFT_CT_PKTS:
598         case NFT_CT_AVGPKT:
599         case NFT_CT_ZONE:
600                 if (priv->dir < IP_CT_DIR_MAX &&
601                     nla_put_u8(skb, NFTA_CT_DIRECTION, priv->dir))
602                         goto nla_put_failure;
603                 break;
604         default:
605                 break;
606         }
607
608         return 0;
609
610 nla_put_failure:
611         return -1;
612 }
613
614 static int nft_ct_set_dump(struct sk_buff *skb, const struct nft_expr *expr)
615 {
616         const struct nft_ct *priv = nft_expr_priv(expr);
617
618         if (nft_dump_register(skb, NFTA_CT_SREG, priv->sreg))
619                 goto nla_put_failure;
620         if (nla_put_be32(skb, NFTA_CT_KEY, htonl(priv->key)))
621                 goto nla_put_failure;
622
623         switch (priv->key) {
624         case NFT_CT_ZONE:
625                 if (priv->dir < IP_CT_DIR_MAX &&
626                     nla_put_u8(skb, NFTA_CT_DIRECTION, priv->dir))
627                         goto nla_put_failure;
628                 break;
629         default:
630                 break;
631         }
632
633         return 0;
634
635 nla_put_failure:
636         return -1;
637 }
638
/* Forward declaration: the ops tables below point back at the type. */
static struct nft_expr_type nft_ct_type;
/* Operations of a "ct" expression that reads a key into a register. */
static const struct nft_expr_ops nft_ct_get_ops = {
	.type		= &nft_ct_type,
	.size		= NFT_EXPR_SIZE(sizeof(struct nft_ct)),
	.eval		= nft_ct_get_eval,
	.init		= nft_ct_get_init,
	.destroy	= nft_ct_get_destroy,
	.dump		= nft_ct_get_dump,
};
648
/* Operations of a "ct" expression that writes a register into a key. */
static const struct nft_expr_ops nft_ct_set_ops = {
	.type		= &nft_ct_type,
	.size		= NFT_EXPR_SIZE(sizeof(struct nft_ct)),
	.eval		= nft_ct_set_eval,
	.init		= nft_ct_set_init,
	.destroy	= nft_ct_set_destroy,
	.dump		= nft_ct_set_dump,
};
657
658 #ifdef CONFIG_NF_CONNTRACK_ZONES
/*
 * Operations of the zone-setting "ct" expression.  Same as nft_ct_set_ops
 * except for the dedicated eval function.
 */
static const struct nft_expr_ops nft_ct_set_zone_ops = {
	.type		= &nft_ct_type,
	.size		= NFT_EXPR_SIZE(sizeof(struct nft_ct)),
	.eval		= nft_ct_set_zone_eval,
	.init		= nft_ct_set_init,
	.destroy	= nft_ct_set_destroy,
	.dump		= nft_ct_set_dump,
};
667 #endif
668
669 static const struct nft_expr_ops *
670 nft_ct_select_ops(const struct nft_ctx *ctx,
671                     const struct nlattr * const tb[])
672 {
673         if (tb[NFTA_CT_KEY] == NULL)
674                 return ERR_PTR(-EINVAL);
675
676         if (tb[NFTA_CT_DREG] && tb[NFTA_CT_SREG])
677                 return ERR_PTR(-EINVAL);
678
679         if (tb[NFTA_CT_DREG])
680                 return &nft_ct_get_ops;
681
682         if (tb[NFTA_CT_SREG]) {
683 #ifdef CONFIG_NF_CONNTRACK_ZONES
684                 if (nla_get_be32(tb[NFTA_CT_KEY]) == htonl(NFT_CT_ZONE))
685                         return &nft_ct_set_zone_ops;
686 #endif
687                 return &nft_ct_set_ops;
688         }
689
690         return ERR_PTR(-EINVAL);
691 }
692
/*
 * The "ct" expression type.  It has no fixed ops table; select_ops chooses
 * one per expression from the supplied attributes.
 */
static struct nft_expr_type nft_ct_type __read_mostly = {
	.name		= "ct",
	.select_ops	= nft_ct_select_ops,
	.policy		= nft_ct_policy,
	.maxattr	= NFTA_CT_MAX,
	.owner		= THIS_MODULE,
};
700
701 static void nft_notrack_eval(const struct nft_expr *expr,
702                              struct nft_regs *regs,
703                              const struct nft_pktinfo *pkt)
704 {
705         struct sk_buff *skb = pkt->skb;
706         enum ip_conntrack_info ctinfo;
707         struct nf_conn *ct;
708
709         ct = nf_ct_get(pkt->skb, &ctinfo);
710         /* Previously seen (loopback or untracked)?  Ignore. */
711         if (ct || ctinfo == IP_CT_UNTRACKED)
712                 return;
713
714         nf_ct_set(skb, ct, IP_CT_UNTRACKED);
715 }
716
/* Forward declaration: the ops table below points back at the type. */
static struct nft_expr_type nft_notrack_type;
/* "notrack" carries no private data and has neither init nor dump hooks. */
static const struct nft_expr_ops nft_notrack_ops = {
	.type		= &nft_notrack_type,
	.size		= NFT_EXPR_SIZE(0),
	.eval		= nft_notrack_eval,
};

/* The "notrack" expression type, with a single fixed ops table. */
static struct nft_expr_type nft_notrack_type __read_mostly = {
	.name		= "notrack",
	.ops		= &nft_notrack_ops,
	.owner		= THIS_MODULE,
};
729
730 static int nft_ct_helper_obj_init(const struct nft_ctx *ctx,
731                                   const struct nlattr * const tb[],
732                                   struct nft_object *obj)
733 {
734         struct nft_ct_helper_obj *priv = nft_obj_data(obj);
735         struct nf_conntrack_helper *help4, *help6;
736         char name[NF_CT_HELPER_NAME_LEN];
737         int family = ctx->afi->family;
738
739         if (!tb[NFTA_CT_HELPER_NAME] || !tb[NFTA_CT_HELPER_L4PROTO])
740                 return -EINVAL;
741
742         priv->l4proto = nla_get_u8(tb[NFTA_CT_HELPER_L4PROTO]);
743         if (!priv->l4proto)
744                 return -ENOENT;
745
746         nla_strlcpy(name, tb[NFTA_CT_HELPER_NAME], sizeof(name));
747
748         if (tb[NFTA_CT_HELPER_L3PROTO])
749                 family = ntohs(nla_get_be16(tb[NFTA_CT_HELPER_L3PROTO]));
750
751         help4 = NULL;
752         help6 = NULL;
753
754         switch (family) {
755         case NFPROTO_IPV4:
756                 if (ctx->afi->family == NFPROTO_IPV6)
757                         return -EINVAL;
758
759                 help4 = nf_conntrack_helper_try_module_get(name, family,
760                                                            priv->l4proto);
761                 break;
762         case NFPROTO_IPV6:
763                 if (ctx->afi->family == NFPROTO_IPV4)
764                         return -EINVAL;
765
766                 help6 = nf_conntrack_helper_try_module_get(name, family,
767                                                            priv->l4proto);
768                 break;
769         case NFPROTO_NETDEV: /* fallthrough */
770         case NFPROTO_BRIDGE: /* same */
771         case NFPROTO_INET:
772                 help4 = nf_conntrack_helper_try_module_get(name, NFPROTO_IPV4,
773                                                            priv->l4proto);
774                 help6 = nf_conntrack_helper_try_module_get(name, NFPROTO_IPV6,
775                                                            priv->l4proto);
776                 break;
777         default:
778                 return -EAFNOSUPPORT;
779         }
780
781         /* && is intentional; only error if INET found neither ipv4 or ipv6 */
782         if (!help4 && !help6)
783                 return -ENOENT;
784
785         priv->helper4 = help4;
786         priv->helper6 = help6;
787
788         return 0;
789 }
790
791 static void nft_ct_helper_obj_destroy(struct nft_object *obj)
792 {
793         struct nft_ct_helper_obj *priv = nft_obj_data(obj);
794
795         if (priv->helper4)
796                 nf_conntrack_helper_put(priv->helper4);
797         if (priv->helper6)
798                 nf_conntrack_helper_put(priv->helper6);
799 }
800
801 static void nft_ct_helper_obj_eval(struct nft_object *obj,
802                                    struct nft_regs *regs,
803                                    const struct nft_pktinfo *pkt)
804 {
805         const struct nft_ct_helper_obj *priv = nft_obj_data(obj);
806         struct nf_conn *ct = (struct nf_conn *)skb_nfct(pkt->skb);
807         struct nf_conntrack_helper *to_assign = NULL;
808         struct nf_conn_help *help;
809
810         if (!ct ||
811             nf_ct_is_confirmed(ct) ||
812             nf_ct_is_template(ct) ||
813             priv->l4proto != nf_ct_protonum(ct))
814                 return;
815
816         switch (nf_ct_l3num(ct)) {
817         case NFPROTO_IPV4:
818                 to_assign = priv->helper4;
819                 break;
820         case NFPROTO_IPV6:
821                 to_assign = priv->helper6;
822                 break;
823         default:
824                 WARN_ON_ONCE(1);
825                 return;
826         }
827
828         if (!to_assign)
829                 return;
830
831         if (test_bit(IPS_HELPER_BIT, &ct->status))
832                 return;
833
834         help = nf_ct_helper_ext_add(ct, to_assign, GFP_ATOMIC);
835         if (help) {
836                 rcu_assign_pointer(help->helper, to_assign);
837                 set_bit(IPS_HELPER_BIT, &ct->status);
838         }
839 }
840
841 static int nft_ct_helper_obj_dump(struct sk_buff *skb,
842                                   struct nft_object *obj, bool reset)
843 {
844         const struct nft_ct_helper_obj *priv = nft_obj_data(obj);
845         const struct nf_conntrack_helper *helper = priv->helper4;
846         u16 family;
847
848         if (nla_put_string(skb, NFTA_CT_HELPER_NAME, helper->name))
849                 return -1;
850
851         if (nla_put_u8(skb, NFTA_CT_HELPER_L4PROTO, priv->l4proto))
852                 return -1;
853
854         if (priv->helper4 && priv->helper6)
855                 family = NFPROTO_INET;
856         else if (priv->helper6)
857                 family = NFPROTO_IPV6;
858         else
859                 family = NFPROTO_IPV4;
860
861         if (nla_put_be16(skb, NFTA_CT_HELPER_L3PROTO, htons(family)))
862                 return -1;
863
864         return 0;
865 }
866
/* Netlink attribute policy of the ct helper object. */
static const struct nla_policy nft_ct_helper_policy[NFTA_CT_HELPER_MAX + 1] = {
	/* Length limit leaves room for the terminator in the name buffer. */
	[NFTA_CT_HELPER_NAME] = { .type = NLA_STRING,
				  .len = NF_CT_HELPER_NAME_LEN - 1 },
	[NFTA_CT_HELPER_L3PROTO] = { .type = NLA_U16 },
	[NFTA_CT_HELPER_L4PROTO] = { .type = NLA_U8 },
};
873
/* Forward declaration: the ops table below points back at the type. */
static struct nft_object_type nft_ct_helper_obj_type;
/* Operations of the ct helper object. */
static const struct nft_object_ops nft_ct_helper_obj_ops = {
	.type		= &nft_ct_helper_obj_type,
	.size		= sizeof(struct nft_ct_helper_obj),
	.eval		= nft_ct_helper_obj_eval,
	.init		= nft_ct_helper_obj_init,
	.destroy	= nft_ct_helper_obj_destroy,
	.dump		= nft_ct_helper_obj_dump,
};

/* The ct helper object type registered with nf_tables. */
static struct nft_object_type nft_ct_helper_obj_type __read_mostly = {
	.type		= NFT_OBJECT_CT_HELPER,
	.ops		= &nft_ct_helper_obj_ops,
	.maxattr	= NFTA_CT_HELPER_MAX,
	.policy		= nft_ct_helper_policy,
	.owner		= THIS_MODULE,
};
891
892 static int __init nft_ct_module_init(void)
893 {
894         int err;
895
896         BUILD_BUG_ON(NF_CT_LABELS_MAX_SIZE > NFT_REG_SIZE);
897
898         err = nft_register_expr(&nft_ct_type);
899         if (err < 0)
900                 return err;
901
902         err = nft_register_expr(&nft_notrack_type);
903         if (err < 0)
904                 goto err1;
905
906         err = nft_register_obj(&nft_ct_helper_obj_type);
907         if (err < 0)
908                 goto err2;
909
910         return 0;
911
912 err2:
913         nft_unregister_expr(&nft_notrack_type);
914 err1:
915         nft_unregister_expr(&nft_ct_type);
916         return err;
917 }
918
/* Module exit: unregister everything in the reverse order of registration. */
static void __exit nft_ct_module_exit(void)
{
	nft_unregister_obj(&nft_ct_helper_obj_type);
	nft_unregister_expr(&nft_notrack_type);
	nft_unregister_expr(&nft_ct_type);
}
925
/* Module entry and exit points. */
module_init(nft_ct_module_init);
module_exit(nft_ct_module_exit);

/* Module metadata and aliases for the expressions and object type above. */
MODULE_LICENSE("GPL");
MODULE_AUTHOR("Patrick McHardy <kaber@trash.net>");
MODULE_ALIAS_NFT_EXPR("ct");
MODULE_ALIAS_NFT_EXPR("notrack");
MODULE_ALIAS_NFT_OBJ(NFT_OBJECT_CT_HELPER);