Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 1 | /* |
Patrick McHardy | ce6eb0d | 2014-03-04 16:21:51 +0100 | [diff] [blame] | 2 | * Copyright (c) 2008-2014 Patrick McHardy <kaber@trash.net> |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 3 | * |
| 4 | * This program is free software; you can redistribute it and/or modify |
| 5 | * it under the terms of the GNU General Public License version 2 as |
| 6 | * published by the Free Software Foundation. |
| 7 | * |
| 8 | * Development of this code funded by Astaro AG (http://www.astaro.com/) |
| 9 | */ |
| 10 | |
| 11 | #include <linux/kernel.h> |
| 12 | #include <linux/init.h> |
| 13 | #include <linux/module.h> |
| 14 | #include <linux/list.h> |
Patrick McHardy | c50b960 | 2014-03-28 10:19:47 +0000 | [diff] [blame] | 15 | #include <linux/log2.h> |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 16 | #include <linux/jhash.h> |
| 17 | #include <linux/netlink.h> |
Thomas Graf | cfe4a9d | 2014-08-02 11:47:46 +0200 | [diff] [blame] | 18 | #include <linux/rhashtable.h> |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 19 | #include <linux/netfilter.h> |
| 20 | #include <linux/netfilter/nf_tables.h> |
| 21 | #include <net/netfilter/nf_tables.h> |
| 22 | |
/*
 * Default element-count hint handed to rhashtable when the set description
 * does not specify a size: 3 elements, i.e. 75% of a targeted table size
 * of 4.
 */
#define NFT_HASH_ELEMENT_HINT 3
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 25 | |
| 26 | struct nft_hash_elem { |
Thomas Graf | cfe4a9d | 2014-08-02 11:47:46 +0200 | [diff] [blame] | 27 | struct rhash_head node; |
Patrick McHardy | ce6eb0d | 2014-03-04 16:21:51 +0100 | [diff] [blame] | 28 | struct nft_data key; |
| 29 | struct nft_data data[]; |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 30 | }; |
| 31 | |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 32 | static bool nft_hash_lookup(const struct nft_set *set, |
| 33 | const struct nft_data *key, |
| 34 | struct nft_data *data) |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 35 | { |
Thomas Graf | 97defe1 | 2015-01-02 23:00:20 +0100 | [diff] [blame] | 36 | struct rhashtable *priv = nft_set_priv(set); |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 37 | const struct nft_hash_elem *he; |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 38 | |
Thomas Graf | cfe4a9d | 2014-08-02 11:47:46 +0200 | [diff] [blame] | 39 | he = rhashtable_lookup(priv, key); |
| 40 | if (he && set->flags & NFT_SET_MAP) |
| 41 | nft_data_copy(data, he->data); |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 42 | |
Thomas Graf | cfe4a9d | 2014-08-02 11:47:46 +0200 | [diff] [blame] | 43 | return !!he; |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 44 | } |
| 45 | |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 46 | static int nft_hash_insert(const struct nft_set *set, |
| 47 | const struct nft_set_elem *elem) |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 48 | { |
Thomas Graf | cfe4a9d | 2014-08-02 11:47:46 +0200 | [diff] [blame] | 49 | struct rhashtable *priv = nft_set_priv(set); |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 50 | struct nft_hash_elem *he; |
Thomas Graf | cfe4a9d | 2014-08-02 11:47:46 +0200 | [diff] [blame] | 51 | unsigned int size; |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 52 | |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 53 | if (elem->flags != 0) |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 54 | return -EINVAL; |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 55 | |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 56 | size = sizeof(*he); |
| 57 | if (set->flags & NFT_SET_MAP) |
| 58 | size += sizeof(he->data[0]); |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 59 | |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 60 | he = kzalloc(size, GFP_KERNEL); |
| 61 | if (he == NULL) |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 62 | return -ENOMEM; |
| 63 | |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 64 | nft_data_copy(&he->key, &elem->key); |
| 65 | if (set->flags & NFT_SET_MAP) |
| 66 | nft_data_copy(he->data, &elem->data); |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 67 | |
Thomas Graf | 6eba822 | 2014-11-13 13:45:46 +0100 | [diff] [blame] | 68 | rhashtable_insert(priv, &he->node); |
Patrick McHardy | ce6eb0d | 2014-03-04 16:21:51 +0100 | [diff] [blame] | 69 | |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 70 | return 0; |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 71 | } |
| 72 | |
Patrick McHardy | ce6eb0d | 2014-03-04 16:21:51 +0100 | [diff] [blame] | 73 | static void nft_hash_elem_destroy(const struct nft_set *set, |
| 74 | struct nft_hash_elem *he) |
| 75 | { |
| 76 | nft_data_uninit(&he->key, NFT_DATA_VALUE); |
| 77 | if (set->flags & NFT_SET_MAP) |
| 78 | nft_data_uninit(he->data, set->dtype); |
| 79 | kfree(he); |
| 80 | } |
| 81 | |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 82 | static void nft_hash_remove(const struct nft_set *set, |
| 83 | const struct nft_set_elem *elem) |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 84 | { |
Thomas Graf | cfe4a9d | 2014-08-02 11:47:46 +0200 | [diff] [blame] | 85 | struct rhashtable *priv = nft_set_priv(set); |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 86 | |
Thomas Graf | 897362e | 2015-01-02 23:00:18 +0100 | [diff] [blame] | 87 | rhashtable_remove(priv, elem->cookie); |
Patrick McHardy | ce6eb0d | 2014-03-04 16:21:51 +0100 | [diff] [blame] | 88 | synchronize_rcu(); |
Thomas Graf | 897362e | 2015-01-02 23:00:18 +0100 | [diff] [blame] | 89 | kfree(elem->cookie); |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 90 | } |
| 91 | |
/*
 * Context handed to nft_hash_compare() through the opaque argument of
 * rhashtable_lookup_compare().
 */
struct nft_compare_arg {
	/* set being searched; supplies klen and flags */
	const struct nft_set		*set;
	/* in: key to match; out: cookie, flags and (for maps) data */
	struct nft_set_elem		*elem;
};
| 96 | |
| 97 | static bool nft_hash_compare(void *ptr, void *arg) |
| 98 | { |
| 99 | struct nft_hash_elem *he = ptr; |
| 100 | struct nft_compare_arg *x = arg; |
| 101 | |
| 102 | if (!nft_data_cmp(&he->key, &x->elem->key, x->set->klen)) { |
Thomas Graf | 897362e | 2015-01-02 23:00:18 +0100 | [diff] [blame] | 103 | x->elem->cookie = he; |
Thomas Graf | 8d24c0b | 2015-01-02 23:00:14 +0100 | [diff] [blame] | 104 | x->elem->flags = 0; |
| 105 | if (x->set->flags & NFT_SET_MAP) |
| 106 | nft_data_copy(&x->elem->data, he->data); |
| 107 | |
| 108 | return true; |
| 109 | } |
| 110 | |
| 111 | return false; |
| 112 | } |
| 113 | |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 114 | static int nft_hash_get(const struct nft_set *set, struct nft_set_elem *elem) |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 115 | { |
Thomas Graf | 97defe1 | 2015-01-02 23:00:20 +0100 | [diff] [blame] | 116 | struct rhashtable *priv = nft_set_priv(set); |
Thomas Graf | 8d24c0b | 2015-01-02 23:00:14 +0100 | [diff] [blame] | 117 | struct nft_compare_arg arg = { |
| 118 | .set = set, |
| 119 | .elem = elem, |
| 120 | }; |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 121 | |
Thomas Graf | 8d24c0b | 2015-01-02 23:00:14 +0100 | [diff] [blame] | 122 | if (rhashtable_lookup_compare(priv, &elem->key, |
| 123 | &nft_hash_compare, &arg)) |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 124 | return 0; |
Thomas Graf | 8d24c0b | 2015-01-02 23:00:14 +0100 | [diff] [blame] | 125 | |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 126 | return -ENOENT; |
| 127 | } |
| 128 | |
| 129 | static void nft_hash_walk(const struct nft_ctx *ctx, const struct nft_set *set, |
| 130 | struct nft_set_iter *iter) |
| 131 | { |
Thomas Graf | 97defe1 | 2015-01-02 23:00:20 +0100 | [diff] [blame] | 132 | struct rhashtable *priv = nft_set_priv(set); |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 133 | const struct nft_hash_elem *he; |
Herbert Xu | 9a77662 | 2015-02-04 07:33:25 +1100 | [diff] [blame] | 134 | struct rhashtable_iter hti; |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 135 | struct nft_set_elem elem; |
Herbert Xu | 9a77662 | 2015-02-04 07:33:25 +1100 | [diff] [blame] | 136 | int err; |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 137 | |
Herbert Xu | 9a77662 | 2015-02-04 07:33:25 +1100 | [diff] [blame] | 138 | err = rhashtable_walk_init(priv, &hti); |
| 139 | iter->err = err; |
| 140 | if (err) |
| 141 | return; |
Thomas Graf | 88d6ed1 | 2015-01-02 23:00:16 +0100 | [diff] [blame] | 142 | |
Herbert Xu | 9a77662 | 2015-02-04 07:33:25 +1100 | [diff] [blame] | 143 | err = rhashtable_walk_start(&hti); |
| 144 | if (err && err != -EAGAIN) { |
| 145 | iter->err = err; |
| 146 | goto out; |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 147 | } |
Herbert Xu | 9a77662 | 2015-02-04 07:33:25 +1100 | [diff] [blame] | 148 | |
| 149 | while ((he = rhashtable_walk_next(&hti))) { |
| 150 | if (IS_ERR(he)) { |
| 151 | err = PTR_ERR(he); |
| 152 | if (err != -EAGAIN) { |
| 153 | iter->err = err; |
| 154 | goto out; |
| 155 | } |
| 156 | } |
| 157 | |
| 158 | if (iter->count < iter->skip) |
| 159 | goto cont; |
| 160 | |
| 161 | memcpy(&elem.key, &he->key, sizeof(elem.key)); |
| 162 | if (set->flags & NFT_SET_MAP) |
| 163 | memcpy(&elem.data, he->data, sizeof(elem.data)); |
| 164 | elem.flags = 0; |
| 165 | |
| 166 | iter->err = iter->fn(ctx, set, iter, &elem); |
| 167 | if (iter->err < 0) |
| 168 | goto out; |
| 169 | |
| 170 | cont: |
| 171 | iter->count++; |
| 172 | } |
| 173 | |
| 174 | out: |
| 175 | rhashtable_walk_stop(&hti); |
| 176 | rhashtable_walk_exit(&hti); |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 177 | } |
| 178 | |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 179 | static unsigned int nft_hash_privsize(const struct nlattr * const nla[]) |
| 180 | { |
Thomas Graf | cfe4a9d | 2014-08-02 11:47:46 +0200 | [diff] [blame] | 181 | return sizeof(struct rhashtable); |
| 182 | } |
| 183 | |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 184 | static int nft_hash_init(const struct nft_set *set, |
Patrick McHardy | c50b960 | 2014-03-28 10:19:47 +0000 | [diff] [blame] | 185 | const struct nft_set_desc *desc, |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 186 | const struct nlattr * const tb[]) |
| 187 | { |
Thomas Graf | cfe4a9d | 2014-08-02 11:47:46 +0200 | [diff] [blame] | 188 | struct rhashtable *priv = nft_set_priv(set); |
| 189 | struct rhashtable_params params = { |
| 190 | .nelem_hint = desc->size ? : NFT_HASH_ELEMENT_HINT, |
| 191 | .head_offset = offsetof(struct nft_hash_elem, node), |
| 192 | .key_offset = offsetof(struct nft_hash_elem, key), |
| 193 | .key_len = set->klen, |
| 194 | .hashfn = jhash, |
Thomas Graf | cfe4a9d | 2014-08-02 11:47:46 +0200 | [diff] [blame] | 195 | }; |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 196 | |
Thomas Graf | cfe4a9d | 2014-08-02 11:47:46 +0200 | [diff] [blame] | 197 | return rhashtable_init(priv, ¶ms); |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 198 | } |
| 199 | |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 200 | static void nft_hash_destroy(const struct nft_set *set) |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 201 | { |
Thomas Graf | 97defe1 | 2015-01-02 23:00:20 +0100 | [diff] [blame] | 202 | struct rhashtable *priv = nft_set_priv(set); |
| 203 | const struct bucket_table *tbl; |
Thomas Graf | 88d6ed1 | 2015-01-02 23:00:16 +0100 | [diff] [blame] | 204 | struct nft_hash_elem *he; |
| 205 | struct rhash_head *pos, *next; |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 206 | unsigned int i; |
| 207 | |
Thomas Graf | 97defe1 | 2015-01-02 23:00:20 +0100 | [diff] [blame] | 208 | /* Stop an eventual async resizing */ |
| 209 | priv->being_destroyed = true; |
| 210 | mutex_lock(&priv->mutex); |
| 211 | |
| 212 | tbl = rht_dereference(priv->tbl, priv); |
Pablo Neira Ayuso | 39f3901 | 2014-09-01 11:09:35 +0200 | [diff] [blame] | 213 | for (i = 0; i < tbl->size; i++) { |
Thomas Graf | 88d6ed1 | 2015-01-02 23:00:16 +0100 | [diff] [blame] | 214 | rht_for_each_entry_safe(he, pos, next, tbl, i, node) |
Patrick McHardy | ce6eb0d | 2014-03-04 16:21:51 +0100 | [diff] [blame] | 215 | nft_hash_elem_destroy(set, he); |
Pablo Neira Ayuso | 39f3901 | 2014-09-01 11:09:35 +0200 | [diff] [blame] | 216 | } |
Thomas Graf | 97defe1 | 2015-01-02 23:00:20 +0100 | [diff] [blame] | 217 | mutex_unlock(&priv->mutex); |
| 218 | |
Thomas Graf | cfe4a9d | 2014-08-02 11:47:46 +0200 | [diff] [blame] | 219 | rhashtable_destroy(priv); |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 220 | } |
| 221 | |
Patrick McHardy | c50b960 | 2014-03-28 10:19:47 +0000 | [diff] [blame] | 222 | static bool nft_hash_estimate(const struct nft_set_desc *desc, u32 features, |
| 223 | struct nft_set_estimate *est) |
| 224 | { |
| 225 | unsigned int esize; |
| 226 | |
| 227 | esize = sizeof(struct nft_hash_elem); |
| 228 | if (features & NFT_SET_MAP) |
| 229 | esize += FIELD_SIZEOF(struct nft_hash_elem, data[0]); |
| 230 | |
| 231 | if (desc->size) { |
Thomas Graf | cfe4a9d | 2014-08-02 11:47:46 +0200 | [diff] [blame] | 232 | est->size = sizeof(struct rhashtable) + |
| 233 | roundup_pow_of_two(desc->size * 4 / 3) * |
Patrick McHardy | c50b960 | 2014-03-28 10:19:47 +0000 | [diff] [blame] | 234 | sizeof(struct nft_hash_elem *) + |
| 235 | desc->size * esize; |
| 236 | } else { |
| 237 | /* Resizing happens when the load drops below 30% or goes |
| 238 | * above 75%. The average of 52.5% load (approximated by 50%) |
| 239 | * is used for the size estimation of the hash buckets, |
| 240 | * meaning we calculate two buckets per element. |
| 241 | */ |
| 242 | est->size = esize + 2 * sizeof(struct nft_hash_elem *); |
| 243 | } |
| 244 | |
| 245 | est->class = NFT_SET_CLASS_O_1; |
| 246 | |
| 247 | return true; |
| 248 | } |
| 249 | |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 250 | static struct nft_set_ops nft_hash_ops __read_mostly = { |
| 251 | .privsize = nft_hash_privsize, |
Patrick McHardy | c50b960 | 2014-03-28 10:19:47 +0000 | [diff] [blame] | 252 | .estimate = nft_hash_estimate, |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 253 | .init = nft_hash_init, |
| 254 | .destroy = nft_hash_destroy, |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 255 | .get = nft_hash_get, |
| 256 | .insert = nft_hash_insert, |
| 257 | .remove = nft_hash_remove, |
| 258 | .lookup = nft_hash_lookup, |
| 259 | .walk = nft_hash_walk, |
| 260 | .features = NFT_SET_MAP, |
| 261 | .owner = THIS_MODULE, |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 262 | }; |
| 263 | |
| 264 | static int __init nft_hash_module_init(void) |
| 265 | { |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 266 | return nft_register_set(&nft_hash_ops); |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 267 | } |
| 268 | |
| 269 | static void __exit nft_hash_module_exit(void) |
| 270 | { |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 271 | nft_unregister_set(&nft_hash_ops); |
Patrick McHardy | 9651851 | 2013-10-14 11:00:02 +0200 | [diff] [blame] | 272 | } |
| 273 | |
| 274 | module_init(nft_hash_module_init); |
| 275 | module_exit(nft_hash_module_exit); |
| 276 | |
| 277 | MODULE_LICENSE("GPL"); |
| 278 | MODULE_AUTHOR("Patrick McHardy <kaber@trash.net>"); |
Patrick McHardy | 20a6934 | 2013-10-11 12:06:22 +0200 | [diff] [blame] | 279 | MODULE_ALIAS_NFT_SET(); |