Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 1 | /* |
Raju Subramanian | caf2ee1 | 2012-05-03 18:55:23 -0700 | [diff] [blame] | 2 | * Copyright (c) 2007-2012 Nicira, Inc. |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 3 | * |
| 4 | * This program is free software; you can redistribute it and/or |
| 5 | * modify it under the terms of version 2 of the GNU General Public |
| 6 | * License as published by the Free Software Foundation. |
| 7 | * |
| 8 | * This program is distributed in the hope that it will be useful, but |
| 9 | * WITHOUT ANY WARRANTY; without even the implied warranty of |
| 10 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| 11 | * General Public License for more details. |
| 12 | * |
| 13 | * You should have received a copy of the GNU General Public License |
| 14 | * along with this program; if not, write to the Free Software |
| 15 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA |
| 16 | * 02110-1301, USA |
| 17 | */ |
| 18 | |
| 19 | #ifndef VPORT_H |
| 20 | #define VPORT_H 1 |
| 21 | |
Pravin B Shelar | e0f0ecf | 2013-04-15 13:30:37 -0700 | [diff] [blame] | 22 | #include <linux/if_tunnel.h> |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 23 | #include <linux/list.h> |
Pravin B Shelar | 46df7b8 | 2012-02-22 19:58:59 -0800 | [diff] [blame] | 24 | #include <linux/netlink.h> |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 25 | #include <linux/openvswitch.h> |
Alex Wang | 5cd667b | 2014-07-17 15:14:13 -0700 | [diff] [blame] | 26 | #include <linux/reciprocal_div.h> |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 27 | #include <linux/skbuff.h> |
| 28 | #include <linux/spinlock.h> |
| 29 | #include <linux/u64_stats_sync.h> |
Thomas Graf | 3093fbe | 2015-07-21 10:44:00 +0200 | [diff] [blame] | 30 | #include <net/route.h> |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 31 | |
| 32 | #include "datapath.h" |
| 33 | |
| 34 | struct vport; |
| 35 | struct vport_parms; |
| 36 | |
| 37 | /* The following definitions are for users of the vport subsystem: */ |
| 38 | |
Pravin B Shelar | aa31070 | 2013-06-17 17:50:33 -0700 | [diff] [blame] | 39 | struct vport_net { |
| 40 | struct vport __rcu *gre_vport; |
| 41 | }; |
| 42 | |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 43 | int ovs_vport_init(void); |
| 44 | void ovs_vport_exit(void); |
| 45 | |
| 46 | struct vport *ovs_vport_add(const struct vport_parms *); |
| 47 | void ovs_vport_del(struct vport *); |
| 48 | |
Thomas Graf | 12eb18f | 2014-11-06 06:58:52 -0800 | [diff] [blame] | 49 | struct vport *ovs_vport_locate(const struct net *net, const char *name); |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 50 | |
| 51 | void ovs_vport_get_stats(struct vport *, struct ovs_vport_stats *); |
| 52 | |
| 53 | int ovs_vport_set_options(struct vport *, struct nlattr *options); |
| 54 | int ovs_vport_get_options(const struct vport *, struct sk_buff *); |
| 55 | |
Thomas Graf | 12eb18f | 2014-11-06 06:58:52 -0800 | [diff] [blame] | 56 | int ovs_vport_set_upcall_portids(struct vport *, const struct nlattr *pids); |
Alex Wang | 5cd667b | 2014-07-17 15:14:13 -0700 | [diff] [blame] | 57 | int ovs_vport_get_upcall_portids(const struct vport *, struct sk_buff *); |
| 58 | u32 ovs_vport_find_upcall_portid(const struct vport *, struct sk_buff *); |
| 59 | |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 60 | int ovs_vport_send(struct vport *, struct sk_buff *); |
| 61 | |
Thomas Graf | 1d8fff9 | 2015-07-21 10:43:54 +0200 | [diff] [blame] | 62 | int ovs_tunnel_get_egress_info(struct ip_tunnel_info *egress_tun_info, |
Wenyu Zhang | 8f0aad6 | 2014-11-06 06:51:24 -0800 | [diff] [blame] | 63 | struct net *net, |
Thomas Graf | 1d8fff9 | 2015-07-21 10:43:54 +0200 | [diff] [blame] | 64 | const struct ip_tunnel_info *tun_info, |
Wenyu Zhang | 8f0aad6 | 2014-11-06 06:51:24 -0800 | [diff] [blame] | 65 | u8 ipproto, |
| 66 | u32 skb_mark, |
| 67 | __be16 tp_src, |
| 68 | __be16 tp_dst); |
| 69 | int ovs_vport_get_egress_tun_info(struct vport *vport, struct sk_buff *skb, |
Thomas Graf | 1d8fff9 | 2015-07-21 10:43:54 +0200 | [diff] [blame] | 70 | struct ip_tunnel_info *info); |
Wenyu Zhang | 8f0aad6 | 2014-11-06 06:51:24 -0800 | [diff] [blame] | 71 | |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 72 | /* The following definitions are for implementers of vport devices: */ |
| 73 | |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 74 | struct vport_err_stats { |
Li RongQing | e403ade | 2014-09-06 19:06:11 +0800 | [diff] [blame] | 75 | atomic_long_t rx_dropped; |
| 76 | atomic_long_t rx_errors; |
| 77 | atomic_long_t tx_dropped; |
| 78 | atomic_long_t tx_errors; |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 79 | }; |
Alex Wang | 5cd667b | 2014-07-17 15:14:13 -0700 | [diff] [blame] | 80 | /** |
| 81 | * struct vport_portids - array of netlink portids of a vport. |
| 82 | * must be protected by rcu. |
| 83 | * @rn_ids: The reciprocal value of @n_ids. |
| 84 | * @rcu: RCU callback head for deferred destruction. |
| 85 | * @n_ids: Size of @ids array. |
| 86 | * @ids: Array storing the Netlink socket pids to be used for packets received |
| 87 | * on this port that miss the flow table. |
| 88 | */ |
| 89 | struct vport_portids { |
| 90 | struct reciprocal_value rn_ids; |
| 91 | struct rcu_head rcu; |
| 92 | u32 n_ids; |
| 93 | u32 ids[]; |
| 94 | }; |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 95 | |
| 96 | /** |
| 97 | * struct vport - one port within a datapath |
| 98 | * @rcu: RCU callback head for deferred destruction. |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 99 | * @dp: Datapath to which this port belongs. |
Alex Wang | 5cd667b | 2014-07-17 15:14:13 -0700 | [diff] [blame] | 100 | * @upcall_portids: RCU protected 'struct vport_portids'. |
Thomas Graf | 03599c9 | 2012-12-03 22:24:32 +0000 | [diff] [blame] | 101 | * @port_no: Index into @dp's @ports array. |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 102 | * @hash_node: Element in @dev_table hash table in vport.c. |
Pravin B Shelar | 15eac2a | 2012-08-23 12:40:54 -0700 | [diff] [blame] | 103 | * @dp_hash_node: Element in @datapath->ports hash table in datapath.c. |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 104 | * @ops: Class structure. |
| 105 | * @percpu_stats: Points to per-CPU statistics used and maintained by vport |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 106 | * @err_stats: Points to error statistics used and maintained by vport |
Pravin B Shelar | 7b4577a | 2015-02-17 11:23:10 -0800 | [diff] [blame] | 107 | * @detach_list: list used for detaching vport in net-exit call. |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 108 | */ |
| 109 | struct vport { |
Thomas Graf | be4ace6 | 2015-07-21 10:44:04 +0200 | [diff] [blame] | 110 | struct net_device *dev; |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 111 | struct datapath *dp; |
Alex Wang | 5cd667b | 2014-07-17 15:14:13 -0700 | [diff] [blame] | 112 | struct vport_portids __rcu *upcall_portids; |
Thomas Graf | 03599c9 | 2012-12-03 22:24:32 +0000 | [diff] [blame] | 113 | u16 port_no; |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 114 | |
| 115 | struct hlist_node hash_node; |
Pravin B Shelar | 15eac2a | 2012-08-23 12:40:54 -0700 | [diff] [blame] | 116 | struct hlist_node dp_hash_node; |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 117 | const struct vport_ops *ops; |
| 118 | |
Li RongQing | 8f84985 | 2014-01-04 13:57:59 +0800 | [diff] [blame] | 119 | struct pcpu_sw_netstats __percpu *percpu_stats; |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 120 | |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 121 | struct vport_err_stats err_stats; |
Pravin B Shelar | 7b4577a | 2015-02-17 11:23:10 -0800 | [diff] [blame] | 122 | struct list_head detach_list; |
Thomas Graf | be4ace6 | 2015-07-21 10:44:04 +0200 | [diff] [blame] | 123 | struct rcu_head rcu; |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 124 | }; |
| 125 | |
| 126 | /** |
| 127 | * struct vport_parms - parameters for creating a new vport |
| 128 | * |
| 129 | * @name: New vport's name. |
| 130 | * @type: New vport's type. |
| 131 | * @options: %OVS_VPORT_ATTR_OPTIONS attribute from Netlink message, %NULL if |
| 132 | * none was supplied. |
| 133 | * @dp: New vport's datapath. |
| 134 | * @port_no: New vport's port number. |
| 135 | */ |
| 136 | struct vport_parms { |
| 137 | const char *name; |
| 138 | enum ovs_vport_type type; |
| 139 | struct nlattr *options; |
| 140 | |
| 141 | /* For ovs_vport_alloc(). */ |
| 142 | struct datapath *dp; |
| 143 | u16 port_no; |
Alex Wang | 5cd667b | 2014-07-17 15:14:13 -0700 | [diff] [blame] | 144 | struct nlattr *upcall_portids; |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 145 | }; |
| 146 | |
| 147 | /** |
| 148 | * struct vport_ops - definition of a type of virtual port |
| 149 | * |
| 150 | * @type: %OVS_VPORT_TYPE_* value for this type of virtual port. |
| 151 | * @create: Create a new vport configured as specified. On success returns |
| 152 | * a new vport allocated with ovs_vport_alloc(), otherwise an ERR_PTR() value. |
| 153 | * @destroy: Destroys a vport. Must call vport_free() on the vport but not |
| 154 | * before an RCU grace period has elapsed. |
| 155 | * @set_options: Modify the configuration of an existing vport. May be %NULL |
| 156 | * if modification is not supported. |
| 157 | * @get_options: Appends vport-specific attributes for the configuration of an |
| 158 | * existing vport to a &struct sk_buff. May be %NULL for a vport that does not |
| 159 | * have any configuration. |
| 160 | * @get_name: Get the device's name. |
Pravin B Shelar | 91b7514 | 2013-05-13 08:22:34 -0700 | [diff] [blame] | 161 | * @send: Send a packet on the device. Returns the length of the packet sent, |
| 162 | * zero for dropped packets or negative for error. |
Wenyu Zhang | 8f0aad6 | 2014-11-06 06:51:24 -0800 | [diff] [blame] | 163 | * @get_egress_tun_info: Get the egress tunnel 5-tuple and other info for |
| 164 | * a packet. |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 165 | */ |
| 166 | struct vport_ops { |
| 167 | enum ovs_vport_type type; |
| 168 | |
Pravin B Shelar | 8e4e171 | 2013-04-15 13:23:03 -0700 | [diff] [blame] | 169 | /* Called with ovs_mutex. */ |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 170 | struct vport *(*create)(const struct vport_parms *); |
| 171 | void (*destroy)(struct vport *); |
| 172 | |
| 173 | int (*set_options)(struct vport *, struct nlattr *); |
| 174 | int (*get_options)(const struct vport *, struct sk_buff *); |
| 175 | |
Pravin B Shelar | 8e4e171 | 2013-04-15 13:23:03 -0700 | [diff] [blame] | 176 | /* Called with rcu_read_lock or ovs_mutex. */ |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 177 | const char *(*get_name)(const struct vport *); |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 178 | |
| 179 | int (*send)(struct vport *, struct sk_buff *); |
Wenyu Zhang | 8f0aad6 | 2014-11-06 06:51:24 -0800 | [diff] [blame] | 180 | int (*get_egress_tun_info)(struct vport *, struct sk_buff *, |
Thomas Graf | 1d8fff9 | 2015-07-21 10:43:54 +0200 | [diff] [blame] | 181 | struct ip_tunnel_info *); |
Thomas Graf | 62b9c8d | 2014-10-22 17:29:06 +0200 | [diff] [blame] | 182 | |
| 183 | struct module *owner; |
| 184 | struct list_head list; |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 185 | }; |
| 186 | |
/*
 * Error categories of a vport.  The enumerators are consecutive, starting at
 * zero, and correspond one-to-one to the counters in struct vport_err_stats.
 */
enum vport_err_type {
	VPORT_E_RX_DROPPED,	/* see vport_err_stats.rx_dropped */
	VPORT_E_RX_ERROR,	/* see vport_err_stats.rx_errors */
	VPORT_E_TX_DROPPED,	/* see vport_err_stats.tx_dropped */
	VPORT_E_TX_ERROR,	/* see vport_err_stats.tx_errors */
};
| 193 | |
/* Prototypes only; these functions are defined outside this header. */
struct vport *ovs_vport_alloc(int priv_size, const struct vport_ops *ops,
			      const struct vport_parms *parms);
void ovs_vport_free(struct vport *vport);
void ovs_vport_deferred_free(struct vport *vport);

/*
 * Alignment, in bytes, to which sizeof(struct vport) is rounded up in order
 * to find the start of a vport's private data area; see vport_priv() and
 * vport_from_priv().
 */
#define VPORT_ALIGN 8
| 200 | |
| 201 | /** |
| 202 | * vport_priv - access private data area of vport |
| 203 | * |
| 204 | * @vport: vport to access |
| 205 | * |
| 206 | * If a nonzero size was passed in priv_size of vport_alloc() a private data |
| 207 | * area was allocated on creation. This allows that area to be accessed and |
| 208 | * used for any purpose needed by the vport implementer. |
| 209 | */ |
| 210 | static inline void *vport_priv(const struct vport *vport) |
| 211 | { |
Daniele Di Proietto | 07dc060 | 2014-02-03 14:08:29 -0800 | [diff] [blame] | 212 | return (u8 *)(uintptr_t)vport + ALIGN(sizeof(struct vport), VPORT_ALIGN); |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 213 | } |
| 214 | |
| 215 | /** |
| 216 | * vport_from_priv - lookup vport from private data pointer |
| 217 | * |
| 218 | * @priv: Start of private data area. |
| 219 | * |
| 220 | * It is sometimes useful to translate from a pointer to the private data |
| 221 | * area to the vport, such as in the case where the private data pointer is |
| 222 | * the result of a hash table lookup. @priv must point to the start of the |
| 223 | * private data area. |
| 224 | */ |
Daniele Di Proietto | d0b4da1 | 2014-02-03 14:07:43 -0800 | [diff] [blame] | 225 | static inline struct vport *vport_from_priv(void *priv) |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 226 | { |
Daniele Di Proietto | d0b4da1 | 2014-02-03 14:07:43 -0800 | [diff] [blame] | 227 | return (struct vport *)((u8 *)priv - ALIGN(sizeof(struct vport), VPORT_ALIGN)); |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 228 | } |
| 229 | |
/* Prototype only; the function is defined outside this header. */
void ovs_vport_receive(struct vport *vport, struct sk_buff *skb,
		       const struct ip_tunnel_info *tun_info);
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 232 | |
Pravin B Shelar | b34df5e | 2013-06-13 11:11:44 -0700 | [diff] [blame] | 233 | static inline void ovs_skb_postpush_rcsum(struct sk_buff *skb, |
| 234 | const void *start, unsigned int len) |
| 235 | { |
| 236 | if (skb->ip_summed == CHECKSUM_COMPLETE) |
| 237 | skb->csum = csum_add(skb->csum, csum_partial(start, len, 0)); |
| 238 | } |
| 239 | |
Thomas Graf | c9db965 | 2015-07-21 10:44:05 +0200 | [diff] [blame] | 240 | static inline const char *ovs_vport_name(struct vport *vport) |
| 241 | { |
| 242 | return vport->dev ? vport->dev->name : vport->ops->get_name(vport); |
| 243 | } |
| 244 | |
/*
 * Registration hooks for a vport type described by @ops; defined outside this
 * header.  NOTE(review): presumably these add/remove @ops to/from the set of
 * known vport types via ops->list -- confirm in vport.c.
 */
int ovs_vport_ops_register(struct vport_ops *ops);
void ovs_vport_ops_unregister(struct vport_ops *ops);
| 247 | |
Fan Du | 3f4c1d8 | 2015-01-14 13:10:35 +0800 | [diff] [blame] | 248 | static inline struct rtable *ovs_tunnel_route_lookup(struct net *net, |
Thomas Graf | 1d8fff9 | 2015-07-21 10:43:54 +0200 | [diff] [blame] | 249 | const struct ip_tunnel_key *key, |
Fan Du | 3f4c1d8 | 2015-01-14 13:10:35 +0800 | [diff] [blame] | 250 | u32 mark, |
| 251 | struct flowi4 *fl, |
| 252 | u8 protocol) |
| 253 | { |
| 254 | struct rtable *rt; |
| 255 | |
| 256 | memset(fl, 0, sizeof(*fl)); |
Jiri Benc | c1ea5d6 | 2015-08-20 13:56:23 +0200 | [diff] [blame^] | 257 | fl->daddr = key->u.ipv4.dst; |
| 258 | fl->saddr = key->u.ipv4.src; |
Fan Du | 3f4c1d8 | 2015-01-14 13:10:35 +0800 | [diff] [blame] | 259 | fl->flowi4_tos = RT_TOS(key->ipv4_tos); |
| 260 | fl->flowi4_mark = mark; |
| 261 | fl->flowi4_proto = protocol; |
| 262 | |
| 263 | rt = ip_route_output_key(net, fl); |
| 264 | return rt; |
| 265 | } |
Jesse Gross | ccb1352 | 2011-10-25 19:26:31 -0700 | [diff] [blame] | 266 | #endif /* vport.h */ |