blob: f14dd88dafc87569fed73b835015ae5546f670e5 [file] [log] [blame]
/*
 * Low Latency Sockets
 * Copyright(c) 2013 Intel Corporation.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Author: Eliezer Tamir
 *
 * Contact Information:
 * e1000-devel Mailing List <e1000-devel@lists.sourceforge.net>
 */
23
Eliezer Tamir06021292013-06-10 11:39:50 +030024#ifndef _LINUX_NET_LL_POLL_H
25#define _LINUX_NET_LL_POLL_H
26
27#include <linux/netdevice.h>
28#include <net/ip.h>
29
30#ifdef CONFIG_NET_LL_RX_POLL
31
32struct napi_struct;
Eliezer Tamir2d48d672013-06-24 10:28:03 +030033extern unsigned int sysctl_net_ll_read __read_mostly;
Eliezer Tamireb6db622013-06-14 16:33:25 +030034extern unsigned int sysctl_net_ll_poll __read_mostly;
Eliezer Tamir06021292013-06-10 11:39:50 +030035
/*
 * return values from ndo_ll_poll
 * (parenthesized so the negative constants expand safely in any expression)
 */
#define LL_FLUSH_FAILED		(-1)
#define LL_FLUSH_BUSY		(-2)
39
Eliezer Tamircbf55002013-07-08 16:20:34 +030040static inline bool net_busy_loop_on(void)
Eliezer Tamir91e2fd332013-06-28 15:59:35 +030041{
Eliezer Tamircbf55002013-07-08 16:20:34 +030042 return sysctl_net_ll_poll;
Eliezer Tamir91e2fd332013-06-28 15:59:35 +030043}
44
Eliezer Tamirad6276e2013-06-28 15:59:26 +030045/* a wrapper to make debug_smp_processor_id() happy
46 * we can use sched_clock() because we don't care much about precision
Eliezer Tamir9a3c71a2013-06-14 16:33:35 +030047 * we only care that the average is bounded
Eliezer Tamirad6276e2013-06-28 15:59:26 +030048 */
49#ifdef CONFIG_DEBUG_PREEMPT
Eliezer Tamircbf55002013-07-08 16:20:34 +030050static inline u64 busy_loop_sched_clock(void)
Eliezer Tamirad6276e2013-06-28 15:59:26 +030051{
52 u64 rc;
53
54 preempt_disable_notrace();
55 rc = sched_clock();
56 preempt_enable_no_resched_notrace();
57
58 return rc;
59}
60#else /* CONFIG_DEBUG_PREEMPT */
Eliezer Tamircbf55002013-07-08 16:20:34 +030061static inline u64 busy_loop_sched_clock(void)
Eliezer Tamirad6276e2013-06-28 15:59:26 +030062{
63 return sched_clock();
64}
65#endif /* CONFIG_DEBUG_PREEMPT */
66
67/* we don't mind a ~2.5% imprecision so <<10 instead of *1000
Eliezer Tamir2d48d672013-06-24 10:28:03 +030068 * sk->sk_ll_usec is a u_int so this can't overflow
Eliezer Tamir9a3c71a2013-06-14 16:33:35 +030069 */
Eliezer Tamircbf55002013-07-08 16:20:34 +030070static inline u64 sk_busy_loop_end_time(struct sock *sk)
Eliezer Tamir06021292013-06-10 11:39:50 +030071{
Eliezer Tamir1bc27742013-07-02 23:22:47 +030072 return (u64)ACCESS_ONCE(sk->sk_ll_usec) << 10;
Eliezer Tamir2d48d672013-06-24 10:28:03 +030073}
Eliezer Tamir9a3c71a2013-06-14 16:33:35 +030074
Eliezer Tamir91e2fd332013-06-28 15:59:35 +030075/* in poll/select we use the global sysctl_net_ll_poll value
76 * only call sched_clock() if enabled
77 */
Eliezer Tamircbf55002013-07-08 16:20:34 +030078static inline u64 busy_loop_end_time(void)
Eliezer Tamir2d48d672013-06-24 10:28:03 +030079{
Eliezer Tamir1bc27742013-07-02 23:22:47 +030080 return (u64)ACCESS_ONCE(sysctl_net_ll_poll) << 10;
81}
Eliezer Tamir91e2fd332013-06-28 15:59:35 +030082
Eliezer Tamircbf55002013-07-08 16:20:34 +030083/* if flag is not set we don't need to know the time
84 * so we want to avoid a potentially expensive sched_clock()
85 */
86static inline u64 busy_loop_start_time(unsigned int flag)
Eliezer Tamir1bc27742013-07-02 23:22:47 +030087{
Eliezer Tamircbf55002013-07-08 16:20:34 +030088 return flag ? busy_loop_sched_clock() : 0;
Eliezer Tamir06021292013-06-10 11:39:50 +030089}
90
Eliezer Tamircbf55002013-07-08 16:20:34 +030091static inline bool sk_can_busy_loop(struct sock *sk)
Eliezer Tamir06021292013-06-10 11:39:50 +030092{
Eliezer Tamirdafcc432013-06-14 16:33:57 +030093 return sk->sk_ll_usec && sk->sk_napi_id &&
Eliezer Tamir06021292013-06-10 11:39:50 +030094 !need_resched() && !signal_pending(current);
95}
96
Eliezer Tamir1bc27742013-07-02 23:22:47 +030097/* careful! time_in_range64 will evaluate now twice */
Eliezer Tamircbf55002013-07-08 16:20:34 +030098static inline bool busy_loop_range(u64 start_time, u64 run_time)
Eliezer Tamir06021292013-06-10 11:39:50 +030099{
Eliezer Tamircbf55002013-07-08 16:20:34 +0300100 u64 now = busy_loop_sched_clock();
Eliezer Tamir1bc27742013-07-02 23:22:47 +0300101
102 return time_in_range64(now, start_time, start_time + run_time);
Eliezer Tamir06021292013-06-10 11:39:50 +0300103}
104
Eliezer Tamir2d48d672013-06-24 10:28:03 +0300105/* when used in sock_poll() nonblock is known at compile time to be true
106 * so the loop and end_time will be optimized out
107 */
Eliezer Tamircbf55002013-07-08 16:20:34 +0300108static inline bool sk_busy_loop(struct sock *sk, int nonblock)
Eliezer Tamir06021292013-06-10 11:39:50 +0300109{
Eliezer Tamircbf55002013-07-08 16:20:34 +0300110 u64 start_time = busy_loop_start_time(!nonblock);
111 u64 end_time = sk_busy_loop_end_time(sk);
Eliezer Tamir06021292013-06-10 11:39:50 +0300112 const struct net_device_ops *ops;
113 struct napi_struct *napi;
114 int rc = false;
115
116 /*
117 * rcu read lock for napi hash
118 * bh so we don't race with net_rx_action
119 */
120 rcu_read_lock_bh();
121
122 napi = napi_by_id(sk->sk_napi_id);
123 if (!napi)
124 goto out;
125
126 ops = napi->dev->netdev_ops;
127 if (!ops->ndo_ll_poll)
128 goto out;
129
130 do {
Eliezer Tamir06021292013-06-10 11:39:50 +0300131 rc = ops->ndo_ll_poll(napi);
132
133 if (rc == LL_FLUSH_FAILED)
134 break; /* permanent failure */
135
136 if (rc > 0)
137 /* local bh are disabled so it is ok to use _BH */
138 NET_ADD_STATS_BH(sock_net(sk),
139 LINUX_MIB_LOWLATENCYRXPACKETS, rc);
140
Eliezer Tamir2d48d672013-06-24 10:28:03 +0300141 } while (!nonblock && skb_queue_empty(&sk->sk_receive_queue) &&
Eliezer Tamircbf55002013-07-08 16:20:34 +0300142 busy_loop_range(start_time, end_time));
Eliezer Tamir06021292013-06-10 11:39:50 +0300143
144 rc = !skb_queue_empty(&sk->sk_receive_queue);
145out:
146 rcu_read_unlock_bh();
147 return rc;
148}
149
150/* used in the NIC receive handler to mark the skb */
151static inline void skb_mark_ll(struct sk_buff *skb, struct napi_struct *napi)
152{
153 skb->napi_id = napi->napi_id;
154}
155
156/* used in the protocol hanlder to propagate the napi_id to the socket */
157static inline void sk_mark_ll(struct sock *sk, struct sk_buff *skb)
158{
159 sk->sk_napi_id = skb->napi_id;
160}
161
162#else /* CONFIG_NET_LL_RX_POLL */
/*
 * Stub for builds without CONFIG_NET_LL_RX_POLL: busy polling is never on.
 * Returns bool, matching the signature used when the option is enabled.
 */
static inline bool net_busy_loop_on(void)
{
	return false;
}
Eliezer Tamir06021292013-06-10 11:39:50 +0300167
Eliezer Tamircbf55002013-07-08 16:20:34 +0300168static inline u64 busy_loop_start_time(unsigned int flag)
Eliezer Tamir2d48d672013-06-24 10:28:03 +0300169{
170 return 0;
171}
172
Eliezer Tamircbf55002013-07-08 16:20:34 +0300173static inline u64 busy_loop_end_time(void)
Eliezer Tamir06021292013-06-10 11:39:50 +0300174{
175 return 0;
176}
177
/*
 * Stub for builds without CONFIG_NET_LL_RX_POLL: no socket can busy loop.
 * @sk is not examined.
 */
static inline bool sk_can_busy_loop(struct sock *sk)
{
	return false;
}
182
/*
 * Stub for builds without CONFIG_NET_LL_RX_POLL: nothing is polled and no
 * data is reported. The name and signature match the sk_busy_loop()
 * provided when the option is enabled, so callers build either way.
 */
static inline bool sk_busy_loop(struct sock *sk, int nonblock)
{
	return false;
}

/*
 * Earlier name of the disabled-config stub, kept so any existing user of
 * it still builds. New code should call sk_busy_loop().
 */
static inline bool sk_busy_poll(struct sock *sk, int nonblock)
{
	return false;
}
187
/*
 * Stub for builds without CONFIG_NET_LL_RX_POLL: the skb is left untouched.
 */
static inline void skb_mark_ll(struct sk_buff *skb, struct napi_struct *napi)
{
}
191
/*
 * Stub for builds without CONFIG_NET_LL_RX_POLL: the socket is left
 * untouched.
 */
static inline void sk_mark_ll(struct sock *sk, struct sk_buff *skb)
{
}
195
Eliezer Tamircbf55002013-07-08 16:20:34 +0300196static inline bool busy_loop_range(u64 start_time, u64 run_time)
Eliezer Tamir06021292013-06-10 11:39:50 +0300197{
198 return false;
199}
200
201#endif /* CONFIG_NET_LL_RX_POLL */
202#endif /* _LINUX_NET_LL_POLL_H */