blob: 6d45e6f6ff4c950cb0fa4acaccd26baa6f38777a [file] [log] [blame]
/*
 * Low Latency Sockets
 * Copyright(c) 2013 Intel Corporation.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Author: Eliezer Tamir
 *
 * Contact Information:
 * e1000-devel Mailing List <e1000-devel@lists.sourceforge.net>
 */
23
Eliezer Tamir06021292013-06-10 11:39:50 +030024#ifndef _LINUX_NET_LL_POLL_H
25#define _LINUX_NET_LL_POLL_H
26
27#include <linux/netdevice.h>
28#include <net/ip.h>
29
30#ifdef CONFIG_NET_LL_RX_POLL
31
32struct napi_struct;
Eliezer Tamir2d48d672013-06-24 10:28:03 +030033extern unsigned int sysctl_net_ll_read __read_mostly;
Eliezer Tamireb6db622013-06-14 16:33:25 +030034extern unsigned int sysctl_net_ll_poll __read_mostly;
Eliezer Tamir06021292013-06-10 11:39:50 +030035
/*
 * Negative status codes returned by a driver's ndo_ll_poll.
 * sk_poll_ll() treats LL_FLUSH_FAILED as a permanent failure and stops
 * polling when it sees it.
 */
#define LL_FLUSH_FAILED		(-1)
#define LL_FLUSH_BUSY		(-2)
39
Eliezer Tamirad6276e2013-06-28 15:59:26 +030040/* a wrapper to make debug_smp_processor_id() happy
41 * we can use sched_clock() because we don't care much about precision
Eliezer Tamir9a3c71a2013-06-14 16:33:35 +030042 * we only care that the average is bounded
Eliezer Tamirad6276e2013-06-28 15:59:26 +030043 */
44#ifdef CONFIG_DEBUG_PREEMPT
45static inline u64 ll_sched_clock(void)
46{
47 u64 rc;
48
49 preempt_disable_notrace();
50 rc = sched_clock();
51 preempt_enable_no_resched_notrace();
52
53 return rc;
54}
55#else /* CONFIG_DEBUG_PREEMPT */
56static inline u64 ll_sched_clock(void)
57{
58 return sched_clock();
59}
60#endif /* CONFIG_DEBUG_PREEMPT */
61
62/* we don't mind a ~2.5% imprecision so <<10 instead of *1000
Eliezer Tamir2d48d672013-06-24 10:28:03 +030063 * sk->sk_ll_usec is a u_int so this can't overflow
Eliezer Tamir9a3c71a2013-06-14 16:33:35 +030064 */
Eliezer Tamir2d48d672013-06-24 10:28:03 +030065static inline u64 ll_sk_end_time(struct sock *sk)
Eliezer Tamir06021292013-06-10 11:39:50 +030066{
Eliezer Tamirad6276e2013-06-28 15:59:26 +030067 return ((u64)ACCESS_ONCE(sk->sk_ll_usec) << 10) + ll_sched_clock();
Eliezer Tamir2d48d672013-06-24 10:28:03 +030068}
Eliezer Tamir9a3c71a2013-06-14 16:33:35 +030069
Eliezer Tamir2d48d672013-06-24 10:28:03 +030070/* in poll/select we use the global sysctl_net_ll_poll value */
71static inline u64 ll_end_time(void)
72{
Eliezer Tamirad6276e2013-06-28 15:59:26 +030073 return ((u64)ACCESS_ONCE(sysctl_net_ll_poll) << 10) + ll_sched_clock();
Eliezer Tamir06021292013-06-10 11:39:50 +030074}
75
76static inline bool sk_valid_ll(struct sock *sk)
77{
Eliezer Tamirdafcc432013-06-14 16:33:57 +030078 return sk->sk_ll_usec && sk->sk_napi_id &&
Eliezer Tamir06021292013-06-10 11:39:50 +030079 !need_resched() && !signal_pending(current);
80}
81
Eliezer Tamir9a3c71a2013-06-14 16:33:35 +030082static inline bool can_poll_ll(u64 end_time)
Eliezer Tamir06021292013-06-10 11:39:50 +030083{
Eliezer Tamirad6276e2013-06-28 15:59:26 +030084 return !time_after64(ll_sched_clock(), end_time);
Eliezer Tamir06021292013-06-10 11:39:50 +030085}
86
Eliezer Tamir2d48d672013-06-24 10:28:03 +030087/* when used in sock_poll() nonblock is known at compile time to be true
88 * so the loop and end_time will be optimized out
89 */
Eliezer Tamir06021292013-06-10 11:39:50 +030090static inline bool sk_poll_ll(struct sock *sk, int nonblock)
91{
Eliezer Tamir2d48d672013-06-24 10:28:03 +030092 u64 end_time = nonblock ? 0 : ll_sk_end_time(sk);
Eliezer Tamir06021292013-06-10 11:39:50 +030093 const struct net_device_ops *ops;
94 struct napi_struct *napi;
95 int rc = false;
96
97 /*
98 * rcu read lock for napi hash
99 * bh so we don't race with net_rx_action
100 */
101 rcu_read_lock_bh();
102
103 napi = napi_by_id(sk->sk_napi_id);
104 if (!napi)
105 goto out;
106
107 ops = napi->dev->netdev_ops;
108 if (!ops->ndo_ll_poll)
109 goto out;
110
111 do {
Eliezer Tamir06021292013-06-10 11:39:50 +0300112 rc = ops->ndo_ll_poll(napi);
113
114 if (rc == LL_FLUSH_FAILED)
115 break; /* permanent failure */
116
117 if (rc > 0)
118 /* local bh are disabled so it is ok to use _BH */
119 NET_ADD_STATS_BH(sock_net(sk),
120 LINUX_MIB_LOWLATENCYRXPACKETS, rc);
121
Eliezer Tamir2d48d672013-06-24 10:28:03 +0300122 } while (!nonblock && skb_queue_empty(&sk->sk_receive_queue) &&
123 can_poll_ll(end_time));
Eliezer Tamir06021292013-06-10 11:39:50 +0300124
125 rc = !skb_queue_empty(&sk->sk_receive_queue);
126out:
127 rcu_read_unlock_bh();
128 return rc;
129}
130
131/* used in the NIC receive handler to mark the skb */
132static inline void skb_mark_ll(struct sk_buff *skb, struct napi_struct *napi)
133{
134 skb->napi_id = napi->napi_id;
135}
136
137/* used in the protocol hanlder to propagate the napi_id to the socket */
138static inline void sk_mark_ll(struct sock *sk, struct sk_buff *skb)
139{
140 sk->sk_napi_id = skb->napi_id;
141}
142
143#else /* CONFIG_NET_LL_RX_POLL */
144
Eliezer Tamir2d48d672013-06-24 10:28:03 +0300145static inline u64 sk_ll_end_time(struct sock *sk)
146{
147 return 0;
148}
149
150static inline u64 ll_end_time(void)
Eliezer Tamir06021292013-06-10 11:39:50 +0300151{
152 return 0;
153}
154
/*
 * Stub for builds without CONFIG_NET_LL_RX_POLL: no socket is ever
 * eligible for busy polling.
 */
static inline bool sk_valid_ll(struct sock *sk)
{
	return false;
}
159
/*
 * Stub for builds without CONFIG_NET_LL_RX_POLL: nothing is polled and
 * false is returned regardless of nonblock.
 */
static inline bool sk_poll_ll(struct sock *sk, int nonblock)
{
	return false;
}
164
/*
 * Stub for builds without CONFIG_NET_LL_RX_POLL: the skb is left
 * untouched.
 */
static inline void skb_mark_ll(struct sk_buff *skb, struct napi_struct *napi)
{
}
168
/*
 * Stub for builds without CONFIG_NET_LL_RX_POLL: the socket is left
 * untouched.
 */
static inline void sk_mark_ll(struct sock *sk, struct sk_buff *skb)
{
}
172
Eliezer Tamir9a3c71a2013-06-14 16:33:35 +0300173static inline bool can_poll_ll(u64 end_time)
Eliezer Tamir06021292013-06-10 11:39:50 +0300174{
175 return false;
176}
177
178#endif /* CONFIG_NET_LL_RX_POLL */
179#endif /* _LINUX_NET_LL_POLL_H */