blob: 7d44cb1884dc63ab28ccd8c2de29e92bb3b6a29e [file] [log] [blame]
Craig Tillerc67cc992017-04-27 10:15:51 -07001/*
2 *
Jan Tattermusch7897ae92017-06-07 22:57:36 +02003 * Copyright 2017 gRPC authors.
Craig Tillerc67cc992017-04-27 10:15:51 -07004 *
Jan Tattermusch7897ae92017-06-07 22:57:36 +02005 * Licensed under the Apache License, Version 2.0 (the "License");
6 * you may not use this file except in compliance with the License.
7 * You may obtain a copy of the License at
Craig Tillerc67cc992017-04-27 10:15:51 -07008 *
Jan Tattermusch7897ae92017-06-07 22:57:36 +02009 * http://www.apache.org/licenses/LICENSE-2.0
Craig Tillerc67cc992017-04-27 10:15:51 -070010 *
Jan Tattermusch7897ae92017-06-07 22:57:36 +020011 * Unless required by applicable law or agreed to in writing, software
12 * distributed under the License is distributed on an "AS IS" BASIS,
13 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14 * See the License for the specific language governing permissions and
15 * limitations under the License.
Craig Tillerc67cc992017-04-27 10:15:51 -070016 *
17 */
18
19#include "src/core/lib/iomgr/port.h"
20
21/* This polling engine is only relevant on linux kernels supporting epoll() */
22#ifdef GRPC_LINUX_EPOLL
23
Craig Tiller4509c472017-04-27 19:05:13 +000024#include "src/core/lib/iomgr/ev_epoll1_linux.h"
Craig Tillerc67cc992017-04-27 10:15:51 -070025
26#include <assert.h>
27#include <errno.h>
28#include <poll.h>
29#include <pthread.h>
30#include <string.h>
31#include <sys/epoll.h>
32#include <sys/socket.h>
33#include <unistd.h>
34
35#include <grpc/support/alloc.h>
Craig Tiller6de05932017-04-28 09:17:38 -070036#include <grpc/support/cpu.h>
Craig Tillerc67cc992017-04-27 10:15:51 -070037#include <grpc/support/log.h>
38#include <grpc/support/string_util.h>
39#include <grpc/support/tls.h>
40#include <grpc/support/useful.h>
41
42#include "src/core/lib/iomgr/ev_posix.h"
43#include "src/core/lib/iomgr/iomgr_internal.h"
44#include "src/core/lib/iomgr/lockfree_event.h"
Craig Tillerc67cc992017-04-27 10:15:51 -070045#include "src/core/lib/iomgr/wakeup_fd_posix.h"
Craig Tillerc67cc992017-04-27 10:15:51 -070046#include "src/core/lib/profiling/timers.h"
47#include "src/core/lib/support/block_annotate.h"
Craig Tillerb89bac02017-05-26 15:20:32 +000048#include "src/core/lib/support/string.h"
Craig Tillerc67cc992017-04-27 10:15:51 -070049
/* Wakeup descriptor that pollset_global_init() registers in the epoll set;
 * pollset_kick_all() signals it to kick the designated poller and
 * pollset_epoll() consumes the wakeup when it shows up in epoll_wait(). */
Craig Tillerc67cc992017-04-27 10:15:51 -070050static grpc_wakeup_fd global_wakeup_fd;
/* The epoll descriptor that fd_create() adds fds to and pollset_epoll() waits
 * on. It is not created in the visible part of this file. */
51static int g_epfd;
52
53/*******************************************************************************
54 * Fd Declarations
55 */
56
/* Per-descriptor state tracked by this polling engine. Instances are recycled
 * through fd_freelist (see fd_create / fd_orphan) instead of being freed. */
57struct grpc_fd {
/* The wrapped OS file descriptor. */
58 int fd;
59
/* Event state manipulated through the grpc_lfev_* helpers: one atom for read
 * readiness and one for write readiness. */
Craig Tillerc67cc992017-04-27 10:15:51 -070060 gpr_atm read_closure;
61 gpr_atm write_closure;
62
/* Next entry while this object is parked on fd_freelist. */
63 struct grpc_fd *freelist_next;
Craig Tillerc67cc992017-04-27 10:15:51 -070064
65 /* The pollset that last noticed that the fd is readable. The actual type
66 * stored in this is (grpc_pollset *) */
67 gpr_atm read_notifier_pollset;
68
/* Handle passed to grpc_iomgr_register_object / grpc_iomgr_unregister_object. */
69 grpc_iomgr_object iomgr_object;
70};
71
/* Set up / tear down the global grpc_fd freelist (defined further below). */
72static void fd_global_init(void);
73static void fd_global_shutdown(void);
74
75/*******************************************************************************
76 * Pollset Declarations
77 */
78
/* State of a pollset worker:
 *   UNKICKED          - initial state assigned by begin_worker()
 *   KICKED            - the worker was kicked (or its wait timed out) and must
 *                       not poll
 *   DESIGNATED_POLLER - the worker won the CAS on g_active_poller */
Craig Tiller43bf2592017-04-28 23:21:01 +000079typedef enum { UNKICKED, KICKED, DESIGNATED_POLLER } kick_state;
Craig Tillerc67cc992017-04-27 10:15:51 -070080
Craig Tiller830e82a2017-05-31 16:26:27 -070081static const char *kick_state_string(kick_state st) {
82 switch (st) {
83 case UNKICKED:
84 return "UNKICKED";
85 case KICKED:
86 return "KICKED";
87 case DESIGNATED_POLLER:
88 return "DESIGNATED_POLLER";
89 }
90 GPR_UNREACHABLE_CODE(return "UNKNOWN");
91}
92
/* One thread's participation in a pollset. Workers of a pollset form a
 * circular doubly-linked list rooted at grpc_pollset.root_worker. */
Craig Tillerc67cc992017-04-27 10:15:51 -070093struct grpc_pollset_worker {
Craig Tiller32f90ee2017-04-28 12:46:41 -070094 kick_state kick_state;
Craig Tiller55624a32017-05-26 08:14:44 -070095 int kick_state_mutator; // which line of code last changed kick state
/* True once 'cv' has been initialised by begin_worker(); code that signals
 * the worker checks this before touching 'cv'. */
Craig Tillerc67cc992017-04-27 10:15:51 -070096 bool initialized_cv;
/* Neighbours in the pollset's circular worker list. */
Craig Tiller32f90ee2017-04-28 12:46:41 -070097 grpc_pollset_worker *next;
98 grpc_pollset_worker *prev;
/* Condition variable a non-polling worker waits on (with the pollset mutex). */
Craig Tillerc67cc992017-04-27 10:15:51 -070099 gpr_cv cv;
/* Closure list reset in begin_worker(); its consumer is outside the visible
 * part of this file. */
Craig Tiller50da5ec2017-05-01 13:51:14 -0700100 grpc_closure_list schedule_on_end_work;
Craig Tillerc67cc992017-04-27 10:15:51 -0700101};
102
/* Assign a new kick_state to 'worker' and record the source line that did it
 * in kick_state_mutator (debugging aid). */
Craig Tiller55624a32017-05-26 08:14:44 -0700103#define SET_KICK_STATE(worker, state) \
104 do { \
105 (worker)->kick_state = (state); \
106 (worker)->kick_state_mutator = __LINE__; \
107 } while (false)
108
/* Upper bound on g_num_neighbourhoods; pollset_global_init() clamps the core
 * count to [1, MAX_NEIGHBOURHOODS]. */
Craig Tillerba550da2017-05-01 14:26:31 +0000109#define MAX_NEIGHBOURHOODS 1024
110
/* A group of active pollsets sharing one lock. */
Craig Tiller6de05932017-04-28 09:17:38 -0700111typedef struct pollset_neighbourhood {
/* Guards active_root and the next/prev links of the pollsets on the list. */
112 gpr_mu mu;
/* Head of the circular list of active pollsets, or NULL when empty. */
113 grpc_pollset *active_root;
/* NOTE(review): presumably padding so neighbourhoods do not share a cache
 * line - confirm. */
Craig Tiller6de05932017-04-28 09:17:38 -0700114 char pad[GPR_CACHELINE_SIZE];
115} pollset_neighbourhood;
116
/* A set of workers that poll together. */
Craig Tillerc67cc992017-04-27 10:15:51 -0700117struct grpc_pollset {
/* Pollset lock; handed back to the caller by pollset_init(). */
Craig Tiller6de05932017-04-28 09:17:38 -0700118 gpr_mu mu;
/* Neighbourhood this pollset is (or will be) listed in. */
119 pollset_neighbourhood *neighbourhood;
/* True while a begin_worker() call is moving the pollset to a freshly chosen
 * neighbourhood. */
Craig Tillere00d7332017-05-01 15:43:51 +0000120 bool reassigning_neighbourhood;
/* Head of the circular worker list, or NULL when there are no workers. */
Craig Tiller4509c472017-04-27 19:05:13 +0000121 grpc_pollset_worker *root_worker;
/* When set, the next begin_worker() clears it and returns false (no polling). */
122 bool kicked_without_poller;
Sree Kuchibhotla0d8431a2017-07-18 16:21:54 -0700123
124 /* Set to true if the pollset is observed to have no workers available to
125 * poll */
Craig Tiller6de05932017-04-28 09:17:38 -0700126 bool seen_inactive;
Sree Kuchibhotla0d8431a2017-07-18 16:21:54 -0700127 bool shutting_down; /* Is the pollset shutting down ? */
Craig Tiller4509c472017-04-27 19:05:13 +0000128 grpc_closure *shutdown_closure; /* Called after shutdown is complete */
Sree Kuchibhotla0d8431a2017-07-18 16:21:54 -0700129
130 /* Number of workers who are *about-to* attach themselves to the pollset
131 * worker list */
Craig Tillerba550da2017-05-01 14:26:31 +0000132 int begin_refs;
Craig Tiller6de05932017-04-28 09:17:38 -0700133
/* Links in the neighbourhood's circular list of active pollsets. */
134 grpc_pollset *next;
135 grpc_pollset *prev;
Craig Tillerc67cc992017-04-27 10:15:51 -0700136};
137
138/*******************************************************************************
139 * Pollset-set Declarations
140 */
Craig Tiller6de05932017-04-28 09:17:38 -0700141
/* Pollset-sets carry no state in this engine; the single member only keeps the
 * struct non-empty. */
Craig Tiller61f96c12017-05-12 13:36:39 -0700142struct grpc_pollset_set {
143 char unused;
144};
Craig Tillerc67cc992017-04-27 10:15:51 -0700145
146/*******************************************************************************
147 * Common helpers
148 */
149
150static bool append_error(grpc_error **composite, grpc_error *error,
151 const char *desc) {
152 if (error == GRPC_ERROR_NONE) return true;
153 if (*composite == GRPC_ERROR_NONE) {
154 *composite = GRPC_ERROR_CREATE_FROM_COPIED_STRING(desc);
155 }
156 *composite = grpc_error_add_child(*composite, error);
157 return false;
158}
159
160/*******************************************************************************
161 * Fd Definitions
162 */
163
164/* We need to keep a freelist not because of any concerns of malloc performance
165 * but instead so that implementations with multiple threads in (for example)
166 * epoll_wait deal with the race between pollset removal and incoming poll
167 * notifications.
168 *
169 * The problem is that the poller ultimately holds a reference to this
170 * object, so it is very difficult to know when it is safe to free it, at least
171 * without some expensive synchronization.
172 *
173 * If we keep the object freelisted, in the worst case losing this race just
174 * becomes a spurious read notification on a reused fd.
175 */
176
177/* The alarm system needs to be able to wakeup 'some poller' sometimes
178 * (specifically when a new alarm needs to be triggered earlier than the next
179 * alarm 'epoch'). This wakeup_fd gives us something to alert on when such a
180 * case occurs. */
181
/* Singly-linked (via freelist_next) stack of recycled grpc_fd objects, and the
 * mutex that guards it. */
182static grpc_fd *fd_freelist = NULL;
183static gpr_mu fd_freelist_mu;
184
Craig Tillerc67cc992017-04-27 10:15:51 -0700185static void fd_global_init(void) { gpr_mu_init(&fd_freelist_mu); }
186
187static void fd_global_shutdown(void) {
188 gpr_mu_lock(&fd_freelist_mu);
189 gpr_mu_unlock(&fd_freelist_mu);
190 while (fd_freelist != NULL) {
191 grpc_fd *fd = fd_freelist;
192 fd_freelist = fd_freelist->freelist_next;
Craig Tillerc67cc992017-04-27 10:15:51 -0700193 gpr_free(fd);
194 }
195 gpr_mu_destroy(&fd_freelist_mu);
196}
197
198static grpc_fd *fd_create(int fd, const char *name) {
199 grpc_fd *new_fd = NULL;
200
201 gpr_mu_lock(&fd_freelist_mu);
202 if (fd_freelist != NULL) {
203 new_fd = fd_freelist;
204 fd_freelist = fd_freelist->freelist_next;
205 }
206 gpr_mu_unlock(&fd_freelist_mu);
207
208 if (new_fd == NULL) {
209 new_fd = gpr_malloc(sizeof(grpc_fd));
Craig Tillerc67cc992017-04-27 10:15:51 -0700210 }
211
Craig Tillerc67cc992017-04-27 10:15:51 -0700212 new_fd->fd = fd;
Craig Tillerc67cc992017-04-27 10:15:51 -0700213 grpc_lfev_init(&new_fd->read_closure);
214 grpc_lfev_init(&new_fd->write_closure);
215 gpr_atm_no_barrier_store(&new_fd->read_notifier_pollset, (gpr_atm)NULL);
216
217 new_fd->freelist_next = NULL;
Craig Tillerc67cc992017-04-27 10:15:51 -0700218
219 char *fd_name;
220 gpr_asprintf(&fd_name, "%s fd=%d", name, fd);
221 grpc_iomgr_register_object(&new_fd->iomgr_object, fd_name);
Noah Eisen264879f2017-06-20 17:14:47 -0700222#ifndef NDEBUG
223 if (GRPC_TRACER_ON(grpc_trace_fd_refcount)) {
224 gpr_log(GPR_DEBUG, "FD %d %p create %s", fd, new_fd, fd_name);
225 }
Craig Tillerc67cc992017-04-27 10:15:51 -0700226#endif
227 gpr_free(fd_name);
Craig Tiller9ddb3152017-04-27 21:32:56 +0000228
229 struct epoll_event ev = {.events = (uint32_t)(EPOLLIN | EPOLLOUT | EPOLLET),
230 .data.ptr = new_fd};
231 if (epoll_ctl(g_epfd, EPOLL_CTL_ADD, fd, &ev) != 0) {
232 gpr_log(GPR_ERROR, "epoll_ctl failed: %s", strerror(errno));
233 }
234
Craig Tillerc67cc992017-04-27 10:15:51 -0700235 return new_fd;
236}
237
Craig Tiller4509c472017-04-27 19:05:13 +0000238static int fd_wrapped_fd(grpc_fd *fd) { return fd->fd; }
Craig Tillerc67cc992017-04-27 10:15:51 -0700239
Sree Kuchibhotlaf2641472017-08-02 23:46:40 -0700240/* if 'releasing_fd' is true, it means that we are going to detach the internal
241 * fd from grpc_fd structure (i.e which means we should not be calling
242 * shutdown() syscall on that fd) */
243static void fd_shutdown_internal(grpc_exec_ctx *exec_ctx, grpc_fd *fd,
244 grpc_error *why, bool releasing_fd) {
Craig Tiller9ddb3152017-04-27 21:32:56 +0000245 if (grpc_lfev_set_shutdown(exec_ctx, &fd->read_closure,
246 GRPC_ERROR_REF(why))) {
Sree Kuchibhotlaf2641472017-08-02 23:46:40 -0700247 if (!releasing_fd) {
248 shutdown(fd->fd, SHUT_RDWR);
249 }
Craig Tiller9ddb3152017-04-27 21:32:56 +0000250 grpc_lfev_set_shutdown(exec_ctx, &fd->write_closure, GRPC_ERROR_REF(why));
251 }
252 GRPC_ERROR_UNREF(why);
253}
254
Sree Kuchibhotlaf2641472017-08-02 23:46:40 -0700255/* Might be called multiple times */
256static void fd_shutdown(grpc_exec_ctx *exec_ctx, grpc_fd *fd, grpc_error *why) {
257 fd_shutdown_internal(exec_ctx, fd, why, false);
258}
259
Craig Tillerc67cc992017-04-27 10:15:51 -0700260static void fd_orphan(grpc_exec_ctx *exec_ctx, grpc_fd *fd,
261 grpc_closure *on_done, int *release_fd,
Yuchen Zengd40a7ae2017-07-12 15:59:56 -0700262 bool already_closed, const char *reason) {
Craig Tillerc67cc992017-04-27 10:15:51 -0700263 grpc_error *error = GRPC_ERROR_NONE;
Sree Kuchibhotlaf2641472017-08-02 23:46:40 -0700264 bool is_release_fd = (release_fd != NULL);
Craig Tillerc67cc992017-04-27 10:15:51 -0700265
Craig Tiller9ddb3152017-04-27 21:32:56 +0000266 if (!grpc_lfev_is_shutdown(&fd->read_closure)) {
Sree Kuchibhotlaf2641472017-08-02 23:46:40 -0700267 fd_shutdown_internal(exec_ctx, fd,
268 GRPC_ERROR_CREATE_FROM_COPIED_STRING(reason),
269 is_release_fd);
Craig Tiller9ddb3152017-04-27 21:32:56 +0000270 }
271
Craig Tillerc67cc992017-04-27 10:15:51 -0700272 /* If release_fd is not NULL, we should be relinquishing control of the file
273 descriptor fd->fd (but we still own the grpc_fd structure). */
Sree Kuchibhotlaf2641472017-08-02 23:46:40 -0700274 if (is_release_fd) {
Craig Tillerc67cc992017-04-27 10:15:51 -0700275 *release_fd = fd->fd;
Yuchen Zengd40a7ae2017-07-12 15:59:56 -0700276 } else if (!already_closed) {
Craig Tillerc67cc992017-04-27 10:15:51 -0700277 close(fd->fd);
Craig Tillerc67cc992017-04-27 10:15:51 -0700278 }
279
ncteisen274bbbe2017-06-08 14:57:11 -0700280 GRPC_CLOSURE_SCHED(exec_ctx, on_done, GRPC_ERROR_REF(error));
Craig Tillerc67cc992017-04-27 10:15:51 -0700281
Craig Tiller4509c472017-04-27 19:05:13 +0000282 grpc_iomgr_unregister_object(&fd->iomgr_object);
283 grpc_lfev_destroy(&fd->read_closure);
284 grpc_lfev_destroy(&fd->write_closure);
Craig Tillerc67cc992017-04-27 10:15:51 -0700285
Craig Tiller4509c472017-04-27 19:05:13 +0000286 gpr_mu_lock(&fd_freelist_mu);
287 fd->freelist_next = fd_freelist;
288 fd_freelist = fd;
289 gpr_mu_unlock(&fd_freelist_mu);
Craig Tillerc67cc992017-04-27 10:15:51 -0700290}
291
292static grpc_pollset *fd_get_read_notifier_pollset(grpc_exec_ctx *exec_ctx,
293 grpc_fd *fd) {
294 gpr_atm notifier = gpr_atm_acq_load(&fd->read_notifier_pollset);
295 return (grpc_pollset *)notifier;
296}
297
298static bool fd_is_shutdown(grpc_fd *fd) {
299 return grpc_lfev_is_shutdown(&fd->read_closure);
300}
301
Craig Tillerc67cc992017-04-27 10:15:51 -0700302static void fd_notify_on_read(grpc_exec_ctx *exec_ctx, grpc_fd *fd,
303 grpc_closure *closure) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700304 grpc_lfev_notify_on(exec_ctx, &fd->read_closure, closure, "read");
Craig Tillerc67cc992017-04-27 10:15:51 -0700305}
306
307static void fd_notify_on_write(grpc_exec_ctx *exec_ctx, grpc_fd *fd,
308 grpc_closure *closure) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700309 grpc_lfev_notify_on(exec_ctx, &fd->write_closure, closure, "write");
Craig Tillerc67cc992017-04-27 10:15:51 -0700310}
311
Craig Tiller4509c472017-04-27 19:05:13 +0000312static void fd_become_readable(grpc_exec_ctx *exec_ctx, grpc_fd *fd,
313 grpc_pollset *notifier) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700314 grpc_lfev_set_ready(exec_ctx, &fd->read_closure, "read");
Craig Tiller4509c472017-04-27 19:05:13 +0000315 /* Use release store to match with acquire load in fd_get_read_notifier */
316 gpr_atm_rel_store(&fd->read_notifier_pollset, (gpr_atm)notifier);
317}
318
319static void fd_become_writable(grpc_exec_ctx *exec_ctx, grpc_fd *fd) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700320 grpc_lfev_set_ready(exec_ctx, &fd->write_closure, "write");
Craig Tillerc67cc992017-04-27 10:15:51 -0700321}
322
323/*******************************************************************************
324 * Pollset Definitions
325 */
326
/* Thread-local slots initialised in pollset_global_init(); their readers and
 * writers are outside the visible part of this file. */
Craig Tiller6de05932017-04-28 09:17:38 -0700327GPR_TLS_DECL(g_current_thread_pollset);
328GPR_TLS_DECL(g_current_thread_worker);
/* The worker currently designated to poll, stored as a gpr_atm; 0 when there
 * is none. Claimed with a compare-and-swap from 0. */
329static gpr_atm g_active_poller;
/* Array of g_num_neighbourhoods neighbourhoods, allocated in
 * pollset_global_init(). */
330static pollset_neighbourhood *g_neighbourhoods;
Craig Tiller32f90ee2017-04-28 12:46:41 -0700331static size_t g_num_neighbourhoods;
Craig Tiller6de05932017-04-28 09:17:38 -0700332
Craig Tillerc67cc992017-04-27 10:15:51 -0700333/* Return true if first in list */
Craig Tiller32f90ee2017-04-28 12:46:41 -0700334static bool worker_insert(grpc_pollset *pollset, grpc_pollset_worker *worker) {
335 if (pollset->root_worker == NULL) {
336 pollset->root_worker = worker;
337 worker->next = worker->prev = worker;
Craig Tillerc67cc992017-04-27 10:15:51 -0700338 return true;
339 } else {
Craig Tiller32f90ee2017-04-28 12:46:41 -0700340 worker->next = pollset->root_worker;
341 worker->prev = worker->next->prev;
342 worker->next->prev = worker;
343 worker->prev->next = worker;
Craig Tillerc67cc992017-04-27 10:15:51 -0700344 return false;
345 }
346}
347
348/* Outcome of worker_remove(): EMPTIED - the removed worker was the only one,
 * so the list is now empty; NEW_ROOT - the removed worker was the root and its
 * successor took over; REMOVED - a non-root worker was unlinked. */
349typedef enum { EMPTIED, NEW_ROOT, REMOVED } worker_remove_result;
350
Craig Tiller32f90ee2017-04-28 12:46:41 -0700351static worker_remove_result worker_remove(grpc_pollset *pollset,
Craig Tillerc67cc992017-04-27 10:15:51 -0700352 grpc_pollset_worker *worker) {
Craig Tiller32f90ee2017-04-28 12:46:41 -0700353 if (worker == pollset->root_worker) {
354 if (worker == worker->next) {
355 pollset->root_worker = NULL;
Craig Tillerc67cc992017-04-27 10:15:51 -0700356 return EMPTIED;
357 } else {
Craig Tiller32f90ee2017-04-28 12:46:41 -0700358 pollset->root_worker = worker->next;
359 worker->prev->next = worker->next;
360 worker->next->prev = worker->prev;
Craig Tillerc67cc992017-04-27 10:15:51 -0700361 return NEW_ROOT;
362 }
363 } else {
Craig Tiller32f90ee2017-04-28 12:46:41 -0700364 worker->prev->next = worker->next;
365 worker->next->prev = worker->prev;
Craig Tillerc67cc992017-04-27 10:15:51 -0700366 return REMOVED;
367 }
368}
369
Craig Tillerba550da2017-05-01 14:26:31 +0000370static size_t choose_neighbourhood(void) {
371 return (size_t)gpr_cpu_current_cpu() % g_num_neighbourhoods;
372}
373
Craig Tiller4509c472017-04-27 19:05:13 +0000374static grpc_error *pollset_global_init(void) {
Craig Tiller4509c472017-04-27 19:05:13 +0000375 gpr_tls_init(&g_current_thread_pollset);
376 gpr_tls_init(&g_current_thread_worker);
Craig Tiller6de05932017-04-28 09:17:38 -0700377 gpr_atm_no_barrier_store(&g_active_poller, 0);
Craig Tiller375eb252017-04-27 23:29:12 +0000378 global_wakeup_fd.read_fd = -1;
379 grpc_error *err = grpc_wakeup_fd_init(&global_wakeup_fd);
380 if (err != GRPC_ERROR_NONE) return err;
Craig Tiller4509c472017-04-27 19:05:13 +0000381 struct epoll_event ev = {.events = (uint32_t)(EPOLLIN | EPOLLET),
382 .data.ptr = &global_wakeup_fd};
383 if (epoll_ctl(g_epfd, EPOLL_CTL_ADD, global_wakeup_fd.read_fd, &ev) != 0) {
384 return GRPC_OS_ERROR(errno, "epoll_ctl");
385 }
Craig Tillerba550da2017-05-01 14:26:31 +0000386 g_num_neighbourhoods = GPR_CLAMP(gpr_cpu_num_cores(), 1, MAX_NEIGHBOURHOODS);
Craig Tiller32f90ee2017-04-28 12:46:41 -0700387 g_neighbourhoods =
388 gpr_zalloc(sizeof(*g_neighbourhoods) * g_num_neighbourhoods);
389 for (size_t i = 0; i < g_num_neighbourhoods; i++) {
390 gpr_mu_init(&g_neighbourhoods[i].mu);
Craig Tiller32f90ee2017-04-28 12:46:41 -0700391 }
Craig Tiller4509c472017-04-27 19:05:13 +0000392 return GRPC_ERROR_NONE;
393}
394
395static void pollset_global_shutdown(void) {
Craig Tiller4509c472017-04-27 19:05:13 +0000396 gpr_tls_destroy(&g_current_thread_pollset);
397 gpr_tls_destroy(&g_current_thread_worker);
Craig Tiller375eb252017-04-27 23:29:12 +0000398 if (global_wakeup_fd.read_fd != -1) grpc_wakeup_fd_destroy(&global_wakeup_fd);
Craig Tiller32f90ee2017-04-28 12:46:41 -0700399 for (size_t i = 0; i < g_num_neighbourhoods; i++) {
400 gpr_mu_destroy(&g_neighbourhoods[i].mu);
401 }
402 gpr_free(g_neighbourhoods);
Craig Tiller4509c472017-04-27 19:05:13 +0000403}
404
405static void pollset_init(grpc_pollset *pollset, gpr_mu **mu) {
Craig Tiller6de05932017-04-28 09:17:38 -0700406 gpr_mu_init(&pollset->mu);
407 *mu = &pollset->mu;
Craig Tillerba550da2017-05-01 14:26:31 +0000408 pollset->neighbourhood = &g_neighbourhoods[choose_neighbourhood()];
Sree Kuchibhotla30882302017-08-16 13:46:52 -0700409 pollset->reassigning_neighbourhood = false;
410 pollset->root_worker = NULL;
411 pollset->kicked_without_poller = false;
Craig Tiller6de05932017-04-28 09:17:38 -0700412 pollset->seen_inactive = true;
Sree Kuchibhotla30882302017-08-16 13:46:52 -0700413 pollset->shutting_down = false;
414 pollset->shutdown_closure = NULL;
415 pollset->begin_refs = 0;
416 pollset->next = pollset->prev = NULL;
Craig Tiller6de05932017-04-28 09:17:38 -0700417}
418
Craig Tillerc6109852017-05-01 14:26:49 -0700419static void pollset_destroy(grpc_exec_ctx *exec_ctx, grpc_pollset *pollset) {
Craig Tillere00d7332017-05-01 15:43:51 +0000420 gpr_mu_lock(&pollset->mu);
Craig Tillerba550da2017-05-01 14:26:31 +0000421 if (!pollset->seen_inactive) {
Craig Tillere00d7332017-05-01 15:43:51 +0000422 pollset_neighbourhood *neighbourhood = pollset->neighbourhood;
423 gpr_mu_unlock(&pollset->mu);
Craig Tillera95bacf2017-05-01 12:51:24 -0700424 retry_lock_neighbourhood:
Craig Tillere00d7332017-05-01 15:43:51 +0000425 gpr_mu_lock(&neighbourhood->mu);
426 gpr_mu_lock(&pollset->mu);
427 if (!pollset->seen_inactive) {
428 if (pollset->neighbourhood != neighbourhood) {
429 gpr_mu_unlock(&neighbourhood->mu);
430 neighbourhood = pollset->neighbourhood;
431 gpr_mu_unlock(&pollset->mu);
432 goto retry_lock_neighbourhood;
433 }
434 pollset->prev->next = pollset->next;
435 pollset->next->prev = pollset->prev;
436 if (pollset == pollset->neighbourhood->active_root) {
437 pollset->neighbourhood->active_root =
438 pollset->next == pollset ? NULL : pollset->next;
439 }
Craig Tillerba550da2017-05-01 14:26:31 +0000440 }
441 gpr_mu_unlock(&pollset->neighbourhood->mu);
Craig Tiller6de05932017-04-28 09:17:38 -0700442 }
Craig Tillere00d7332017-05-01 15:43:51 +0000443 gpr_mu_unlock(&pollset->mu);
Craig Tiller32f90ee2017-04-28 12:46:41 -0700444 gpr_mu_destroy(&pollset->mu);
Craig Tiller4509c472017-04-27 19:05:13 +0000445}
446
447static grpc_error *pollset_kick_all(grpc_pollset *pollset) {
448 grpc_error *error = GRPC_ERROR_NONE;
449 if (pollset->root_worker != NULL) {
450 grpc_pollset_worker *worker = pollset->root_worker;
451 do {
Craig Tiller55624a32017-05-26 08:14:44 -0700452 switch (worker->kick_state) {
453 case KICKED:
454 break;
455 case UNKICKED:
456 SET_KICK_STATE(worker, KICKED);
457 if (worker->initialized_cv) {
458 gpr_cv_signal(&worker->cv);
459 }
460 break;
461 case DESIGNATED_POLLER:
462 SET_KICK_STATE(worker, KICKED);
463 append_error(&error, grpc_wakeup_fd_wakeup(&global_wakeup_fd),
Sree Kuchibhotla0d8431a2017-07-18 16:21:54 -0700464 "pollset_kick_all");
Craig Tiller55624a32017-05-26 08:14:44 -0700465 break;
Craig Tiller4509c472017-04-27 19:05:13 +0000466 }
467
Craig Tiller32f90ee2017-04-28 12:46:41 -0700468 worker = worker->next;
Craig Tiller4509c472017-04-27 19:05:13 +0000469 } while (worker != pollset->root_worker);
470 }
Sree Kuchibhotla0d8431a2017-07-18 16:21:54 -0700471 // TODO: sreek. Check if we need to set 'kicked_without_poller' to true here
472 // in the else case
473
Craig Tiller4509c472017-04-27 19:05:13 +0000474 return error;
475}
476
477static void pollset_maybe_finish_shutdown(grpc_exec_ctx *exec_ctx,
478 grpc_pollset *pollset) {
Craig Tillerba550da2017-05-01 14:26:31 +0000479 if (pollset->shutdown_closure != NULL && pollset->root_worker == NULL &&
480 pollset->begin_refs == 0) {
ncteisen274bbbe2017-06-08 14:57:11 -0700481 GRPC_CLOSURE_SCHED(exec_ctx, pollset->shutdown_closure, GRPC_ERROR_NONE);
Craig Tiller4509c472017-04-27 19:05:13 +0000482 pollset->shutdown_closure = NULL;
483 }
484}
485
486static void pollset_shutdown(grpc_exec_ctx *exec_ctx, grpc_pollset *pollset,
487 grpc_closure *closure) {
488 GPR_ASSERT(pollset->shutdown_closure == NULL);
Craig Tillerc81512a2017-05-26 09:53:58 -0700489 GPR_ASSERT(!pollset->shutting_down);
Craig Tiller4509c472017-04-27 19:05:13 +0000490 pollset->shutdown_closure = closure;
Craig Tillerc81512a2017-05-26 09:53:58 -0700491 pollset->shutting_down = true;
Craig Tiller4509c472017-04-27 19:05:13 +0000492 GRPC_LOG_IF_ERROR("pollset_shutdown", pollset_kick_all(pollset));
493 pollset_maybe_finish_shutdown(exec_ctx, pollset);
494}
495
/* Capacity of the event buffer handed to a single epoll_wait() call in
 * pollset_epoll(). */
Craig Tillera95bacf2017-05-01 12:51:24 -0700496#define MAX_EPOLL_EVENTS 100
Craig Tiller4509c472017-04-27 19:05:13 +0000497
498static int poll_deadline_to_millis_timeout(gpr_timespec deadline,
499 gpr_timespec now) {
500 gpr_timespec timeout;
501 if (gpr_time_cmp(deadline, gpr_inf_future(deadline.clock_type)) == 0) {
502 return -1;
503 }
504
505 if (gpr_time_cmp(deadline, now) <= 0) {
506 return 0;
507 }
508
509 static const gpr_timespec round_up = {
510 .clock_type = GPR_TIMESPAN, .tv_sec = 0, .tv_nsec = GPR_NS_PER_MS - 1};
511 timeout = gpr_time_sub(deadline, now);
512 int millis = gpr_time_to_millis(gpr_time_add(timeout, round_up));
513 return millis >= 1 ? millis : 1;
514}
515
516static grpc_error *pollset_epoll(grpc_exec_ctx *exec_ctx, grpc_pollset *pollset,
517 gpr_timespec now, gpr_timespec deadline) {
518 struct epoll_event events[MAX_EPOLL_EVENTS];
519 static const char *err_desc = "pollset_poll";
520
521 int timeout = poll_deadline_to_millis_timeout(deadline, now);
522
523 if (timeout != 0) {
524 GRPC_SCHEDULING_START_BLOCKING_REGION;
525 }
526 int r;
527 do {
528 r = epoll_wait(g_epfd, events, MAX_EPOLL_EVENTS, timeout);
529 } while (r < 0 && errno == EINTR);
530 if (timeout != 0) {
531 GRPC_SCHEDULING_END_BLOCKING_REGION;
532 }
533
534 if (r < 0) return GRPC_OS_ERROR(errno, "epoll_wait");
535
536 grpc_error *error = GRPC_ERROR_NONE;
537 for (int i = 0; i < r; i++) {
538 void *data_ptr = events[i].data.ptr;
539 if (data_ptr == &global_wakeup_fd) {
Craig Tiller4509c472017-04-27 19:05:13 +0000540 append_error(&error, grpc_wakeup_fd_consume_wakeup(&global_wakeup_fd),
541 err_desc);
542 } else {
543 grpc_fd *fd = (grpc_fd *)(data_ptr);
544 bool cancel = (events[i].events & (EPOLLERR | EPOLLHUP)) != 0;
545 bool read_ev = (events[i].events & (EPOLLIN | EPOLLPRI)) != 0;
546 bool write_ev = (events[i].events & EPOLLOUT) != 0;
547 if (read_ev || cancel) {
548 fd_become_readable(exec_ctx, fd, pollset);
549 }
550 if (write_ev || cancel) {
551 fd_become_writable(exec_ctx, fd);
552 }
553 }
554 }
555
556 return error;
557}
558
/* Attach 'worker' to 'pollset' and decide whether the calling thread should
 * poll.
 *
 * Must be entered with pollset->mu held; the lock is held again on return,
 * but is released temporarily while the pollset is moved onto a
 * neighbourhood's active list and while waiting on the worker's condition
 * variable.
 *
 *   worker_hdl - when non-NULL, receives 'worker'
 *   now        - refreshed with the current time after a condition-variable
 *                wait
 *   deadline   - absolute deadline for that wait
 *
 * Returns true only if the worker ended up as the DESIGNATED_POLLER, the
 * pollset is not shutting down and no 'kicked_without_poller' was pending. */
559static bool begin_worker(grpc_pollset *pollset, grpc_pollset_worker *worker,
560 grpc_pollset_worker **worker_hdl, gpr_timespec *now,
561 gpr_timespec deadline) {
Craig Tiller4509c472017-04-27 19:05:13 +0000562 if (worker_hdl != NULL) *worker_hdl = worker;
563 worker->initialized_cv = false;
Craig Tiller55624a32017-05-26 08:14:44 -0700564 SET_KICK_STATE(worker, UNKICKED);
Craig Tiller50da5ec2017-05-01 13:51:14 -0700565 worker->schedule_on_end_work = (grpc_closure_list)GRPC_CLOSURE_LIST_INIT;
/* Counted until the worker is actually linked in, so that
 * pollset_maybe_finish_shutdown() does not complete in between. */
Craig Tillerba550da2017-05-01 14:26:31 +0000566 pollset->begin_refs++;
Craig Tiller4509c472017-04-27 19:05:13 +0000567
Craig Tiller830e82a2017-05-31 16:26:27 -0700568 if (GRPC_TRACER_ON(grpc_polling_trace)) {
569 gpr_log(GPR_ERROR, "PS:%p BEGIN_STARTS:%p", pollset, worker);
570 }
571
Craig Tiller32f90ee2017-04-28 12:46:41 -0700572 if (pollset->seen_inactive) {
573 // pollset has been observed to be inactive, we need to move back to the
574 // active list
Craig Tillere00d7332017-05-01 15:43:51 +0000575 bool is_reassigning = false;
576 if (!pollset->reassigning_neighbourhood) {
577 is_reassigning = true;
578 pollset->reassigning_neighbourhood = true;
579 pollset->neighbourhood = &g_neighbourhoods[choose_neighbourhood()];
580 }
581 pollset_neighbourhood *neighbourhood = pollset->neighbourhood;
Craig Tiller32f90ee2017-04-28 12:46:41 -0700582 gpr_mu_unlock(&pollset->mu);
Craig Tillerba550da2017-05-01 14:26:31 +0000583 // pollset unlocked: state may change (even worker->kick_state)
584 retry_lock_neighbourhood:
/* Lock order: neighbourhood->mu first, then pollset->mu. */
Craig Tiller32f90ee2017-04-28 12:46:41 -0700585 gpr_mu_lock(&neighbourhood->mu);
586 gpr_mu_lock(&pollset->mu);
Craig Tiller830e82a2017-05-31 16:26:27 -0700587 if (GRPC_TRACER_ON(grpc_polling_trace)) {
588 gpr_log(GPR_ERROR, "PS:%p BEGIN_REORG:%p kick_state=%s is_reassigning=%d",
589 pollset, worker, kick_state_string(worker->kick_state),
590 is_reassigning);
591 }
Craig Tiller32f90ee2017-04-28 12:46:41 -0700592 if (pollset->seen_inactive) {
Craig Tiller2acab6e2017-04-30 23:06:33 +0000593 if (neighbourhood != pollset->neighbourhood) {
594 gpr_mu_unlock(&neighbourhood->mu);
595 neighbourhood = pollset->neighbourhood;
596 gpr_mu_unlock(&pollset->mu);
597 goto retry_lock_neighbourhood;
598 }
Craig Tiller32f90ee2017-04-28 12:46:41 -0700599 pollset->seen_inactive = false;
Craig Tiller2acab6e2017-04-30 23:06:33 +0000600 if (neighbourhood->active_root == NULL) {
601 neighbourhood->active_root = pollset->next = pollset->prev = pollset;
Sree Kuchibhotla0d8431a2017-07-18 16:21:54 -0700602 /* TODO: sreek. Why would this worker state be other than UNKICKED
603 * here ? (since the worker isn't added to the pollset yet, there is no
604 * way it can be "found" by other threads to get kicked). */
605
606 /* If there is no designated poller, make this the designated poller */
Craig Tiller55624a32017-05-26 08:14:44 -0700607 if (worker->kick_state == UNKICKED &&
608 gpr_atm_no_barrier_cas(&g_active_poller, 0, (gpr_atm)worker)) {
609 SET_KICK_STATE(worker, DESIGNATED_POLLER);
Craig Tiller32f90ee2017-04-28 12:46:41 -0700610 }
Craig Tiller2acab6e2017-04-30 23:06:33 +0000611 } else {
/* Splice the pollset in just before the current active root. */
612 pollset->next = neighbourhood->active_root;
613 pollset->prev = pollset->next->prev;
614 pollset->next->prev = pollset->prev->next = pollset;
Craig Tiller4509c472017-04-27 19:05:13 +0000615 }
616 }
Craig Tillere00d7332017-05-01 15:43:51 +0000617 if (is_reassigning) {
618 GPR_ASSERT(pollset->reassigning_neighbourhood);
619 pollset->reassigning_neighbourhood = false;
620 }
Craig Tiller32f90ee2017-04-28 12:46:41 -0700621 gpr_mu_unlock(&neighbourhood->mu);
622 }
Sree Kuchibhotlae6506bc2017-07-18 21:43:45 -0700623
Craig Tiller32f90ee2017-04-28 12:46:41 -0700624 worker_insert(pollset, worker);
Craig Tillerba550da2017-05-01 14:26:31 +0000625 pollset->begin_refs--;
Sree Kuchibhotla949d0752017-07-20 23:49:15 -0700626 if (worker->kick_state == UNKICKED && !pollset->kicked_without_poller) {
Craig Tillera4b8eb02017-04-29 00:13:52 +0000627 GPR_ASSERT(gpr_atm_no_barrier_load(&g_active_poller) != (gpr_atm)worker);
Craig Tiller32f90ee2017-04-28 12:46:41 -0700628 worker->initialized_cv = true;
629 gpr_cv_init(&worker->cv);
Craig Tillerc81512a2017-05-26 09:53:58 -0700630 while (worker->kick_state == UNKICKED && !pollset->shutting_down) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700631 if (GRPC_TRACER_ON(grpc_polling_trace)) {
632 gpr_log(GPR_ERROR, "PS:%p BEGIN_WAIT:%p kick_state=%s shutdown=%d",
633 pollset, worker, kick_state_string(worker->kick_state),
634 pollset->shutting_down);
635 }
Sree Kuchibhotla0d8431a2017-07-18 16:21:54 -0700636
Craig Tiller32f90ee2017-04-28 12:46:41 -0700637 if (gpr_cv_wait(&worker->cv, &pollset->mu, deadline) &&
638 worker->kick_state == UNKICKED) {
Sree Kuchibhotla0d8431a2017-07-18 16:21:54 -0700639 /* If gpr_cv_wait returns true (i.e a timeout), pretend that the worker
640 received a kick */
Craig Tiller55624a32017-05-26 08:14:44 -0700641 SET_KICK_STATE(worker, KICKED);
Craig Tiller32f90ee2017-04-28 12:46:41 -0700642 }
Craig Tillerba550da2017-05-01 14:26:31 +0000643 }
Craig Tiller4509c472017-04-27 19:05:13 +0000644 *now = gpr_now(now->clock_type);
645 }
Sree Kuchibhotla949d0752017-07-20 23:49:15 -0700646
Craig Tiller830e82a2017-05-31 16:26:27 -0700647 if (GRPC_TRACER_ON(grpc_polling_trace)) {
Sree Kuchibhotla949d0752017-07-20 23:49:15 -0700648 gpr_log(GPR_ERROR,
649 "PS:%p BEGIN_DONE:%p kick_state=%s shutdown=%d "
650 "kicked_without_poller: %d",
651 pollset, worker, kick_state_string(worker->kick_state),
652 pollset->shutting_down, pollset->kicked_without_poller);
Craig Tiller830e82a2017-05-31 16:26:27 -0700653 }
Craig Tiller4509c472017-04-27 19:05:13 +0000654
Sree Kuchibhotlae6506bc2017-07-18 21:43:45 -0700655 /* We release pollset lock in this function at a couple of places:
Sree Kuchibhotlaa0616ef2017-07-18 23:49:49 -0700656 * 1. Briefly when assigning pollset to a neighbourhood
Sree Kuchibhotlae6506bc2017-07-18 21:43:45 -0700657 * 2. When doing gpr_cv_wait()
658 * It is possible that 'kicked_without_poller' was set to true during (1) and
659 * 'shutting_down' is set to true during (1) or (2). If either of them is
660 * true, this worker cannot do polling */
Sree Kuchibhotlae6506bc2017-07-18 21:43:45 -0700661 /* TODO(sreek): Perhaps there is a better way to handle kicked_without_poller
662 * case; especially when the worker is the DESIGNATED_POLLER */
663
Sree Kuchibhotlaa0616ef2017-07-18 23:49:49 -0700664 if (pollset->kicked_without_poller) {
665 pollset->kicked_without_poller = false;
666 return false;
667 }
668
669 return worker->kick_state == DESIGNATED_POLLER && !pollset->shutting_down;
Craig Tiller4509c472017-04-27 19:05:13 +0000670}
671
Craig Tillerbbf4c7a2017-04-28 15:12:10 -0700672static bool check_neighbourhood_for_available_poller(
Craig Tillera4b8eb02017-04-29 00:13:52 +0000673 pollset_neighbourhood *neighbourhood) {
Craig Tillerbbf4c7a2017-04-28 15:12:10 -0700674 bool found_worker = false;
675 do {
676 grpc_pollset *inspect = neighbourhood->active_root;
677 if (inspect == NULL) {
678 break;
679 }
680 gpr_mu_lock(&inspect->mu);
681 GPR_ASSERT(!inspect->seen_inactive);
682 grpc_pollset_worker *inspect_worker = inspect->root_worker;
Craig Tillerbbf4c7a2017-04-28 15:12:10 -0700683 if (inspect_worker != NULL) {
Craig Tillera4b8eb02017-04-29 00:13:52 +0000684 do {
Craig Tillerba550da2017-05-01 14:26:31 +0000685 switch (inspect_worker->kick_state) {
686 case UNKICKED:
687 if (gpr_atm_no_barrier_cas(&g_active_poller, 0,
688 (gpr_atm)inspect_worker)) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700689 if (GRPC_TRACER_ON(grpc_polling_trace)) {
690 gpr_log(GPR_DEBUG, " .. choose next poller to be %p",
691 inspect_worker);
692 }
Craig Tiller55624a32017-05-26 08:14:44 -0700693 SET_KICK_STATE(inspect_worker, DESIGNATED_POLLER);
Craig Tillerba550da2017-05-01 14:26:31 +0000694 if (inspect_worker->initialized_cv) {
695 gpr_cv_signal(&inspect_worker->cv);
696 }
Craig Tiller830e82a2017-05-31 16:26:27 -0700697 } else {
698 if (GRPC_TRACER_ON(grpc_polling_trace)) {
699 gpr_log(GPR_DEBUG, " .. beaten to choose next poller");
700 }
Craig Tillera4b8eb02017-04-29 00:13:52 +0000701 }
Craig Tillerba550da2017-05-01 14:26:31 +0000702 // even if we didn't win the cas, there's a worker, we can stop
703 found_worker = true;
704 break;
705 case KICKED:
706 break;
707 case DESIGNATED_POLLER:
708 found_worker = true; // ok, so someone else found the worker, but
709 // we'll accept that
710 break;
Craig Tillerbbf4c7a2017-04-28 15:12:10 -0700711 }
Craig Tillera4b8eb02017-04-29 00:13:52 +0000712 inspect_worker = inspect_worker->next;
Craig Tiller830e82a2017-05-31 16:26:27 -0700713 } while (!found_worker && inspect_worker != inspect->root_worker);
Craig Tillera4b8eb02017-04-29 00:13:52 +0000714 }
715 if (!found_worker) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700716 if (GRPC_TRACER_ON(grpc_polling_trace)) {
717 gpr_log(GPR_DEBUG, " .. mark pollset %p inactive", inspect);
718 }
Craig Tillerbbf4c7a2017-04-28 15:12:10 -0700719 inspect->seen_inactive = true;
Craig Tiller2acab6e2017-04-30 23:06:33 +0000720 if (inspect == neighbourhood->active_root) {
Craig Tillera95bacf2017-05-01 12:51:24 -0700721 neighbourhood->active_root =
722 inspect->next == inspect ? NULL : inspect->next;
Craig Tiller2acab6e2017-04-30 23:06:33 +0000723 }
724 inspect->next->prev = inspect->prev;
725 inspect->prev->next = inspect->next;
Craig Tillere00d7332017-05-01 15:43:51 +0000726 inspect->next = inspect->prev = NULL;
Craig Tillerbbf4c7a2017-04-28 15:12:10 -0700727 }
728 gpr_mu_unlock(&inspect->mu);
729 } while (!found_worker);
Craig Tillerbbf4c7a2017-04-28 15:12:10 -0700730 return found_worker;
731}
732
Craig Tiller4509c472017-04-27 19:05:13 +0000733static void end_worker(grpc_exec_ctx *exec_ctx, grpc_pollset *pollset,
734 grpc_pollset_worker *worker,
735 grpc_pollset_worker **worker_hdl) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700736 if (GRPC_TRACER_ON(grpc_polling_trace)) {
737 gpr_log(GPR_DEBUG, "PS:%p END_WORKER:%p", pollset, worker);
738 }
Craig Tiller8502ecb2017-04-28 14:22:01 -0700739 if (worker_hdl != NULL) *worker_hdl = NULL;
Craig Tiller830e82a2017-05-31 16:26:27 -0700740 /* Make sure we appear kicked */
Craig Tiller55624a32017-05-26 08:14:44 -0700741 SET_KICK_STATE(worker, KICKED);
Craig Tiller50da5ec2017-05-01 13:51:14 -0700742 grpc_closure_list_move(&worker->schedule_on_end_work,
743 &exec_ctx->closure_list);
Craig Tiller8502ecb2017-04-28 14:22:01 -0700744 if (gpr_atm_no_barrier_load(&g_active_poller) == (gpr_atm)worker) {
Craig Tillera4b8eb02017-04-29 00:13:52 +0000745 if (worker->next != worker && worker->next->kick_state == UNKICKED) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700746 if (GRPC_TRACER_ON(grpc_polling_trace)) {
747 gpr_log(GPR_DEBUG, " .. choose next poller to be peer %p", worker);
748 }
Craig Tiller2acab6e2017-04-30 23:06:33 +0000749 GPR_ASSERT(worker->next->initialized_cv);
Craig Tiller32f90ee2017-04-28 12:46:41 -0700750 gpr_atm_no_barrier_store(&g_active_poller, (gpr_atm)worker->next);
Craig Tiller55624a32017-05-26 08:14:44 -0700751 SET_KICK_STATE(worker->next, DESIGNATED_POLLER);
Craig Tiller32f90ee2017-04-28 12:46:41 -0700752 gpr_cv_signal(&worker->next->cv);
Craig Tiller8502ecb2017-04-28 14:22:01 -0700753 if (grpc_exec_ctx_has_work(exec_ctx)) {
754 gpr_mu_unlock(&pollset->mu);
755 grpc_exec_ctx_flush(exec_ctx);
756 gpr_mu_lock(&pollset->mu);
757 }
Craig Tiller32f90ee2017-04-28 12:46:41 -0700758 } else {
759 gpr_atm_no_barrier_store(&g_active_poller, 0);
Craig Tillerbbf4c7a2017-04-28 15:12:10 -0700760 size_t poller_neighbourhood_idx =
761 (size_t)(pollset->neighbourhood - g_neighbourhoods);
Craig Tillerbb742672017-05-17 22:19:05 +0000762 gpr_mu_unlock(&pollset->mu);
Craig Tiller32f90ee2017-04-28 12:46:41 -0700763 bool found_worker = false;
Craig Tillerba550da2017-05-01 14:26:31 +0000764 bool scan_state[MAX_NEIGHBOURHOODS];
Craig Tillerbbf4c7a2017-04-28 15:12:10 -0700765 for (size_t i = 0; !found_worker && i < g_num_neighbourhoods; i++) {
766 pollset_neighbourhood *neighbourhood =
767 &g_neighbourhoods[(poller_neighbourhood_idx + i) %
768 g_num_neighbourhoods];
769 if (gpr_mu_trylock(&neighbourhood->mu)) {
770 found_worker =
Craig Tillera4b8eb02017-04-29 00:13:52 +0000771 check_neighbourhood_for_available_poller(neighbourhood);
Craig Tillerbbf4c7a2017-04-28 15:12:10 -0700772 gpr_mu_unlock(&neighbourhood->mu);
Craig Tillerba550da2017-05-01 14:26:31 +0000773 scan_state[i] = true;
Craig Tillerbbf4c7a2017-04-28 15:12:10 -0700774 } else {
Craig Tillerba550da2017-05-01 14:26:31 +0000775 scan_state[i] = false;
Craig Tiller32f90ee2017-04-28 12:46:41 -0700776 }
Craig Tillerbbf4c7a2017-04-28 15:12:10 -0700777 }
Craig Tiller2acab6e2017-04-30 23:06:33 +0000778 for (size_t i = 0; !found_worker && i < g_num_neighbourhoods; i++) {
Craig Tillerba550da2017-05-01 14:26:31 +0000779 if (scan_state[i]) continue;
Craig Tiller2acab6e2017-04-30 23:06:33 +0000780 pollset_neighbourhood *neighbourhood =
781 &g_neighbourhoods[(poller_neighbourhood_idx + i) %
782 g_num_neighbourhoods];
783 gpr_mu_lock(&neighbourhood->mu);
Craig Tillerba550da2017-05-01 14:26:31 +0000784 found_worker = check_neighbourhood_for_available_poller(neighbourhood);
Craig Tiller2acab6e2017-04-30 23:06:33 +0000785 gpr_mu_unlock(&neighbourhood->mu);
Craig Tillerbbf4c7a2017-04-28 15:12:10 -0700786 }
Craig Tiller8502ecb2017-04-28 14:22:01 -0700787 grpc_exec_ctx_flush(exec_ctx);
Craig Tiller32f90ee2017-04-28 12:46:41 -0700788 gpr_mu_lock(&pollset->mu);
789 }
Craig Tiller50da5ec2017-05-01 13:51:14 -0700790 } else if (grpc_exec_ctx_has_work(exec_ctx)) {
791 gpr_mu_unlock(&pollset->mu);
792 grpc_exec_ctx_flush(exec_ctx);
793 gpr_mu_lock(&pollset->mu);
Craig Tiller4509c472017-04-27 19:05:13 +0000794 }
795 if (worker->initialized_cv) {
796 gpr_cv_destroy(&worker->cv);
797 }
Craig Tiller830e82a2017-05-31 16:26:27 -0700798 if (GRPC_TRACER_ON(grpc_polling_trace)) {
799 gpr_log(GPR_DEBUG, " .. remove worker");
800 }
Craig Tiller32f90ee2017-04-28 12:46:41 -0700801 if (EMPTIED == worker_remove(pollset, worker)) {
Craig Tiller4509c472017-04-27 19:05:13 +0000802 pollset_maybe_finish_shutdown(exec_ctx, pollset);
803 }
Craig Tillera4b8eb02017-04-29 00:13:52 +0000804 GPR_ASSERT(gpr_atm_no_barrier_load(&g_active_poller) != (gpr_atm)worker);
Craig Tiller4509c472017-04-27 19:05:13 +0000805}
806
807/* pollset->po.mu lock must be held by the caller before calling this.
808 The function pollset_work() may temporarily release the lock (pollset->po.mu)
809 during the course of its execution but it will always re-acquire the lock and
810 ensure that it is held by the time the function returns */
811static grpc_error *pollset_work(grpc_exec_ctx *exec_ctx, grpc_pollset *pollset,
812 grpc_pollset_worker **worker_hdl,
813 gpr_timespec now, gpr_timespec deadline) {
814 grpc_pollset_worker worker;
815 grpc_error *error = GRPC_ERROR_NONE;
816 static const char *err_desc = "pollset_work";
817 if (pollset->kicked_without_poller) {
818 pollset->kicked_without_poller = false;
819 return GRPC_ERROR_NONE;
820 }
821 if (begin_worker(pollset, &worker, worker_hdl, &now, deadline)) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700822 gpr_tls_set(&g_current_thread_pollset, (intptr_t)pollset);
Craig Tiller4509c472017-04-27 19:05:13 +0000823 gpr_tls_set(&g_current_thread_worker, (intptr_t)&worker);
Craig Tillerc81512a2017-05-26 09:53:58 -0700824 GPR_ASSERT(!pollset->shutting_down);
Craig Tiller2acab6e2017-04-30 23:06:33 +0000825 GPR_ASSERT(!pollset->seen_inactive);
Craig Tiller32f90ee2017-04-28 12:46:41 -0700826 gpr_mu_unlock(&pollset->mu);
Craig Tiller4509c472017-04-27 19:05:13 +0000827 append_error(&error, pollset_epoll(exec_ctx, pollset, now, deadline),
828 err_desc);
Craig Tiller32f90ee2017-04-28 12:46:41 -0700829 gpr_mu_lock(&pollset->mu);
Craig Tiller4509c472017-04-27 19:05:13 +0000830 gpr_tls_set(&g_current_thread_worker, 0);
Craig Tiller830e82a2017-05-31 16:26:27 -0700831 } else {
832 gpr_tls_set(&g_current_thread_pollset, (intptr_t)pollset);
Craig Tiller4509c472017-04-27 19:05:13 +0000833 }
834 end_worker(exec_ctx, pollset, &worker, worker_hdl);
Craig Tiller8502ecb2017-04-28 14:22:01 -0700835 gpr_tls_set(&g_current_thread_pollset, 0);
Craig Tiller4509c472017-04-27 19:05:13 +0000836 return error;
837}
838
839static grpc_error *pollset_kick(grpc_pollset *pollset,
840 grpc_pollset_worker *specific_worker) {
Craig Tillerb89bac02017-05-26 15:20:32 +0000841 if (GRPC_TRACER_ON(grpc_polling_trace)) {
842 gpr_strvec log;
843 gpr_strvec_init(&log);
844 char *tmp;
Craig Tiller75aef7f2017-05-26 08:26:08 -0700845 gpr_asprintf(
846 &tmp, "PS:%p KICK:%p curps=%p curworker=%p root=%p", pollset,
847 specific_worker, (void *)gpr_tls_get(&g_current_thread_pollset),
848 (void *)gpr_tls_get(&g_current_thread_worker), pollset->root_worker);
Craig Tillerb89bac02017-05-26 15:20:32 +0000849 gpr_strvec_add(&log, tmp);
850 if (pollset->root_worker != NULL) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700851 gpr_asprintf(&tmp, " {kick_state=%s next=%p {kick_state=%s}}",
852 kick_state_string(pollset->root_worker->kick_state),
853 pollset->root_worker->next,
854 kick_state_string(pollset->root_worker->next->kick_state));
Craig Tillerb89bac02017-05-26 15:20:32 +0000855 gpr_strvec_add(&log, tmp);
856 }
857 if (specific_worker != NULL) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700858 gpr_asprintf(&tmp, " worker_kick_state=%s",
859 kick_state_string(specific_worker->kick_state));
Craig Tillerb89bac02017-05-26 15:20:32 +0000860 gpr_strvec_add(&log, tmp);
861 }
862 tmp = gpr_strvec_flatten(&log, NULL);
863 gpr_strvec_destroy(&log);
Craig Tiller830e82a2017-05-31 16:26:27 -0700864 gpr_log(GPR_ERROR, "%s", tmp);
Craig Tillerb89bac02017-05-26 15:20:32 +0000865 gpr_free(tmp);
866 }
Craig Tiller4509c472017-04-27 19:05:13 +0000867 if (specific_worker == NULL) {
868 if (gpr_tls_get(&g_current_thread_pollset) != (intptr_t)pollset) {
Craig Tiller375eb252017-04-27 23:29:12 +0000869 grpc_pollset_worker *root_worker = pollset->root_worker;
870 if (root_worker == NULL) {
Craig Tiller4509c472017-04-27 19:05:13 +0000871 pollset->kicked_without_poller = true;
Craig Tiller75aef7f2017-05-26 08:26:08 -0700872 if (GRPC_TRACER_ON(grpc_polling_trace)) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700873 gpr_log(GPR_ERROR, " .. kicked_without_poller");
Craig Tiller75aef7f2017-05-26 08:26:08 -0700874 }
Craig Tiller4509c472017-04-27 19:05:13 +0000875 return GRPC_ERROR_NONE;
Craig Tiller375eb252017-04-27 23:29:12 +0000876 }
Craig Tiller32f90ee2017-04-28 12:46:41 -0700877 grpc_pollset_worker *next_worker = root_worker->next;
Craig Tiller830e82a2017-05-31 16:26:27 -0700878 if (root_worker->kick_state == KICKED) {
Craig Tiller75aef7f2017-05-26 08:26:08 -0700879 if (GRPC_TRACER_ON(grpc_polling_trace)) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700880 gpr_log(GPR_ERROR, " .. already kicked %p", root_worker);
881 }
882 SET_KICK_STATE(root_worker, KICKED);
883 return GRPC_ERROR_NONE;
884 } else if (next_worker->kick_state == KICKED) {
885 if (GRPC_TRACER_ON(grpc_polling_trace)) {
886 gpr_log(GPR_ERROR, " .. already kicked %p", next_worker);
887 }
888 SET_KICK_STATE(next_worker, KICKED);
889 return GRPC_ERROR_NONE;
890 } else if (root_worker ==
891 next_worker && // only try and wake up a poller if
892 // there is no next worker
893 root_worker == (grpc_pollset_worker *)gpr_atm_no_barrier_load(
894 &g_active_poller)) {
895 if (GRPC_TRACER_ON(grpc_polling_trace)) {
896 gpr_log(GPR_ERROR, " .. kicked %p", root_worker);
Craig Tiller75aef7f2017-05-26 08:26:08 -0700897 }
Craig Tiller55624a32017-05-26 08:14:44 -0700898 SET_KICK_STATE(root_worker, KICKED);
Craig Tiller4509c472017-04-27 19:05:13 +0000899 return grpc_wakeup_fd_wakeup(&global_wakeup_fd);
Craig Tiller8502ecb2017-04-28 14:22:01 -0700900 } else if (next_worker->kick_state == UNKICKED) {
Craig Tiller75aef7f2017-05-26 08:26:08 -0700901 if (GRPC_TRACER_ON(grpc_polling_trace)) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700902 gpr_log(GPR_ERROR, " .. kicked %p", next_worker);
Craig Tiller75aef7f2017-05-26 08:26:08 -0700903 }
Craig Tiller8502ecb2017-04-28 14:22:01 -0700904 GPR_ASSERT(next_worker->initialized_cv);
Craig Tiller55624a32017-05-26 08:14:44 -0700905 SET_KICK_STATE(next_worker, KICKED);
Craig Tiller375eb252017-04-27 23:29:12 +0000906 gpr_cv_signal(&next_worker->cv);
907 return GRPC_ERROR_NONE;
Craig Tiller55624a32017-05-26 08:14:44 -0700908 } else if (next_worker->kick_state == DESIGNATED_POLLER) {
909 if (root_worker->kick_state != DESIGNATED_POLLER) {
Craig Tiller75aef7f2017-05-26 08:26:08 -0700910 if (GRPC_TRACER_ON(grpc_polling_trace)) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700911 gpr_log(
912 GPR_ERROR,
913 " .. kicked root non-poller %p (initialized_cv=%d) (poller=%p)",
914 root_worker, root_worker->initialized_cv, next_worker);
Craig Tiller75aef7f2017-05-26 08:26:08 -0700915 }
Craig Tiller55624a32017-05-26 08:14:44 -0700916 SET_KICK_STATE(root_worker, KICKED);
917 if (root_worker->initialized_cv) {
918 gpr_cv_signal(&root_worker->cv);
919 }
920 return GRPC_ERROR_NONE;
921 } else {
Craig Tiller75aef7f2017-05-26 08:26:08 -0700922 if (GRPC_TRACER_ON(grpc_polling_trace)) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700923 gpr_log(GPR_ERROR, " .. non-root poller %p (root=%p)", next_worker,
Craig Tiller75aef7f2017-05-26 08:26:08 -0700924 root_worker);
925 }
Craig Tiller55624a32017-05-26 08:14:44 -0700926 SET_KICK_STATE(next_worker, KICKED);
927 return grpc_wakeup_fd_wakeup(&global_wakeup_fd);
928 }
Craig Tiller8502ecb2017-04-28 14:22:01 -0700929 } else {
Craig Tiller55624a32017-05-26 08:14:44 -0700930 GPR_ASSERT(next_worker->kick_state == KICKED);
931 SET_KICK_STATE(next_worker, KICKED);
Craig Tiller8502ecb2017-04-28 14:22:01 -0700932 return GRPC_ERROR_NONE;
Craig Tiller4509c472017-04-27 19:05:13 +0000933 }
934 } else {
Craig Tiller830e82a2017-05-31 16:26:27 -0700935 if (GRPC_TRACER_ON(grpc_polling_trace)) {
936 gpr_log(GPR_ERROR, " .. kicked while waking up");
937 }
Craig Tiller4509c472017-04-27 19:05:13 +0000938 return GRPC_ERROR_NONE;
939 }
Craig Tiller43bf2592017-04-28 23:21:01 +0000940 } else if (specific_worker->kick_state == KICKED) {
Craig Tiller75aef7f2017-05-26 08:26:08 -0700941 if (GRPC_TRACER_ON(grpc_polling_trace)) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700942 gpr_log(GPR_ERROR, " .. specific worker already kicked");
Craig Tiller75aef7f2017-05-26 08:26:08 -0700943 }
Craig Tiller4509c472017-04-27 19:05:13 +0000944 return GRPC_ERROR_NONE;
945 } else if (gpr_tls_get(&g_current_thread_worker) ==
946 (intptr_t)specific_worker) {
Craig Tiller75aef7f2017-05-26 08:26:08 -0700947 if (GRPC_TRACER_ON(grpc_polling_trace)) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700948 gpr_log(GPR_ERROR, " .. mark %p kicked", specific_worker);
Craig Tiller75aef7f2017-05-26 08:26:08 -0700949 }
Craig Tiller55624a32017-05-26 08:14:44 -0700950 SET_KICK_STATE(specific_worker, KICKED);
Craig Tiller4509c472017-04-27 19:05:13 +0000951 return GRPC_ERROR_NONE;
Craig Tiller32f90ee2017-04-28 12:46:41 -0700952 } else if (specific_worker ==
953 (grpc_pollset_worker *)gpr_atm_no_barrier_load(&g_active_poller)) {
Craig Tiller75aef7f2017-05-26 08:26:08 -0700954 if (GRPC_TRACER_ON(grpc_polling_trace)) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700955 gpr_log(GPR_ERROR, " .. kick active poller");
Craig Tiller75aef7f2017-05-26 08:26:08 -0700956 }
Craig Tiller55624a32017-05-26 08:14:44 -0700957 SET_KICK_STATE(specific_worker, KICKED);
Craig Tiller4509c472017-04-27 19:05:13 +0000958 return grpc_wakeup_fd_wakeup(&global_wakeup_fd);
Craig Tiller8502ecb2017-04-28 14:22:01 -0700959 } else if (specific_worker->initialized_cv) {
Craig Tiller75aef7f2017-05-26 08:26:08 -0700960 if (GRPC_TRACER_ON(grpc_polling_trace)) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700961 gpr_log(GPR_ERROR, " .. kick waiting worker");
Craig Tiller75aef7f2017-05-26 08:26:08 -0700962 }
Craig Tiller55624a32017-05-26 08:14:44 -0700963 SET_KICK_STATE(specific_worker, KICKED);
Craig Tiller4509c472017-04-27 19:05:13 +0000964 gpr_cv_signal(&specific_worker->cv);
965 return GRPC_ERROR_NONE;
Craig Tiller8502ecb2017-04-28 14:22:01 -0700966 } else {
Craig Tiller75aef7f2017-05-26 08:26:08 -0700967 if (GRPC_TRACER_ON(grpc_polling_trace)) {
Craig Tiller830e82a2017-05-31 16:26:27 -0700968 gpr_log(GPR_ERROR, " .. kick non-waiting worker");
Craig Tiller75aef7f2017-05-26 08:26:08 -0700969 }
Craig Tiller55624a32017-05-26 08:14:44 -0700970 SET_KICK_STATE(specific_worker, KICKED);
Craig Tiller8502ecb2017-04-28 14:22:01 -0700971 return GRPC_ERROR_NONE;
Craig Tiller4509c472017-04-27 19:05:13 +0000972 }
973}
974
975static void pollset_add_fd(grpc_exec_ctx *exec_ctx, grpc_pollset *pollset,
976 grpc_fd *fd) {}
977
Craig Tiller4509c472017-04-27 19:05:13 +0000978/*******************************************************************************
Craig Tillerc67cc992017-04-27 10:15:51 -0700979 * Pollset-set Definitions
980 */
981
982static grpc_pollset_set *pollset_set_create(void) {
983 return (grpc_pollset_set *)((intptr_t)0xdeafbeef);
984}
985
986static void pollset_set_destroy(grpc_exec_ctx *exec_ctx,
987 grpc_pollset_set *pss) {}
988
989static void pollset_set_add_fd(grpc_exec_ctx *exec_ctx, grpc_pollset_set *pss,
990 grpc_fd *fd) {}
991
992static void pollset_set_del_fd(grpc_exec_ctx *exec_ctx, grpc_pollset_set *pss,
993 grpc_fd *fd) {}
994
995static void pollset_set_add_pollset(grpc_exec_ctx *exec_ctx,
996 grpc_pollset_set *pss, grpc_pollset *ps) {}
997
998static void pollset_set_del_pollset(grpc_exec_ctx *exec_ctx,
999 grpc_pollset_set *pss, grpc_pollset *ps) {}
1000
1001static void pollset_set_add_pollset_set(grpc_exec_ctx *exec_ctx,
1002 grpc_pollset_set *bag,
1003 grpc_pollset_set *item) {}
1004
1005static void pollset_set_del_pollset_set(grpc_exec_ctx *exec_ctx,
1006 grpc_pollset_set *bag,
1007 grpc_pollset_set *item) {}
1008
1009/*******************************************************************************
1010 * Event engine binding
1011 */
1012
1013static void shutdown_engine(void) {
1014 fd_global_shutdown();
1015 pollset_global_shutdown();
Sree Kuchibhotla54c31c72017-07-17 14:57:27 -07001016 close(g_epfd);
Craig Tillerc67cc992017-04-27 10:15:51 -07001017}
1018
1019static const grpc_event_engine_vtable vtable = {
1020 .pollset_size = sizeof(grpc_pollset),
1021
1022 .fd_create = fd_create,
1023 .fd_wrapped_fd = fd_wrapped_fd,
1024 .fd_orphan = fd_orphan,
1025 .fd_shutdown = fd_shutdown,
1026 .fd_is_shutdown = fd_is_shutdown,
1027 .fd_notify_on_read = fd_notify_on_read,
1028 .fd_notify_on_write = fd_notify_on_write,
1029 .fd_get_read_notifier_pollset = fd_get_read_notifier_pollset,
Craig Tillerc67cc992017-04-27 10:15:51 -07001030
1031 .pollset_init = pollset_init,
1032 .pollset_shutdown = pollset_shutdown,
1033 .pollset_destroy = pollset_destroy,
1034 .pollset_work = pollset_work,
1035 .pollset_kick = pollset_kick,
1036 .pollset_add_fd = pollset_add_fd,
1037
1038 .pollset_set_create = pollset_set_create,
1039 .pollset_set_destroy = pollset_set_destroy,
1040 .pollset_set_add_pollset = pollset_set_add_pollset,
1041 .pollset_set_del_pollset = pollset_set_del_pollset,
1042 .pollset_set_add_pollset_set = pollset_set_add_pollset_set,
1043 .pollset_set_del_pollset_set = pollset_set_del_pollset_set,
1044 .pollset_set_add_fd = pollset_set_add_fd,
1045 .pollset_set_del_fd = pollset_set_del_fd,
1046
Craig Tillerc67cc992017-04-27 10:15:51 -07001047 .shutdown_engine = shutdown_engine,
1048};
1049
1050/* It is possible that GLIBC has epoll but the underlying kernel doesn't.
1051 * Create a dummy epoll_fd to make sure epoll support is available */
Craig Tiller6f0af492017-04-27 19:26:16 +00001052const grpc_event_engine_vtable *grpc_init_epoll1_linux(bool explicit_request) {
Craig Tillerc67cc992017-04-27 10:15:51 -07001053 if (!grpc_has_wakeup_fd()) {
1054 return NULL;
1055 }
1056
Craig Tiller4509c472017-04-27 19:05:13 +00001057 g_epfd = epoll_create1(EPOLL_CLOEXEC);
1058 if (g_epfd < 0) {
1059 gpr_log(GPR_ERROR, "epoll unavailable");
Craig Tillerc67cc992017-04-27 10:15:51 -07001060 return NULL;
1061 }
1062
Craig Tillerc67cc992017-04-27 10:15:51 -07001063 fd_global_init();
1064
1065 if (!GRPC_LOG_IF_ERROR("pollset_global_init", pollset_global_init())) {
Craig Tiller4509c472017-04-27 19:05:13 +00001066 close(g_epfd);
1067 fd_global_shutdown();
Craig Tillerc67cc992017-04-27 10:15:51 -07001068 return NULL;
1069 }
1070
Craig Tiller830e82a2017-05-31 16:26:27 -07001071 gpr_log(GPR_ERROR, "grpc epoll fd: %d", g_epfd);
1072
Craig Tillerc67cc992017-04-27 10:15:51 -07001073 return &vtable;
1074}
1075
1076#else /* defined(GRPC_LINUX_EPOLL) */
1077#if defined(GRPC_POSIX_SOCKET)
1078#include "src/core/lib/iomgr/ev_posix.h"
1079/* If GRPC_LINUX_EPOLL is not defined, it means epoll is not available. Return
1080 * NULL */
Craig Tiller9ddb3152017-04-27 21:32:56 +00001081const grpc_event_engine_vtable *grpc_init_epoll1_linux(bool explicit_request) {
1082 return NULL;
1083}
Craig Tillerc67cc992017-04-27 10:15:51 -07001084#endif /* defined(GRPC_POSIX_SOCKET) */
1085#endif /* !defined(GRPC_LINUX_EPOLL) */