The FreeRADIUS server $Id: 15bac2a4c627c01d1aa2047687b3418955ac7f00 $
Loading...
Searching...
No Matches
schedule.c
Go to the documentation of this file.
1/*
2 * This program is free software; you can redistribute it and/or modify
3 * it under the terms of the GNU General Public License as published by
4 * the Free Software Foundation; either version 2 of the License, or
5 * (at your option) any later version.
6 *
7 * This program is distributed in the hope that it will be useful,
8 * but WITHOUT ANY WARRANTY; without even the implied warranty of
9 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
10 * GNU General Public License for more details.
11 *
12 * You should have received a copy of the GNU General Public License
13 * along with this program; if not, write to the Free Software
14 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
15 */
16
17/**
18 * $Id: 81485068bc3214427fd6f54c0993939a3a8a0f01 $
19 *
20 * @brief Network / worker thread scheduling
21 * @file io/schedule.c
22 *
23 * @copyright 2016 Alan DeKok (aland@freeradius.org)
24 */
25RCSID("$Id: 81485068bc3214427fd6f54c0993939a3a8a0f01 $")
26
27#define LOG_DST sc->log
28
29#include <freeradius-devel/autoconf.h>
30
31#include <freeradius-devel/io/schedule.h>
32#include <freeradius-devel/util/dlist.h>
33#include <freeradius-devel/util/rb.h>
34#include <freeradius-devel/util/syserror.h>
35#include <freeradius-devel/server/trigger.h>
36
37#include <pthread.h>
38
39/*
40 * Other OS's have sem_init, OS X doesn't.
41 */
42#ifdef HAVE_SEMAPHORE_H
43#include <semaphore.h>
44#endif
45
46#define SEMAPHORE_LOCKED (0)
47
48#ifdef __APPLE__
49#include <mach/task.h>
50#include <mach/mach_init.h>
51#include <mach/semaphore.h>
52
53#undef sem_t
54#define sem_t semaphore_t
55#undef sem_init
56#define sem_init(s,p,c) semaphore_create(mach_task_self(),s,SYNC_POLICY_FIFO,c)
57#undef sem_wait
58#define sem_wait(s) semaphore_wait(*s)
59#undef sem_post
60#define sem_post(s) semaphore_signal(*s)
61#undef sem_destroy
62#define sem_destroy(s) semaphore_destroy(mach_task_self(),*s)
63#endif /* __APPLE__ */
64
65#define SEM_WAIT_INTR(_x) do {if (sem_wait(_x) == 0) break;} while (errno == EINTR)
66
67/**
68 * Track the child thread status.
69 */
71 FR_CHILD_FREE = 0, //!< child is free
72 FR_CHILD_INITIALIZING, //!< initialized, but not running
73 FR_CHILD_RUNNING, //!< running, and in the running queue
74 FR_CHILD_EXITED, //!< exited, and in the exited queue
75 FR_CHILD_FAIL //!< failed, and in the exited queue
77
78/** Scheduler specific information for worker threads
79 *
80 * Wraps a fr_worker_t, tracking additional information that
81 * the scheduler uses.
82 */
83typedef struct {
84 TALLOC_CTX *ctx; //!< our allocation ctx
85 fr_event_list_t *el; //!< our event list
86 pthread_t pthread_id; //!< the thread of this worker
87
88 unsigned int id; //!< a unique ID
89 int uses; //!< how many network threads are using it
90 fr_time_t cpu_time; //!< how much CPU time this worker has used
91
92 fr_dlist_t entry; //!< our entry into the linked list of workers
93
94 fr_schedule_t *sc; //!< the scheduler we are running under
95
96 fr_schedule_child_status_t status; //!< status of the worker
97 fr_worker_t *worker; //!< the worker data structure
99
100/** Scheduler specific information for network threads
101 *
102 * Wraps a fr_network_t, tracking additional information that
103 * the scheduler uses.
104 */
105typedef struct {
106 TALLOC_CTX *ctx; //!< our allocation ctx
107 pthread_t pthread_id; //!< the thread of this network
108
109 unsigned int id; //!< a unique ID
110
111 fr_dlist_t entry; //!< our entry into the linked list of networks
112
113 fr_schedule_t *sc; //!< the scheduler we are running under
114
115 fr_schedule_child_status_t status; //!< status of the worker
116 fr_network_t *nr; //!< the receive data structure
117
118 fr_timer_t *ev; //!< timer for stats_interval
120
121
122/**
123 * The scheduler
124 */
126 bool running; //!< is the scheduler running?
127
128 CONF_SECTION *cs; //!< thread pool configuration section
129 fr_event_list_t *el; //!< event list for single-threaded mode.
130
131 fr_log_t *log; //!< log destination
132 fr_log_lvl_t lvl; //!< log level
133
134 fr_schedule_config_t *config; //!< configuration
135
136 unsigned int num_workers_exited; //!< number of exited workers
137
138 sem_t worker_sem; //!< for inter-thread signaling
139 sem_t network_sem; //!< for inter-thread signaling
140
143
144 fr_dlist_head_t workers; //!< list of workers
145 fr_dlist_head_t networks; //!< list of networks
146
147 fr_network_t *single_network; //!< for single-threaded mode
148 fr_worker_t *single_worker; //!< for single-threaded mode
149};
150
151static _Thread_local int worker_id; //!< Internal ID of the current worker thread.
152
153/** Return the worker id for the current thread
154 *
155 * @return worker ID
156 */
158{
159 return worker_id;
160}
161
162/** Entry point for worker threads
163 *
164 * @param[in] arg the fr_schedule_worker_t
165 * @return NULL
166 */
167static void *fr_schedule_worker_thread(void *arg)
168{
169 TALLOC_CTX *ctx;
170 fr_schedule_worker_t *sw = talloc_get_type_abort(arg, fr_schedule_worker_t);
171 fr_schedule_t *sc = sw->sc;
174 char worker_name[32];
175
176#ifndef __APPLE__
177 /*
178 * This ifdef is because macOS doesn't use pthread_sigmask in its
179 * setcontext function, and seems to apply the signal mask of the thread
180 * to the entire process when setcontext is called.
181 *
182 * * frame #0: 0x00000001934118b0 libsystem_kernel.dylib`sigprocmask
183 * frame #1: 0x0000000193481f3c libsystem_platform.dylib`setcontext + 44
184 * frame #2: 0x0000000100f27298 libcrypto.3.dylib`async_fibre_swapcontext + 52
185 * frame #3: 0x0000000100f274a0 libcrypto.3.dylib`ASYNC_start_job + 496
186 * frame #4: 0x0000000100b17884 libssl.3.dylib`ssl_start_async_job + 116
187 * frame #5: 0x0000000100b17804 libssl.3.dylib`ssl_read_internal + 356
188 * frame #6: 0x0000000100b17a0c libssl.3.dylib`SSL_read + 28
189 * frame #7: 0x00000001004f5b94 libfreeradius-tls.dylib`tls_session_async_handshake_cont(p_result=0x0000000112815c7c, priority=0x0000000112815edc, request=0x0000000112815a80, uctx=0x0000000139160060) at session.c:1366:26
190 */
191 sigset_t sigset;
192
193 sigfillset(&sigset);
194
195 /*
196 * Ensure workers aren't interrupted by signals.
197 * The main thread, and main event loop are mostly
198 * idle, so they can handle signals.
199 */
200 pthread_sigmask(SIG_BLOCK, &sigset, NULL);
201#endif
202
203 worker_id = sw->id; /* Store the current worker ID */
204
205 snprintf(worker_name, sizeof(worker_name), "Worker %d", sw->id);
206
207 sw->ctx = ctx = talloc_init("%s", worker_name);
208 if (!ctx) {
209 ERROR("%s - Failed allocating memory", worker_name);
210 goto fail;
211 }
212
213 INFO("%s - Starting", worker_name);
214
215 sw->el = fr_event_list_alloc(ctx, NULL, NULL);
216 if (!sw->el) {
217 PERROR("%s - Failed creating event list", worker_name);
218 goto fail;
219 }
220
221
222 sw->worker = fr_worker_create(ctx, sw->el, worker_name, sc->log, sc->lvl, &sc->config->worker);
223 if (!sw->worker) {
224 PERROR("%s - Failed creating worker", worker_name);
225 goto fail;
226 }
227
228 /*
229 * @todo make this a registry
230 */
231 if (sc->worker_thread_instantiate) {
232 CONF_SECTION *cs;
233 char section_name[32];
234
235 snprintf(section_name, sizeof(section_name), "%u", sw->id);
236
237 cs = cf_section_find(sc->cs, "worker", section_name);
238 if (!cs) cs = cf_section_find(sc->cs, "worker", NULL);
239
240 if (sc->worker_thread_instantiate(sw->ctx, sw->el, cs) < 0) {
241 PERROR("%s - Worker thread instantiation failed", worker_name);
242 goto fail;
243 }
244 }
245
247
248 /*
249 * Add this worker to all network threads.
250 */
251 for (sn = fr_dlist_head(&sc->networks);
252 sn != NULL;
253 sn = fr_dlist_next(&sc->networks, sn)) {
254 if (unlikely(fr_network_worker_add(sn->nr, sw->worker) < 0)) {
255 PERROR("%s - Failed adding worker to network %u", worker_name, sn->id);
256 goto fail; /* FIXME - Should maybe try to undo partial adds? */
257 }
258 }
259
260 DEBUG3("%s - Started", worker_name);
261
262 /*
263 * Tell the originator that the thread has started.
264 */
265 sem_post(&sc->worker_sem);
266
267 /*
268 * Do all of the work.
269 */
270 fr_worker(sw->worker);
271
272 status = FR_CHILD_EXITED;
273
274fail:
275 sw->status = status;
276
277 if (sw->worker) {
279 sw->worker = NULL;
280 }
281
282 INFO("%s - Exiting", worker_name);
283
284 if (sc->worker_thread_detach) sc->worker_thread_detach(NULL); /* Fixme once we figure out what uctx should be */
285
286 /*
287 * Not looping at this point, but may catch timer/fd
288 * insertions being done after the thread should have
289 * exited.
290 */
291 if (sw->el) fr_event_loop_exit(sw->el, 1);
292
293 /*
294 * Tell the scheduler we're done.
295 */
296 sem_post(&sc->worker_sem);
297
298 talloc_free(ctx);
299
300 return NULL;
301}
302
303
304static void stats_timer(fr_timer_list_t *tl, fr_time_t now, void *uctx)
305{
306 fr_schedule_network_t *sn = talloc_get_type_abort(uctx, fr_schedule_network_t);
307
308 fr_network_stats_log(sn->nr, sn->sc->log);
309
310 (void) fr_timer_at(sn, tl, &sn->ev, fr_time_add(now, sn->sc->config->stats_interval), false, stats_timer, sn);
311}
312
313/** Initialize and run the network thread.
314 *
315 * @param[in] arg the fr_schedule_network_t
316 * @return NULL
317 */
318static void *fr_schedule_network_thread(void *arg)
319{
320 TALLOC_CTX *ctx;
321 fr_schedule_network_t *sn = talloc_get_type_abort(arg, fr_schedule_network_t);
322 fr_schedule_t *sc = sn->sc;
325 char network_name[32];
326
327#ifndef __APPLE__
328 /*
329 * This ifdef is because macOS doesn't use pthread_sigmask in its
330 * setcontext function, and seems to apply the signal mask of the thread
331 * to the entire process when setcontext is called.
332 *
333 * * frame #0: 0x00000001934118b0 libsystem_kernel.dylib`sigprocmask
334 * frame #1: 0x0000000193481f3c libsystem_platform.dylib`setcontext + 44
335 * frame #2: 0x0000000100f27298 libcrypto.3.dylib`async_fibre_swapcontext + 52
336 * frame #3: 0x0000000100f274a0 libcrypto.3.dylib`ASYNC_start_job + 496
337 * frame #4: 0x0000000100b17884 libssl.3.dylib`ssl_start_async_job + 116
338 * frame #5: 0x0000000100b17804 libssl.3.dylib`ssl_read_internal + 356
339 * frame #6: 0x0000000100b17a0c libssl.3.dylib`SSL_read + 28
340 * frame #7: 0x00000001004f5b94 libfreeradius-tls.dylib`tls_session_async_handshake_cont(p_result=0x0000000112815c7c, priority=0x0000000112815edc, request=0x0000000112815a80, uctx=0x0000000139160060) at session.c:1366:26
341 */
342 sigset_t sigset;
343
344 sigfillset(&sigset);
345
346 /*
347 * Ensure network threads aren't interrupted by signals.
348 * The main thread, and main event loop are mostly
349 * idle, so they can handle signals.
350 */
351 pthread_sigmask(SIG_BLOCK, &sigset, NULL);
352#endif
353
354 snprintf(network_name, sizeof(network_name), "Network %d", sn->id);
355
356 INFO("%s - Starting", network_name);
357
358 sn->ctx = ctx = talloc_init("%s", network_name);
359 if (!ctx) {
360 ERROR("%s - Failed allocating memory", network_name);
361 goto fail;
362 }
363
364 el = fr_event_list_alloc(ctx, NULL, NULL);
365 if (!el) {
366 PERROR("%s - Failed creating event list", network_name);
367 goto fail;
368 }
369
370 sn->nr = fr_network_create(ctx, el, network_name, sc->log, sc->lvl, &sc->config->network);
371 if (!sn->nr) {
372 PERROR("%s - Failed creating network", network_name);
373 goto fail;
374 }
375
377
378 /*
379 * Tell the originator that the thread has started.
380 */
381 sem_post(&sc->network_sem);
382
383 DEBUG3("%s - Started", network_name);
384
385 /*
386 * Print out statistics for this network IO handler.
387 */
388 if (fr_time_delta_ispos(sc->config->stats_interval)) {
389 (void) fr_timer_in(sn, el->tl, &sn->ev, sn->sc->config->stats_interval, false, stats_timer, sn);
390 }
391 /*
392 * Call the main event processing loop of the network
393 * thread. This will not return until the thread is
394 * about to exit.
395 */
396 fr_network(sn->nr);
397
398 status = FR_CHILD_EXITED;
399
400fail:
401 sn->status = status;
402
403 INFO("%s - Exiting", network_name);
404
405 /*
406 * Tell the scheduler we're done.
407 */
408 sem_post(&sc->network_sem);
409
410 talloc_free(ctx);
411
412 return NULL;
413}
414
/** Creates a new thread using our standard set of options
 *
 * New threads are created joinable, i.e. you can call pthread_join on them
 * to confirm they've exited.
 *
 * @note This function does not touch the signal mask.  The worker and network
 *	thread entry points in this file block signals themselves with
 *	pthread_sigmask() (except on macOS).
 *
 * @param[out] thread	handle that was created by pthread_create.
 * @param[in] func	entry point for the thread.
 * @param[in] arg	Argument to pass to func.
 * @return
 *	- 0 on success.
 *	- -1 on failure, with the reason available via fr_strerror().
 */
int fr_schedule_pthread_create(pthread_t *thread, void *(*func)(void *), void *arg)
{
	pthread_attr_t	attr;
	int		ret;

	ret = pthread_attr_init(&attr);
	if (ret != 0) {
		fr_strerror_printf("Failed initialising thread attributes: %s", fr_syserror(ret));
		return -1;
	}

	/*
	 *	Set the thread to wait around after it's exited
	 *	so it can be joined.  This is more of a useful
	 *	mechanism for the parent to determine if all
	 *	the threads have exited so it can continue with
	 *	a graceful shutdown.
	 */
	ret = pthread_attr_setdetachstate(&attr, PTHREAD_CREATE_JOINABLE);
	if (ret == 0) ret = pthread_create(thread, &attr, func, arg);

	/*
	 *	The attribute object is only needed for the duration
	 *	of the pthread_create call.  Release it on both the
	 *	success and failure paths so it is never leaked.
	 */
	(void) pthread_attr_destroy(&attr);

	if (ret != 0) {
		fr_strerror_printf("Failed creating thread: %s", fr_syserror(ret));
		return -1;
	}

	return 0;
}
451
452/** Create a scheduler and spawn the child threads.
453 *
454 * @param[in] ctx talloc context.
455 * @param[in] el event list, only for single-threaded mode.
456 * @param[in] logger destination for all logging messages.
457 * @param[in] lvl log level.
458 * @param[in] worker_thread_instantiate callback for new worker threads.
459 * @param[in] worker_thread_detach callback to destroy resources
460 * allocated by worker_thread_instantiate.
461 * @param[in] config configuration for the scheduler
462 * @return
463 * - NULL on error
464 * - fr_schedule_t new scheduler
465 */
467 fr_log_t *logger, fr_log_lvl_t lvl,
468 fr_schedule_thread_instantiate_t worker_thread_instantiate,
469 fr_schedule_thread_detach_t worker_thread_detach,
471{
472 unsigned int i;
473 fr_schedule_worker_t *sw, *next_sw;
474 fr_schedule_network_t *sn, *next_sn;
476
477 sc = talloc_zero(ctx, fr_schedule_t);
478 if (!sc) {
479 fr_strerror_const("Failed allocating memory");
480 return NULL;
481 }
482
483 sc->config = config;
484 sc->el = el;
485 sc->log = logger;
486 sc->lvl = lvl;
487
488 sc->worker_thread_instantiate = worker_thread_instantiate;
489 sc->worker_thread_detach = worker_thread_detach;
490 sc->running = true;
491
492 /*
493 * If we're single-threaded, create network / worker, and insert them into the event loop.
494 */
495 if (el) {
496 sc->single_network = fr_network_create(sc, el, "Network", sc->log, sc->lvl, &sc->config->network);
497 if (!sc->single_network) {
498 PERROR("Failed creating network");
499 pre_instantiate_st_fail:
501 return NULL;
502 }
503
504 sc->single_worker = fr_worker_create(sc, el, "Worker", sc->log, sc->lvl, &sc->config->worker);
505 if (!sc->single_worker) {
506 PERROR("Failed creating worker");
507 if (unlikely(fr_network_destroy(sc->single_network) < 0)) {
508 PERROR("Failed destroying network");
509 }
510 goto pre_instantiate_st_fail;
511 }
512
513 /*
514 * Parent thread-specific data from the single_worker
515 */
516 if (sc->worker_thread_instantiate) {
517 CONF_SECTION *subcs;
518
519 subcs = cf_section_find(sc->cs, "worker", "0");
520 if (!subcs) subcs = cf_section_find(sc->cs, "worker", NULL);
521
522 if (sc->worker_thread_instantiate(sc->single_worker, el, subcs) < 0) {
523 PERROR("Worker thread instantiation failed");
524 destroy_both:
525 if (unlikely(fr_network_destroy(sc->single_network) < 0)) {
526 PERROR("Failed destroying network");
527 }
528 fr_worker_destroy(sc->single_worker);
529 goto pre_instantiate_st_fail;
530 }
531 }
532
533 if (fr_command_register_hook(NULL, "0", sc->single_worker, cmd_worker_table) < 0) {
534 PERROR("Failed adding worker commands");
535 st_fail:
536 if (sc->worker_thread_detach) sc->worker_thread_detach(NULL);
537 goto destroy_both;
538 }
539
540 if (fr_command_register_hook(NULL, "0", sc->single_network, cmd_network_table) < 0) {
541 PERROR("Failed adding network commands");
542 goto st_fail;
543 }
544
545 /*
546 * Register the worker with the network, so
547 * things like fr_network_send_request() work.
548 */
549 fr_network_worker_add_self(sc->single_network, sc->single_worker);
550 DEBUG("Scheduler created in single-threaded mode");
551
552 if (fr_event_pre_insert(el, fr_worker_pre_event, sc->single_worker) < 0) {
553 fr_strerror_const("Failed adding pre-check to event list");
554 goto st_fail;
555 }
556
557 /*
558 * Add the event which processes request_t packets.
559 */
560 if (fr_event_post_insert(el, fr_worker_post_event, sc->single_worker) < 0) {
561 fr_strerror_const("Failed inserting post-processing event");
562 goto st_fail;
563 }
564
565 return sc;
566 }
567
568 /*
569 * Parse any scheduler-specific configuration.
570 */
571 if (!config) {
572 MEM(sc->config = talloc_zero(sc, fr_schedule_config_t));
573 sc->config->max_networks = 1;
574 sc->config->max_workers = 4;
575 } else {
576 sc->config = config;
577
578 if (sc->config->max_networks < 1) sc->config->max_networks = 1;
579 if (sc->config->max_networks > 64) sc->config->max_networks = 64;
580 if (sc->config->max_workers < 1) sc->config->max_workers = 1;
581 if (sc->config->max_workers > 64) sc->config->max_workers = 64;
582 }
583
584 /*
585 * Create the lists which hold the workers and networks.
586 */
587 fr_dlist_init(&sc->workers, fr_schedule_worker_t, entry);
588 fr_dlist_init(&sc->networks, fr_schedule_network_t, entry);
589
590 memset(&sc->network_sem, 0, sizeof(sc->network_sem));
591 if (sem_init(&sc->network_sem, 0, SEMAPHORE_LOCKED) != 0) {
592 ERROR("Failed creating semaphore: %s", fr_syserror(errno));
594 return NULL;
595 }
596
597 memset(&sc->worker_sem, 0, sizeof(sc->worker_sem));
598 if (sem_init(&sc->worker_sem, 0, SEMAPHORE_LOCKED) != 0) {
599 ERROR("Failed creating semaphore: %s", fr_syserror(errno));
601 return NULL;
602 }
603
604 /*
605 * Create the network threads first.
606 */
607 for (i = 0; i < sc->config->max_networks; i++) {
608 DEBUG3("Creating %u/%u networks", i + 1, sc->config->max_networks);
609
610 /*
611 * Create a network "glue" structure
612 */
613 sn = talloc_zero(sc, fr_schedule_network_t);
614 if (!sn) {
615 ERROR("Network %u - Failed allocating memory", i);
616 break;
617 }
618
619 sn->id = i;
620 sn->sc = sc;
622 fr_dlist_insert_head(&sc->networks, sn);
623
625 PERROR("Failed creating network %u", i);
626 break;
627 }
628 }
629
630 /*
631 * Wait for all of the networks to signal us that either
632 * they've started, OR there's been a problem and they
633 * can't start.
634 */
635 for (i = 0; i < (unsigned int)fr_dlist_num_elements(&sc->networks); i++) {
636 DEBUG3("Waiting for semaphore from network %u/%u",
637 i + 1, (unsigned int)fr_dlist_num_elements(&sc->networks));
638 SEM_WAIT_INTR(&sc->network_sem);
639 }
640
641 /*
642 * See if all of the networks have started.
643 */
644 for (sn = fr_dlist_head(&sc->networks);
645 sn != NULL;
646 sn = next_sn) {
647 next_sn = fr_dlist_next(&sc->networks, sn);
648
649 if (sn->status != FR_CHILD_RUNNING) {
650 fr_dlist_remove(&sc->networks, sn);
651 continue;
652 }
653 }
654
655 /*
656 * Failed to start some networks, refuse to do anything!
657 */
658 if ((unsigned int)fr_dlist_num_elements(&sc->networks) < sc->config->max_networks) {
660 return NULL;
661 }
662
663 /*
664 * Create all of the workers.
665 */
666 for (i = 0; i < sc->config->max_workers; i++) {
667 DEBUG3("Creating %u/%u workers", i + 1, sc->config->max_workers);
668
669 /*
670 * Create a worker "glue" structure
671 */
672 sw = talloc_zero(sc, fr_schedule_worker_t);
673 if (!sw) {
674 ERROR("Worker %u - Failed allocating memory", i);
675 break;
676 }
677
678 sw->id = i;
679 sw->sc = sc;
681 fr_dlist_insert_head(&sc->workers, sw);
682
684 PERROR("Failed creating worker %u", i);
685 break;
686 }
687 }
688
689 /*
690 * Wait for all of the workers to signal us that either
691 * they've started, OR there's been a problem and they
692 * can't start.
693 */
694 for (i = 0; i < (unsigned int)fr_dlist_num_elements(&sc->workers); i++) {
695 DEBUG3("Waiting for semaphore from worker %u/%u",
696 i + 1, (unsigned int)fr_dlist_num_elements(&sc->workers));
697 SEM_WAIT_INTR(&sc->worker_sem);
698 }
699
700 /*
701 * See if all of the workers have started.
702 */
703 for (sw = fr_dlist_head(&sc->workers);
704 sw != NULL;
705 sw = next_sw) {
706
707 next_sw = fr_dlist_next(&sc->workers, sw);
708
709 if (sw->status != FR_CHILD_RUNNING) {
710 fr_dlist_remove(&sc->workers, sw);
711 continue;
712 }
713 }
714
715 /*
716 * Failed to start some workers, refuse to do anything!
717 */
718 if ((unsigned int)fr_dlist_num_elements(&sc->workers) < sc->config->max_workers) {
720 return NULL;
721 }
722
723 for (sw = fr_dlist_head(&sc->workers), i = 0;
724 sw != NULL;
725 sw = next_sw, i++) {
726 char buffer[32];
727
728 next_sw = fr_dlist_next(&sc->workers, sw);
729
730 snprintf(buffer, sizeof(buffer), "%d", i);
732 PERROR("Failed adding worker commands");
733 goto st_fail;
734 }
735 }
736
737 for (sn = fr_dlist_head(&sc->networks), i = 0;
738 sn != NULL;
739 sn = next_sn, i++) {
740 char buffer[32];
741
742 next_sn = fr_dlist_next(&sc->networks, sn);
743
744 snprintf(buffer, sizeof(buffer), "%d", i);
746 PERROR("Failed adding network commands");
747 goto st_fail;
748 }
749 }
750
751 if (sc) INFO("Scheduler created successfully with %u networks and %u workers",
752 sc->config->max_networks, (unsigned int)fr_dlist_num_elements(&sc->workers));
753
754 return sc;
755}
756
757/** Destroy a scheduler, and tell its child threads to exit.
758 *
759 * @note This may be called with no worker or network threads in the case of an
760 * instantiation error. This function _should_ deal with that condition
761 * gracefully.
762 *
763 * @param[in] sc_to_free the scheduler
764 * @return
765 * - <0 on error
766 * - 0 on success
767 */
769{
770 fr_schedule_t *sc = *sc_to_free;
771 unsigned int i;
774 int ret;
775
776 if (!sc) return 0;
777
778 sc->running = false;
779
780 /*
781 * Single threaded mode: kill the only network / worker we have.
782 */
783 if (sc->el) {
784 /*
785 * Destroy the network side first. It tells the
786 * workers to close.
787 */
788 if (unlikely(fr_network_destroy(sc->single_network) < 0)) {
789 ERROR("Failed destroying network");
790 }
791 fr_worker_destroy(sc->single_worker);
792 goto done;
793 }
794
795 /*
796 * Signal each network thread to exit.
797 */
798 for (sn = fr_dlist_head(&sc->networks);
799 sn != NULL;
800 sn = fr_dlist_next(&sc->networks, sn)) {
801 if (fr_network_exit(sn->nr) < 0) {
802 PERROR("Failed signaling network %i to exit", sn->id);
803 }
804 }
805
806 /*
807 * If the network threads are running, tell them to exit,
808 * and wait for them to do so. Each network thread tells
809 * all of its worker threads that it's exiting. It then
810 * closes the channels. When the workers see that there
811 * are no input channels, they exit, too.
812 */
813 for (i = 0; i < (unsigned int)fr_dlist_num_elements(&sc->networks); i++) {
814 DEBUG2("Scheduler - Waiting for semaphore indicating network exit %u/%u", i + 1,
815 (unsigned int)fr_dlist_num_elements(&sc->networks));
816 SEM_WAIT_INTR(&sc->network_sem);
817 }
818 DEBUG2("Scheduler - All networks indicated exit complete");
819
820 while ((sn = fr_dlist_head(&sc->networks)) != NULL) {
821 fr_dlist_remove(&sc->networks, sn);
822
823 /*
824 * Ensure that the thread has exited before
825 * cleaning up the context.
826 *
827 * This also ensures that the child threads have
828 * exited before the main thread cleans up the
829 * module instances.
830 */
831 if ((ret = pthread_join(sn->pthread_id, NULL)) != 0) {
832 ERROR("Failed joining network %i: %s", sn->id, fr_syserror(ret));
833 } else {
834 DEBUG2("Network %i joined (cleaned up)", sn->id);
835 }
836 }
837
838 /*
839 * Wait for all worker threads to finish. THEN clean up
840 * modules. Otherwise, the modules will be removed from
841 * underneath the workers!
842 */
843 for (i = 0; i < (unsigned int)fr_dlist_num_elements(&sc->workers); i++) {
844 DEBUG2("Scheduler - Waiting for semaphore indicating worker exit %u/%u", i + 1,
845 (unsigned int)fr_dlist_num_elements(&sc->workers));
846 SEM_WAIT_INTR(&sc->worker_sem);
847 }
848 DEBUG2("Scheduler - All workers indicated exit complete");
849
850 /*
851 * Clean up the exited workers.
852 */
853 while ((sw = fr_dlist_head(&sc->workers)) != NULL) {
854 fr_dlist_remove(&sc->workers, sw);
855
856 /*
857 * Ensure that the thread has exited before
858 * cleaning up the context.
859 *
860 * This also ensures that the child threads have
861 * exited before the main thread cleans up the
862 * module instances.
863 */
864 if ((ret = pthread_join(sw->pthread_id, NULL)) != 0) {
865 ERROR("Failed joining worker %i: %s", sw->id, fr_syserror(ret));
866 } else {
867 DEBUG2("Worker %i joined (cleaned up)", sw->id);
868 }
869 }
870
871 sem_destroy(&sc->network_sem);
872 sem_destroy(&sc->worker_sem);
873done:
874 /*
875 * Now that all of the workers are done, we can return to
876 * the caller, and have it dlclose() the modules.
877 */
879 *sc_to_free = NULL;
880
881 return 0;
882}
883
884/** Add a fr_listen_t to a scheduler.
885 *
886 * @param[in] sc the scheduler
887 * @param[in] li the ctx and callbacks for the transport.
888 * @return
889 * - NULL on error
890 * - the fr_network_t that the socket was added to.
891 */
893{
894 fr_network_t *nr;
895
896 (void) talloc_get_type_abort(sc, fr_schedule_t);
897
898 if (sc->el) {
899 nr = sc->single_network;
900 } else {
902
903 /*
904 * @todo - round robin it among the listeners?
905 * or maybe add it to the same parent thread?
906 */
907 sn = fr_dlist_head(&sc->networks);
908 nr = sn->nr;
909 }
910
911 if (fr_network_listen_add(nr, li) < 0) return NULL;
912
913 return nr;
914}
915
916/** Add a directory NOTE_EXTEND to a scheduler.
917 *
918 * @param[in] sc the scheduler
919 * @param[in] li the ctx and callbacks for the transport.
920 * @return
921 * - NULL on error
922 * - the fr_network_t that the socket was added to.
923 */
925{
926 fr_network_t *nr;
927
928 (void) talloc_get_type_abort(sc, fr_schedule_t);
929
930 if (sc->el) {
931 nr = sc->single_network;
932 } else {
934
935 /*
936 * @todo - round robin it among the listeners?
937 * or maybe add it to the same parent thread?
938 */
939 sn = fr_dlist_head(&sc->networks);
940 nr = sn->nr;
941 }
942
943 if (fr_network_directory_add(nr, li) < 0) return NULL;
944
945 return nr;
946}
static int const char char buffer[256]
Definition acutest.h:576
#define RCSID(id)
Definition build.h:485
#define unlikely(_x)
Definition build.h:383
A section grouping multiple CONF_PAIR.
Definition cf_priv.h:101
CONF_SECTION * cf_section_find(CONF_SECTION const *cs, char const *name1, char const *name2)
Find a CONF_SECTION with name1 and optionally name2.
Definition cf_util.c:1028
fr_command_register_hook_t fr_command_register_hook
Definition command.c:42
#define MEM(x)
Definition debug.h:36
#define ERROR(fmt,...)
Definition dhcpclient.c:41
#define DEBUG(fmt,...)
Definition dhcpclient.c:39
#define fr_dlist_init(_head, _type, _field)
Initialise the head structure of a doubly linked list.
Definition dlist.h:260
static void * fr_dlist_head(fr_dlist_head_t const *list_head)
Return the HEAD item of a list or NULL if the list is empty.
Definition dlist.h:486
static void * fr_dlist_remove(fr_dlist_head_t *list_head, void *ptr)
Remove an item from the list.
Definition dlist.h:638
static unsigned int fr_dlist_num_elements(fr_dlist_head_t const *head)
Return the number of elements in the dlist.
Definition dlist.h:939
static int fr_dlist_insert_head(fr_dlist_head_t *list_head, void *ptr)
Insert an item into the head of a list.
Definition dlist.h:338
static void * fr_dlist_next(fr_dlist_head_t const *list_head, void const *ptr)
Get the next item in a list.
Definition dlist.h:555
Head of a doubly linked list.
Definition dlist.h:51
Entry in a doubly linked list.
Definition dlist.h:41
fr_cmd_table_t cmd_network_table[]
Definition network.c:2099
int fr_network_listen_add(fr_network_t *nr, fr_listen_t *li)
Add a fr_listen_t to a network.
Definition network.c:236
int fr_network_worker_add(fr_network_t *nr, fr_worker_t *worker)
Add a worker to a network in a different thread.
Definition network.c:293
int fr_network_destroy(fr_network_t *nr)
Stop a network thread in an orderly way.
Definition network.c:1687
int fr_network_directory_add(fr_network_t *nr, fr_listen_t *li)
Add a "watch directory" call to a network.
Definition network.c:278
void fr_network(fr_network_t *nr)
The main network worker function.
Definition network.c:1803
void fr_network_worker_add_self(fr_network_t *nr, fr_worker_t *worker)
Add a worker to a network in the same thread.
Definition network.c:313
int fr_network_exit(fr_network_t *nr)
Signal a network thread to exit.
Definition network.c:1858
void fr_network_stats_log(fr_network_t const *nr, fr_log_t const *log)
Definition network.c:2032
fr_network_t * fr_network_create(TALLOC_CTX *ctx, fr_event_list_t *el, char const *name, fr_log_t const *logger, fr_log_lvl_t lvl, fr_network_config_t const *config)
Create a network.
Definition network.c:1891
#define PERROR(_fmt,...)
Definition log.h:228
#define DEBUG3(_fmt,...)
Definition log.h:266
talloc_free(reap)
fr_event_list_t * fr_event_list_alloc(TALLOC_CTX *ctx, fr_event_status_cb_t status, void *status_uctx)
Initialise a new event list.
Definition event.c:2526
int fr_event_pre_insert(fr_event_list_t *el, fr_event_status_cb_t callback, void *uctx)
Add a pre-event callback to the event list.
Definition event.c:1957
void fr_event_loop_exit(fr_event_list_t *el, int code)
Signal an event loop exit with the specified code.
Definition event.c:2375
int fr_event_post_insert(fr_event_list_t *el, fr_event_post_cb_t callback, void *uctx)
Add a post-event callback to the event list.
Definition event.c:2011
Stores all information relating to an event list.
Definition event.c:380
fr_log_lvl_t
Definition log.h:67
static const conf_parser_t config[]
Definition base.c:183
static bool done
Definition radclient.c:80
#define DEBUG2(fmt,...)
Definition radclient.h:43
#define INFO(fmt,...)
Definition radict.c:54
CONF_SECTION * cs
thread pool configuration section
Definition schedule.c:128
TALLOC_CTX * ctx
our allocation ctx
Definition schedule.c:106
fr_timer_t * ev
timer for stats_interval
Definition schedule.c:118
sem_t worker_sem
for inter-thread signaling
Definition schedule.c:138
fr_schedule_child_status_t status
status of the worker
Definition schedule.c:115
static _Thread_local int worker_id
Internal ID of the current worker thread.
Definition schedule.c:151
fr_event_list_t * el
event list for single-threaded mode.
Definition schedule.c:129
fr_schedule_t * sc
the scheduler we are running under
Definition schedule.c:113
fr_worker_t * single_worker
for single-threaded mode
Definition schedule.c:148
fr_log_lvl_t lvl
log level
Definition schedule.c:132
static void stats_timer(fr_timer_list_t *tl, fr_time_t now, void *uctx)
Definition schedule.c:304
fr_network_t * fr_schedule_directory_add(fr_schedule_t *sc, fr_listen_t *li)
Add a directory NOTE_EXTEND to a scheduler.
Definition schedule.c:924
#define SEM_WAIT_INTR(_x)
Definition schedule.c:65
fr_schedule_config_t * config
configuration
Definition schedule.c:134
fr_network_t * single_network
for single-threaded mode
Definition schedule.c:147
fr_schedule_thread_instantiate_t worker_thread_instantiate
thread instantiation callback
Definition schedule.c:141
fr_schedule_child_status_t
Track the child thread status.
Definition schedule.c:70
@ FR_CHILD_FAIL
failed, and in the exited queue
Definition schedule.c:75
@ FR_CHILD_FREE
child is free
Definition schedule.c:71
@ FR_CHILD_RUNNING
running, and in the running queue
Definition schedule.c:73
@ FR_CHILD_EXITED
exited, and in the exited queue
Definition schedule.c:74
@ FR_CHILD_INITIALIZING
initialized, but not running
Definition schedule.c:72
fr_network_t * fr_schedule_listen_add(fr_schedule_t *sc, fr_listen_t *li)
Add a fr_listen_t to a scheduler.
Definition schedule.c:892
fr_network_t * nr
the receive data structure
Definition schedule.c:116
fr_schedule_thread_detach_t worker_thread_detach
Definition schedule.c:142
bool running
is the scheduler running?
Definition schedule.c:126
int fr_schedule_worker_id(void)
Return the worker id for the current thread.
Definition schedule.c:157
static void * fr_schedule_worker_thread(void *arg)
Entry point for worker threads.
Definition schedule.c:167
int fr_schedule_pthread_create(pthread_t *thread, void *(*func)(void *), void *arg)
Creates a new thread using our standard set of options.
Definition schedule.c:428
fr_schedule_t * fr_schedule_create(TALLOC_CTX *ctx, fr_event_list_t *el, fr_log_t *logger, fr_log_lvl_t lvl, fr_schedule_thread_instantiate_t worker_thread_instantiate, fr_schedule_thread_detach_t worker_thread_detach, fr_schedule_config_t *config)
Create a scheduler and spawn the child threads.
Definition schedule.c:466
unsigned int num_workers_exited
number of exited workers
Definition schedule.c:136
sem_t network_sem
for inter-thread signaling
Definition schedule.c:139
int fr_schedule_destroy(fr_schedule_t **sc_to_free)
Destroy a scheduler, and tell its child threads to exit.
Definition schedule.c:768
unsigned int id
a unique ID
Definition schedule.c:109
fr_dlist_head_t networks
list of networks
Definition schedule.c:145
pthread_t pthread_id
the thread of this network
Definition schedule.c:107
fr_log_t * log
log destination
Definition schedule.c:131
fr_dlist_head_t workers
list of workers
Definition schedule.c:144
static void * fr_schedule_network_thread(void *arg)
Initialize and run the network thread.
Definition schedule.c:318
fr_dlist_t entry
our entry into the linked list of networks
Definition schedule.c:111
#define SEMAPHORE_LOCKED
Definition schedule.c:46
Scheduler specific information for network threads.
Definition schedule.c:105
The scheduler.
Definition schedule.c:125
int(* fr_schedule_thread_instantiate_t)(TALLOC_CTX *ctx, fr_event_list_t *el, void *uctx)
Setup a new thread.
Definition schedule.h:55
void(* fr_schedule_thread_detach_t)(void *uctx)
Explicitly free resources allocated by fr_schedule_thread_instantiate_t.
Definition schedule.h:61
fr_time_delta_t stats_interval
print channel statistics
Definition schedule.h:70
static const uchar sc[16]
Definition smbdes.c:115
PUBLIC int snprintf(char *string, size_t length, char *format, va_alist)
Definition snprintf.c:689
Definition log.h:96
char const * fr_syserror(int num)
Guaranteed to be thread-safe version of strerror.
Definition syserror.c:243
#define fr_time_delta_ispos(_a)
Definition time.h:290
#define fr_time_add(_a, _b)
Add a time/time delta together.
Definition time.h:196
"server local" time.
Definition time.h:69
An event timer list.
Definition timer.c:53
A timer event.
Definition timer.c:79
#define fr_timer_in(...)
Definition timer.h:86
#define fr_timer_at(...)
Definition timer.h:80
static fr_event_list_t * el
#define fr_strerror_printf(_fmt,...)
Log to thread local error buffer.
Definition strerror.h:64
#define fr_strerror_const(_msg)
Definition strerror.h:223
int fr_worker_pre_event(UNUSED fr_time_t now, UNUSED fr_time_delta_t wake, void *uctx)
Pre-event handler.
Definition worker.c:1551
fr_worker_t * fr_worker_create(TALLOC_CTX *ctx, fr_event_list_t *el, char const *name, fr_log_t const *logger, fr_log_lvl_t lvl, fr_worker_config_t *config)
Create a worker.
Definition worker.c:1356
fr_cmd_table_t cmd_worker_table[]
Definition worker.c:1738
void fr_worker_destroy(fr_worker_t *worker)
Destroy a worker.
Definition worker.c:1012
void fr_worker_post_event(UNUSED fr_event_list_t *el, UNUSED fr_time_t now, void *uctx)
Post-event handler.
Definition worker.c:1572
void fr_worker(fr_worker_t *worker)
The main loop and entry point of the stand-alone worker thread.
Definition worker.c:1493
A worker which takes packets from a master, and processes them.
Definition worker.c:94
unsigned int id
a unique ID
Definition schedule.c:88
int uses
how many network threads are using it
Definition schedule.c:89
pthread_t pthread_id
the thread of this worker
Definition schedule.c:86
fr_schedule_t * sc
the scheduler we are running under
Definition schedule.c:94
TALLOC_CTX * ctx
our allocation ctx
Definition schedule.c:84
fr_event_list_t * el
our event list
Definition schedule.c:85
fr_time_t cpu_time
how much CPU time this worker has used
Definition schedule.c:90
fr_dlist_t entry
our entry into the linked list of workers
Definition schedule.c:92
fr_schedule_child_status_t status
status of the worker
Definition schedule.c:96
fr_worker_t * worker
the worker data structure
Definition schedule.c:97
Scheduler specific information for worker threads.
Definition schedule.c:83