2 * Copyright (c) 1995, the EUROPAGATE consortium (see below).
4 * The EUROPAGATE consortium members are:
6 * University College Dublin
7 * Danmarks Teknologiske Videnscenter
8 * An Chomhairle Leabharlanna
9 * Consejo Superior de Investigaciones Cientificas
11 * Permission to use, copy, modify, distribute, and sell this software and
12 * its documentation, in whole or in part, for any purpose, is hereby granted,
15 * 1. This copyright and permission notice appear in all copies of the
16 * software and its documentation. Notices of copyright or attribution
17 * which appear at the beginning of any file must remain unchanged.
19 * 2. The names of EUROPAGATE or the project partners may not be used to
20 * endorse or promote products derived from this software without specific
21 * prior written permission.
23 * 3. Users of this software (implementors and gateway operators) agree to
24 * inform the EUROPAGATE consortium of their use of the software. This
25 * information will be used to evaluate the EUROPAGATE project and the
26 * software, and to plan further developments. The consortium may use
27 * the information in later publications.
29 * 4. Users of this software agree to make their best efforts, when
30 * documenting their use of the software, to acknowledge the EUROPAGATE
31 * consortium, and the role played by the software in their work.
33 * THIS SOFTWARE IS PROVIDED "AS IS" AND WITHOUT WARRANTY OF ANY KIND,
34 * EXPRESS, IMPLIED, OR OTHERWISE, INCLUDING WITHOUT LIMITATION, ANY
35 * WARRANTY OF MERCHANTABILITY OR FITNESS FOR A PARTICULAR PURPOSE.
36 * IN NO EVENT SHALL THE EUROPAGATE CONSORTIUM OR ITS MEMBERS BE LIABLE
37 * FOR ANY SPECIAL, INCIDENTAL, INDIRECT OR CONSEQUENTIAL DAMAGES OF
38 * ANY KIND, OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA
39 * OR PROFITS, WHETHER OR NOT ADVISED OF THE POSSIBILITY OF DAMAGE, AND
40 * ON ANY THEORY OF LIABILITY, ARISING OUT OF OR IN CONNECTION WITH THE
41 * USE OR PERFORMANCE OF THIS SOFTWARE.
44 /* Gateway Resource Monitor
48 * Revision 1.14 1995/05/23 08:12:59 adam
51 * Revision 1.13 1995/05/22 11:42:48 adam
52 * Minor changes on dtbsun.
54 * Revision 1.12 1995/05/19 14:51:06 adam
55 * Bug fix: stopped kernels sometimes got IPC messages from the monitor.
57 * Revision 1.11 1995/05/19 13:26:00 adam
58 * Bug fixes. Better command line options.
60 * Revision 1.10 1995/05/18 12:03:09 adam
61 * Bug fixes and minor improvements.
63 * Revision 1.9 1995/05/17 10:51:32 adam
64 * Added a few more error checks to the show command.
66 * Revision 1.8 1995/05/16 09:40:42 adam
67 * LICENSE. Setting of CCL token names (and/or/not/set) in read_kernel_res.
69 * Revision 1.7 1995/05/03 12:18:46 adam
70 * This code ran on dtbsun. Minor changes.
72 * Revision 1.6 1995/05/03 09:16:17 adam
75 * Revision 1.5 1995/05/03 07:37:42 adam
76 * CCL commands stop/continue implemented. New functions gw_res_{int,bool}
77 * are used when possible.
79 * Revision 1.4 1995/05/02 15:26:00 adam
80 * Monitor observes death of child (email kernel). The number
81 * of simultaneous processes is controlled now. Email requests are
82 * queued if necessary. This scheme should only be forced if no kernels
85 * Revision 1.3 1995/05/02 07:20:10 adam
86 * Use pid of exited child to close fifos.
88 * Revision 1.2 1995/05/01 16:26:57 adam
89 * More work on resource monitor.
91 * Revision 1.1 1995/05/01 12:43:36 adam
92 * First work on resource monitor program.
107 #include <sys/file.h>
108 #include <sys/stat.h>
109 #include <sys/types.h>
110 #include <sys/time.h>
111 #include <sys/wait.h>
116 #include <strqueue.h>
/* Size constant; its users are not visible in this listing (presumably the line buffers - TODO confirm). */
119 #define LINE_MAX 1024
/* Names of the monitor's own FIFO pair; monitor_events opens them and unlinks both next to its SIGTERM/SIGINT exit messages. */
121 #define MONITOR_FIFO_S "fifo.s.m"
122 #define MONITOR_FIFO_C "fifo.c.m"
/* Module tag handed to gw_log as its second argument throughout this file. */
124 static char *module = "monitor";
/* longjmp target used by pipe_handle and deliver; the matching setjmp is not visible in this listing. */
125 static jmp_buf retry_jmp;
/* Resource handle; closed and rebuilt by reread_resources. */
127 static GwRes monitor_res = NULL;
/* monitor_events passes (no_process >= max_process) to deliver as dont_exec and logs the pair as "Cur/Max processes". */
128 static int no_process = 0;
/* Refreshed from the "gw.max.process" resource in reread_resources. */
129 static int max_process = 1;
/* Signal flags; presumably set by catch_hup / catch_term / catch_int and polled in monitor_events - the assignments are not visible here. */
130 static int got_sighup = 0;
131 static int got_term = 0;
132 static int got_int = 0;
/* Resource file merged by reread_resources; main overwrites it with a command-line argument. */
133 const char *default_res = "default.res";
136 * reread_resources: reread monitor resources. The static variable,
137 * max_process, is updated.
/*
 * Throw away the current resource set, build a new one from default_res
 * and refresh max_process from it.
 */
139 static void reread_resources (void)
/* close the old handle before a fresh one is created */
142 gw_res_close (monitor_res);
143 monitor_res = gw_res_init ();
/* a non-zero result from gw_res_merge is reported as a warning */
144 if (gw_res_merge (monitor_res, default_res))
146 gw_log (GW_LOG_WARN, module, "Couldn't read resource file %s",
/* 10 is the third argument to gw_res_int; presumably the value used when the resource is absent - TODO confirm */
150 max_process = gw_res_int (monitor_res, "gw.max.process", 10);
/*
 * Bookkeeping record for one email kernel.  Records are chained through
 * `next`; ke_info_add looks them up by `id`.
 */
154 int id; /* email user-id */
/* monitor_events skips delivery to entries whose stop flag is set */
155 int stopped; /* stop flag */
/* compared against -1 in monitor_events; -1 marks an exited child according to the catch_child header comment */
156 pid_t pid; /* pid of email kernel child */
157 GIP gip; /* fifo information */
/* NULL when nothing is pending; ke_info_add initialises it to NULL */
158 struct str_queue *queue; /* message queue */
159 struct ke_info *next; /* link to next */
162 /* list of email kernel infos */
/* head pointer; NULL while the list is empty */
163 static struct ke_info *ke_info_list = NULL;
166 * ke_info_add: add/lookup of email kernel info.
167 * id: email user-id to search for.
168 * return: pointer to info structure.
/*
 * Look up the record for `id` in ke_info_list; a new record is allocated
 * when the search runs off the end of the list.
 */
170 struct ke_info *ke_info_add (int id)
/* kip addresses a link (the head pointer or some node's next field), not a node */
172 struct ke_info **kip;
/* when the loop ends without a match, kip addresses the terminating NULL link */
174 for (kip = &ke_info_list; *kip; kip= &(*kip)->next)
175 if ((*kip)->id == id)
/* storing through kip appends the new node at the tail of the list */
/* NOTE(review): no check of the malloc result is visible in this listing - confirm one exists before the dereference below */
177 *kip = malloc (sizeof(**kip));
/* a fresh record starts without a pending message queue */
182 (*kip)->queue = NULL;
/*
 * Unlink an entry from the front of ke_info_list and drop its message
 * queue.  The assignment of `ki` is not visible in this listing; presumably
 * it is the list head - TODO confirm.
 */
187 static void ke_info_del (void)
/* the list must not be empty */
191 assert (ke_info_list);
193 str_queue_rm (&ki->queue);
/* the list now starts at the entry that followed ki */
194 ke_info_list = ki->next;
199 * catch_child: catch SIGCHLD. Set email kernel pid to -1
200 * to indicate that child has exited
/*
 * SIGCHLD handler.  Children are reaped with waitpid (-1, 0, WNOHANG) for as
 * long as it returns a positive pid: the call never blocks and the exit
 * status is discarded (status pointer is 0).
 */
202 static void catch_child (int num)
207 while ((pid=waitpid (-1, 0, WNOHANG)) > 0)
/* scan the kernel list for each reaped pid; the matching test itself is not visible in this listing */
209 for (ki = ke_info_list; ki; ki = ki->next)
/* install this handler again for the next SIGCHLD */
214 signal (SIGCHLD, catch_child);
218 * catch_hup: catch SIGHUP.
/*
 * SIGHUP handler.  Only the re-installation of the handler is visible in
 * this listing; the statement that records the signal (presumably setting
 * got_sighup) is not shown - TODO confirm.
 */
220 static void catch_hup (int num)
/* install this handler again for the next SIGHUP */
223 signal (SIGHUP, catch_hup);
227 * catch_term: catch SIGTERM.
/*
 * SIGTERM handler.  Only the re-installation of the handler is visible in
 * this listing; the statement that records the signal (presumably setting
 * got_term) is not shown - TODO confirm.
 */
229 static void catch_term (int num)
/* install this handler again for the next SIGTERM */
232 signal (SIGTERM, catch_term);
236 * catch_int: catch SIGINT.
/*
 * SIGINT handler.  Only the re-installation of the handler is visible in
 * this listing; the statement that records the signal (presumably setting
 * got_int) is not shown - TODO confirm.
 */
238 static void catch_int (int num)
/* install this handler again for the next SIGINT */
241 signal (SIGINT, catch_int);
245 * pipe_handle: handle SIGPIPE when transferring message to kernel
/*
 * SIGPIPE handler installed by deliver for the duration of a transfer.
 * The signal number argument is unused.
 */
247 static void pipe_handle (int dummy)
/* leave the handler non-locally: the setjmp that filled retry_jmp returns 1 */
249 longjmp (retry_jmp, 1);
253 * start_kernel: start email kernel.
254 * argc: argc of email kernel
255 * argv: argv of email kernel
257 * return: pid of email kernel child
/*
 * Build an argument vector for the email kernel and exec the program
 * "kernel".  The fork call and the return statements are not visible in
 * this listing; only the statements shown are described below.
 */
259 static pid_t start_kernel (int argc, char **argv, int id)
/* holds the "-i<id>" option text; argv_p refers to this local buffer */
264 char userid_option[20];
/* room for argc + 2 pointers: slot 0, the copied arguments, the user-id option and (presumably) a terminating NULL */
266 argv_p = malloc (sizeof(*argv_p)*(argc+2));
269 gw_log (GW_LOG_FATAL|GW_LOG_ERRNO, module, "malloc fail");
/* slot 0 is always the literal program name; the loop below starts at index 1 */
272 argv_p[0] = "kernel";
273 for (i = 1; i<argc; i++)
/* add the user-id option after the arguments handled by the loop */
275 sprintf (userid_option, "-i%d", id);
276 argv_p[i++] = userid_option;
279 gw_log (GW_LOG_DEBUG, module, "Starting kernel");
283 gw_log (GW_LOG_FATAL|GW_LOG_ERRNO, module, "fork");
/* execv takes the path as given ("kernel"); it does not search PATH */
288 execv ("kernel", argv_p);
/* reached only when execv returned, i.e. the exec failed */
/* NOTE(review): the log text says "execvp" although the call above is execv */
289 gw_log (GW_LOG_FATAL|GW_LOG_ERRNO, module, "execvp");
296 * deliver: deliver message to child (email kernel).
297 * argc: exec argc to child (if it needs to be started)
298 * argv: exec argv to child (if it needs to be started)
300 * queue: message queue to be transferred
301 * gip: pointer to FIFO info. If *gip is NULL prior to invocation
302 * it will be created (initialized) and the pointer will be
304 * pidp: pointer to pid. Will hold process-id of child (if it needs to
306 * dont_exec: if non-zero a child will never be started; otherwise child
307 * will be started if not already running.
308 * return: 0 if message couldn't be transferred, i.e. dont_exec is non-zero
309 * and the child is not already running.
310 * 1 if message was transferred and the child was already running.
311 * 2 if message was transferred and the child was started and
312 * dont_exec was zero.
313 * 3 serious error. Permission denied or kernel couldn't be
/*
 * Hand the queued message for user `id` to that user's email kernel over
 * the FIFO pair "fifo.s.<id>" / "fifo.c.<id>".  Parts of the body are not
 * visible in this listing; the comments describe the visible statements.
 */
316 static int deliver (int argc, char **argv, int id, struct str_queue *queue,
317 GIP *gip, pid_t *pidp, int dont_exec)
322 char fifo_server_name[128];
323 char fifo_client_name[128];
/* the per-user FIFO names are derived from the numeric id */
327 sprintf (fifo_server_name, "fifo.s.%d", id);
328 sprintf (fifo_client_name, "fifo.c.%d", id);
332 *gip = gipc_initialize (fifo_client_name);
/* keep the previous SIGPIPE disposition in oldsig; it is put back with signal (SIGPIPE, oldsig) further down */
334 oldsig = signal (SIGPIPE, pipe_handle);
338 { /* assume child is running */
339 gipc_close (*gip); /* shut down existing FIFOs */
340 r = gipc_open (*gip, fifo_server_name, 0); /* try re-open ... */
343 { /* assume child is NOT running */
347 { /* we aren't allowed to start */
348 signal (SIGPIPE, oldsig);
/* create the server FIFO before the child is started; the result of mknod is not examined */
351 mknod (fifo_server_name, S_IFIFO|0666, 0);
352 pid = start_kernel (argc, argv, id);
353 if (pidp) /* set pid of child */
/* same call as the re-open above, but with 1 as the last argument */
355 r = gipc_open (*gip, fifo_server_name, 1);
358 { /* message couldn't be transferred */
359 signal (SIGPIPE, oldsig);
360 gw_log (GW_LOG_WARN, module, "Cannot start kernel");
363 if (r < 0) /* gipc_open fail? */
366 gw_log (GW_LOG_DEBUG|GW_LOG_ERRNO, module, "r==-2");
368 gw_log (GW_LOG_DEBUG|GW_LOG_ERRNO, module, "r==-1");
370 gw_log (GW_LOG_WARN|GW_LOG_ERRNO, module, "gipc_open");
/* jump back to the setjmp point (not visible here), the same target pipe_handle uses */
371 longjmp (retry_jmp, 1); /* yet another pass */
/* messages are read by index and stay in the queue; monitor_events calls str_queue_rm after a result of 1 or 2 */
373 index = 0; /* transfer. may be interrupted */
374 while ((msg = str_queue_get (queue, index++)))
376 gw_log (GW_LOG_DEBUG, module, "deliver: %s", msg);
377 gip_wline (*gip, msg);
379 signal (SIGPIPE, oldsig);
/* the assignments to pass are not visible in this listing; the header comment lists 1 and 2 as the transfer results - TODO confirm */
380 return pass; /* successful transfer */
384 * monitor_events: Event loop of monitor
385 * argc: argc of monitor (used in exec of Email kernel children)
386 * argv: argv of monitor (used in exec of Email kernel children)
/*
 * Event loop of the monitor: set up the monitor's own FIFO pair, then
 * repeatedly push pending queues to email kernels, wait in select for
 * input and queue incoming "eti" requests.  The loop construct and several
 * conditions are not visible in this listing; the comments describe the
 * visible statements.
 */
388 static void monitor_events (int argc, char **argv)
391 int r, gip_m_fd, too_many;
394 char command[128], *cp;
/* create the client FIFO; the result of mknod is not examined */
396 mknod (MONITOR_FIFO_C, S_IFIFO|0666, 0);
/* NOTE(review): the descriptor returned by this open is discarded - presumably it only keeps an end of the FIFO open; confirm */
397 open (MONITOR_FIFO_C, O_RDONLY|O_NONBLOCK);
398 gip_m = gips_initialize (MONITOR_FIFO_S);
399 r = gips_open (gip_m, MONITOR_FIFO_C, 0);
/* descriptor the monitor reads its commands from; it is placed in the select set below */
400 gip_m_fd = gip_infileno (gip_m);
/* NOTE(review): the descriptor returned by this open is discarded as well - confirm intent */
402 open (MONITOR_FIFO_S, O_WRONLY);
404 gw_log (GW_LOG_DEBUG, module, "Starting event loop");
414 gw_log (GW_LOG_STAT, module, "Got SIGHUP. Reading resources");
/* both exit paths remove the monitor FIFOs from the file system */
420 gw_log (GW_LOG_STAT, module, "Got SIGTERM. Exiting...");
421 unlink (MONITOR_FIFO_S);
422 unlink (MONITOR_FIFO_C);
427 gw_log (GW_LOG_STAT, module, "Got SIGINT. Exiting...");
428 unlink (MONITOR_FIFO_S);
429 unlink (MONITOR_FIFO_C);
432 /* deliver any unsent messages to Email kernels */
434 for (ki = ke_info_list; ki; ki = ki->next)
/* entries with nothing queued, or with the stop flag set, are tested for here */
436 if (!ki->queue || ki->stopped)
438 gw_log (GW_LOG_DEBUG, module, "Transfer mail to %d", ki->id);
/* dont_exec is non-zero once the process limit has been reached */
439 r = deliver (argc, argv, ki->id, ki->queue, &ki->gip, &ki->pid,
440 no_process >= max_process);
441 if (r == 2) /* new child was spawned? */
444 gw_log (GW_LOG_DEBUG, module, "Start of %d", ki->id);
/* the queue is released only after deliver reported a transfer */
446 if (r == 1 || r == 2) /* transfer at all? */
447 str_queue_rm (&ki->queue);
448 if (r == 0) /* too many pending? */
453 gw_log (GW_LOG_DEBUG, module, "%d too many pending",
/* look for kernels that have no pending queue, have a pid other than -1 and are not stopped */
455 for (ki = ke_info_list; ki; ki = ki->next)
457 if (!ki->queue && ki->pid != -1 && !ki->stopped)
459 if (!(ki->queue = str_queue_mk ()))
461 gw_log (GW_LOG_FATAL|GW_LOG_ERRNO, module,
/* the stop request is the line "stop\n" followed by a "\001" entry */
465 str_queue_enq (ki->queue, "stop\n");
466 str_queue_enq (ki->queue, "\001");
467 r = deliver (argc, argv, ki->id, ki->queue, &ki->gip,
470 gw_log (GW_LOG_DEBUG, module,
471 "Stop not sent: %d", r);
472 str_queue_rm (&ki->queue);
/* the monitor's own FIFO is placed in the read set */
479 FD_SET (gip_m_fd, &set_r);
480 gw_log (GW_LOG_DEBUG, module, "set gip_m_fd %d", gip_m_fd);
483 for (ki = ke_info_list; ki; ki = ki->next)
489 { /* child has exited */
490 gw_log (GW_LOG_DEBUG, module, "Close of %d", ki->id);
/* release the FIFO state of the exited kernel */
491 gipc_close (ki->gip);
492 gipc_destroy (ki->gip);
496 else if ((fd = gip_infileno (ki->gip)) != -1)
497 { /* read select on child FIFO */
498 gw_log (GW_LOG_DEBUG, module, "set fd %d", fd);
505 gw_log (GW_LOG_DEBUG, module, "Cur/Max processes %d/%d",
506 no_process, max_process);
507 gw_log (GW_LOG_DEBUG, module, "IPC select");
/* read set only, NULL timeout: blocks until a descriptor is readable or a signal interrupts the call */
508 r = select (fd_max+1, &set_r, NULL, NULL, NULL);
512 { /* select aborted. And it was not due to interrupt */
513 gw_log (GW_LOG_FATAL|GW_LOG_ERRNO, module, "select");
516 /* select was interrupted. Probably child has died */
517 gw_log (GW_LOG_DEBUG|GW_LOG_ERRNO, module, "select");
519 /* go through list of Email kernels. See if any message has arrived */
520 gw_log (GW_LOG_DEBUG, module, "Testing ke_info_list");
521 for (ki = ke_info_list; ki; ki = ki->next)
/* only entries that have FIFO state and a valid input descriptor are tested */
524 if (ki->gip && (fd = gip_infileno (ki->gip)) != -1)
526 gw_log (GW_LOG_DEBUG, module, "Test of %d", fd);
527 if (FD_ISSET (fd, &set_r))
/* a line read from a kernel is logged by the visible code */
529 if (lgets (line_buf, sizeof(line_buf)-1, fd))
531 gw_log (GW_LOG_DEBUG, module, "IPC: %s", line_buf);
/* presumably the branch taken when lgets read nothing - TODO confirm */
535 gw_log (GW_LOG_DEBUG, module, "Close of %d", ki->id);
536 gipc_close (ki->gip);
537 gipc_destroy (ki->gip);
544 /* see if any message from eti has arrived */
545 gw_log (GW_LOG_DEBUG, module, "Testing gip_m_fd %d", gip_m_fd);
546 if (FD_ISSET (gip_m_fd, &set_r))
548 gw_log (GW_LOG_DEBUG, module, "Reading from %d", gip_m_fd);
/* a false result from lgets on the monitor FIFO is logged as fatal */
549 if (!(lgets (command, sizeof(command)-1, gip_m_fd)))
551 gw_log (GW_LOG_FATAL, module, "Unexpected close");
554 gw_log (GW_LOG_DEBUG, module, "Done");
/* locate the newline in the command; presumably it is cut off there - the statement is not visible */
555 if ((cp = strchr (command, '\n')))
557 gw_log (GW_LOG_DEBUG, module, "IPC: %s", command);
/* a command starting with "eti " carries the user-id as a decimal number from offset 4 */
558 if (!memcmp (command, "eti ", 4))
560 int id = atoi (command+4);
561 struct ke_info *new_k;
563 new_k = ke_info_add (id);
564 gw_log (GW_LOG_DEBUG, module, "Incoming mail %d", id);
568 if (!(new_k->queue = str_queue_mk ()))
570 gw_log (GW_LOG_FATAL|GW_LOG_ERRNO, module,
/* queued request: "mail\n", then every line lgets reads from the monitor FIFO, then a "\001" entry */
575 str_queue_enq (new_k->queue, "mail\n");
576 while (lgets (line_buf, sizeof(line_buf)-1, gip_m_fd))
577 str_queue_enq (new_k->queue, line_buf);
578 str_queue_enq (new_k->queue, "\001");
585 * main: main of monitor
/*
 * Program entry: parse the monitor's command line, install the signal
 * handlers and enter monitor_events.  The case labels of the option switch
 * are not visible in this listing; the help text below names the options.
 */
587 int main (int argc, char **argv)
/* pre-increment: scanning starts at the argument after the current argno */
592 while (++argno < argc)
594 if (argv[argno][0] == '-')
/* "--" is tested before the single-letter options; per the help text it precedes the kernel options */
596 if (argv[argno][1] == '-')
598 switch (argv[argno][1])
602 fprintf (stderr, "monitor [options] [resourceFile]"
603 " -- [kernelOptions]\n");
604 fprintf (stderr, "If no resource file is specified");
605 fprintf (stderr, " default.res is used\n");
606 fprintf (stderr, "Options:\n");
607 fprintf (stderr, " -l log Set Log file\n");
608 fprintf (stderr, " -d Enable debugging log\n");
609 fprintf (stderr, " -D Enable more debugging log\n");
610 fprintf (stderr, " -- Precedes kernel options\n");
611 fprintf (stderr, "Kernel options are transferred to kernel\n");
/* the log file name is taken either from the rest of the option itself or from the next argument */
615 gw_log_file (GW_LOG_ALL, argv[argno]+2);
616 else if (++argno < argc)
617 gw_log_file (GW_LOG_ALL, argv[argno]);
620 fprintf (stderr, "%s: missing log filename\n", *argv);
/* everything except the RES_DEBUG bit; presumably the -d case - TODO confirm */
625 gw_log_level (GW_LOG_ALL & ~RES_DEBUG);
/* every log level; presumably the -D case - TODO confirm */
628 gw_log_level (GW_LOG_ALL);
631 fprintf (stderr, "%s: unknown option `%s'; use -H for help\n",
/* this argument replaces the default resource file name */
637 default_res = argv[argno];
640 signal (SIGCHLD, catch_child);
641 signal (SIGHUP, catch_hup);
642 signal (SIGTERM, catch_term);
643 signal (SIGINT, catch_int);
/* the event loop receives the arguments from argv[argno] onwards; start_kernel overwrites slot 0 with "kernel" and copies from index 1 */
644 monitor_events (argc-argno, argv+argno);