chiark / gitweb /
c9ee21a29cee0e81c0ab351468a7d9dfea752009
[elogind.git] / udev / udevd.c
1 /*
2  * Copyright (C) 2004-2006 Kay Sievers <kay.sievers@vrfy.org>
3  * Copyright (C) 2004 Chris Friesen <chris_friesen@sympatico.ca>
4  *
5  *      This program is free software; you can redistribute it and/or modify it
6  *      under the terms of the GNU General Public License as published by the
7  *      Free Software Foundation version 2 of the License.
8  *
9  *      This program is distributed in the hope that it will be useful, but
10  *      WITHOUT ANY WARRANTY; without even the implied warranty of
11  *      MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
12  *      General Public License for more details.
13  *
14  *      You should have received a copy of the GNU General Public License along
15  *      with this program; if not, write to the Free Software Foundation, Inc.,
16  *      51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA.
17  *
18  */
19
20 #include "config.h"
21
22 #include <stddef.h>
23 #include <signal.h>
24 #include <unistd.h>
25 #include <errno.h>
26 #include <stdio.h>
27 #include <stdlib.h>
28 #include <string.h>
29 #include <ctype.h>
30 #include <dirent.h>
31 #include <fcntl.h>
32 #include <syslog.h>
33 #include <time.h>
34 #include <getopt.h>
35 #include <sys/select.h>
36 #include <sys/wait.h>
37 #include <sys/types.h>
38 #include <sys/socket.h>
39 #include <sys/un.h>
40 #include <sys/stat.h>
41 #include <sys/ioctl.h>
42 #include <linux/types.h>
43 #include <linux/netlink.h>
44 #ifdef HAVE_INOTIFY
45 #include <sys/inotify.h>
46 #endif
47
48 #include "udev.h"
49 #include "udev_rules.h"
50 #include "udevd.h"
51 #include "udev_selinux.h"
52
/* non-zero: log_fn() prints to stderr instead of using syslog */
static int debug;

/*
 * Logging callback.
 *
 * With debug set, the message is written to stderr, prefixed with the
 * pid of the calling process and the name of the reporting function.
 * Otherwise the message is forwarded to syslog with the given priority.
 * The udev, file and line arguments are not used here.
 */
static void log_fn(struct udev *udev, int priority,
                   const char *file, int line, const char *fn,
                   const char *format, va_list args)
{
        if (!debug) {
                vsyslog(priority, format, args);
                return;
        }

        fprintf(stderr, "[%d] %s: ", (int) getpid(), fn);
        vfprintf(stderr, format, args);
}
66
67 struct udevd_uevent_msg {
68         struct udev *udev;
69         struct list_head node;
70         pid_t pid;
71         int exitstatus;
72         time_t queue_time;
73         char *action;
74         char *devpath;
75         char *subsystem;
76         char *driver;
77         dev_t devt;
78         unsigned long long seqnum;
79         char *devpath_old;
80         char *physdevpath;
81         unsigned int timeout;
82         char *envp[UEVENT_NUM_ENVP+1];
83         char envbuf[];
84 };
85
86 static int debug_trace;
87 static struct udev_rules rules;
88 static int udevd_sock = -1;
89 static int uevent_netlink_sock = -1;
90 static int inotify_fd = -1;
91 static pid_t sid;
92
93 static int signal_pipe[2] = {-1, -1};
94 static volatile int sigchilds_waiting;
95 static volatile int udev_exit;
96 static volatile int reload_config;
97 static int run_exec_q;
98 static int stop_exec_q;
99 static int max_childs;
100 static int max_childs_running;
101 static char udev_log_env[32];
102
103 static LIST_HEAD(exec_list);
104 static LIST_HEAD(running_list);
105
106 static void asmlinkage udev_event_sig_handler(int signum)
107 {
108         if (signum == SIGALRM)
109                 exit(1);
110 }
111
112 static int udev_event_process(struct udevd_uevent_msg *msg)
113 {
114         struct sigaction act;
115         struct udevice *udevice;
116         int i;
117         int retval;
118
119         /* set signal handlers */
120         memset(&act, 0x00, sizeof(act));
121         act.sa_handler = (void (*)(int)) udev_event_sig_handler;
122         sigemptyset (&act.sa_mask);
123         act.sa_flags = 0;
124         sigaction(SIGALRM, &act, NULL);
125
126         /* reset to default */
127         act.sa_handler = SIG_DFL;
128         sigaction(SIGINT, &act, NULL);
129         sigaction(SIGTERM, &act, NULL);
130         sigaction(SIGCHLD, &act, NULL);
131         sigaction(SIGHUP, &act, NULL);
132
133         /* trigger timeout to prevent hanging processes */
134         alarm(UDEV_EVENT_TIMEOUT);
135
136         /* reconstruct event environment from message */
137         for (i = 0; msg->envp[i]; i++)
138                 putenv(msg->envp[i]);
139
140         udevice = udev_device_init(msg->udev);
141         if (udevice == NULL)
142                 return -1;
143         strlcpy(udevice->action, msg->action, sizeof(udevice->action));
144         sysfs_device_set_values(udevice->udev, udevice->dev, msg->devpath, msg->subsystem, msg->driver);
145         udevice->devpath_old = msg->devpath_old;
146         udevice->devt = msg->devt;
147
148         retval = udev_device_event(&rules, udevice);
149
150         /* rules may change/disable the timeout */
151         if (udevice->event_timeout >= 0)
152                 alarm(udevice->event_timeout);
153
154         /* run programs collected by RUN-key*/
155         if (retval == 0 && !udevice->ignore_device && udev_get_run(msg->udev))
156                 retval = udev_rules_run(udevice);
157
158         udev_device_cleanup(udevice);
159         return retval;
160 }
161
/* states an event can be exported as, see export_event_state() */
enum event_state {
        EVENT_QUEUED,           /* event was accepted and put into a queue */
        EVENT_FINISHED,         /* event is done and not marked as failed */
        EVENT_FAILED            /* event is done and marked as failed */
};
167
168 static void export_event_state(struct udevd_uevent_msg *msg, enum event_state state)
169 {
170         char filename[PATH_SIZE];
171         char filename_failed[PATH_SIZE];
172         size_t start;
173
174         /* location of queue file */
175         snprintf(filename, sizeof(filename), "%s/.udev/queue/%llu", udev_get_dev_path(msg->udev), msg->seqnum);
176
177         /* location of failed file */
178         strlcpy(filename_failed, udev_get_dev_path(msg->udev), sizeof(filename_failed));
179         strlcat(filename_failed, "/", sizeof(filename_failed));
180         start = strlcat(filename_failed, ".udev/failed/", sizeof(filename_failed));
181         strlcat(filename_failed, msg->devpath, sizeof(filename_failed));
182         path_encode(&filename_failed[start], sizeof(filename_failed) - start);
183
184         switch (state) {
185         case EVENT_QUEUED:
186                 unlink(filename_failed);
187                 delete_path(msg->udev, filename_failed);
188                 create_path(msg->udev, filename);
189                 selinux_setfscreatecon(msg->udev, filename, NULL, S_IFLNK);
190                 symlink(msg->devpath, filename);
191                 selinux_resetfscreatecon(msg->udev);
192                 break;
193         case EVENT_FINISHED:
194                 if (msg->devpath_old != NULL) {
195                         /* "move" event - rename failed file to current name, do not delete failed */
196                         char filename_failed_old[PATH_SIZE];
197
198                         strlcpy(filename_failed_old, udev_get_dev_path(msg->udev), sizeof(filename_failed_old));
199                         strlcat(filename_failed_old, "/", sizeof(filename_failed_old));
200                         start = strlcat(filename_failed_old, ".udev/failed/", sizeof(filename_failed_old));
201                         strlcat(filename_failed_old, msg->devpath_old, sizeof(filename_failed_old));
202                         path_encode(&filename_failed_old[start], sizeof(filename) - start);
203
204                         if (rename(filename_failed_old, filename_failed) == 0)
205                                 info(msg->udev, "renamed devpath, moved failed state of '%s' to %s'\n",
206                                      msg->devpath_old, msg->devpath);
207                 } else {
208                         unlink(filename_failed);
209                         delete_path(msg->udev, filename_failed);
210                 }
211
212                 unlink(filename);
213                 delete_path(msg->udev, filename);
214                 break;
215         case EVENT_FAILED:
216                 /* move failed event to the failed directory */
217                 create_path(msg->udev, filename_failed);
218                 rename(filename, filename_failed);
219
220                 /* clean up possibly empty queue directory */
221                 delete_path(msg->udev, filename);
222                 break;
223         }
224
225         return;
226 }
227
228 static void msg_queue_delete(struct udevd_uevent_msg *msg)
229 {
230         list_del(&msg->node);
231
232         /* mark as failed, if "add" event returns non-zero */
233         if (msg->exitstatus && strcmp(msg->action, "add") == 0)
234                 export_event_state(msg, EVENT_FAILED);
235         else
236                 export_event_state(msg, EVENT_FINISHED);
237
238         free(msg);
239 }
240
241 static void udev_event_run(struct udevd_uevent_msg *msg)
242 {
243         pid_t pid;
244         int retval;
245
246         pid = fork();
247         switch (pid) {
248         case 0:
249                 /* child */
250                 close(uevent_netlink_sock);
251                 close(udevd_sock);
252                 if (inotify_fd >= 0)
253                         close(inotify_fd);
254                 close(signal_pipe[READ_END]);
255                 close(signal_pipe[WRITE_END]);
256                 logging_close();
257                 logging_init("udevd-event");
258                 setpriority(PRIO_PROCESS, 0, UDEV_PRIORITY);
259
260                 retval = udev_event_process(msg);
261                 info(msg->udev, "seq %llu finished with %i\n", msg->seqnum, retval);
262
263                 logging_close();
264                 if (retval)
265                         exit(1);
266                 exit(0);
267         case -1:
268                 err(msg->udev, "fork of child failed: %s\n", strerror(errno));
269                 msg_queue_delete(msg);
270                 break;
271         default:
272                 /* get SIGCHLD in main loop */
273                 info(msg->udev, "seq %llu forked, pid [%d], '%s' '%s', %ld seconds old\n",
274                      msg->seqnum, pid,  msg->action, msg->subsystem, time(NULL) - msg->queue_time);
275                 msg->pid = pid;
276         }
277 }
278
279 static void msg_queue_insert(struct udevd_uevent_msg *msg)
280 {
281         char filename[PATH_SIZE];
282         int fd;
283
284         msg->queue_time = time(NULL);
285
286         export_event_state(msg, EVENT_QUEUED);
287         info(msg->udev, "seq %llu queued, '%s' '%s'\n", msg->seqnum, msg->action, msg->subsystem);
288
289         strlcpy(filename, udev_get_dev_path(msg->udev), sizeof(filename));
290         strlcat(filename, "/.udev/uevent_seqnum", sizeof(filename));
291         fd = open(filename, O_WRONLY|O_TRUNC|O_CREAT, 0644);
292         if (fd >= 0) {
293                 char str[32];
294                 int len;
295
296                 len = sprintf(str, "%llu\n", msg->seqnum);
297                 write(fd, str, len);
298                 close(fd);
299         }
300
301         /* run one event after the other in debug mode */
302         if (debug_trace) {
303                 list_add_tail(&msg->node, &running_list);
304                 udev_event_run(msg);
305                 waitpid(msg->pid, NULL, 0);
306                 msg_queue_delete(msg);
307                 return;
308         }
309
310         /* run all events with a timeout set immediately */
311         if (msg->timeout != 0) {
312                 list_add_tail(&msg->node, &running_list);
313                 udev_event_run(msg);
314                 return;
315         }
316
317         list_add_tail(&msg->node, &exec_list);
318         run_exec_q = 1;
319 }
320
/*
 * Return the "MemTotal" value of /proc/meminfo converted from kB to MB,
 * or -1 if the file cannot be opened or contains no such line.
 */
static int mem_size_mb(void)
{
        char line[4096];
        long int kb;
        long int mb = -1;
        FILE *meminfo;

        meminfo = fopen("/proc/meminfo", "r");
        if (meminfo == NULL)
                return -1;

        /* the first matching line wins */
        while (fgets(line, sizeof(line), meminfo) != NULL) {
                if (sscanf(line, "MemTotal: %ld kB", &kb) != 1)
                        continue;
                mb = kb / 1024;
                break;
        }

        fclose(meminfo);
        return mb;
}
343
/*
 * Count the per-cpu lines ("cpu" directly followed by a digit) in
 * /proc/stat. Returns -1 if the file cannot be opened or no such line
 * is found.
 */
static int cpu_count(void)
{
        FILE* f;
        char buf[4096];
        int count = 0;

        f = fopen("/proc/stat", "r");
        if (f == NULL)
                return -1;

        while (fgets(buf, sizeof(buf), f) != NULL) {
                /* <ctype.h> functions need a value representable as unsigned char */
                if (strncmp(buf, "cpu", 3) == 0 && isdigit((unsigned char) buf[3]))
                        count++;
        }

        fclose(f);
        if (count == 0)
                return -1;
        return count;
}
364
/*
 * Return the "procs_running" value of /proc/stat, or -1 if the file
 * cannot be opened or contains no such line.
 */
static int running_processes(void)
{
        FILE* f;
        char buf[4096];
        int running = -1;

        f = fopen("/proc/stat", "r");
        if (f == NULL)
                return -1;

        while (fgets(buf, sizeof(buf), f) != NULL) {
                /* %u requires a pointer to unsigned int */
                unsigned int value;

                if (sscanf(buf, "procs_running %u", &value) == 1) {
                        running = (int) value;
                        break;
                }
        }

        fclose(f);
        return running;
}
387
/*
 * Return the number of processes in state 'R' that belong to the given
 * session, as listed in /proc/<pid>/stat. With limit > 0 counting stops as
 * soon as limit is reached. Returns -1 if /proc cannot be opened.
 */
static int running_processes_in_session(pid_t session, int limit)
{
        DIR *dir;
        struct dirent *dent;
        int running = 0;

        dir = opendir("/proc");
        if (!dir)
                return -1;

        /* read process info from /proc */
        for (dent = readdir(dir); dent != NULL; dent = readdir(dir)) {
                int f;
                char procdir[64];
                char line[256];
                const char *paren;
                const char *pos;
                char state;
                int ppid, pgrp, sess;
                int len;

                if (!isdigit((unsigned char) dent->d_name[0]))
                        continue;

                snprintf(procdir, sizeof(procdir), "/proc/%s/stat", dent->d_name);

                f = open(procdir, O_RDONLY);
                if (f == -1)
                        continue;

                len = read(f, line, sizeof(line)-1);
                close(f);

                if (len <= 0)
                        continue;
                line[len] = '\0';

                /*
                 * skip ugly program name; check the search result before
                 * stepping over ") ", and make sure there is something
                 * behind the closing parenthesis
                 */
                paren = strrchr(line, ')');
                if (paren == NULL || paren[1] == '\0')
                        continue;
                pos = paren + 2;

                if (sscanf(pos, "%c %d %d %d ", &state, &ppid, &pgrp, &sess) != 4)
                        continue;

                /* count only processes in our session */
                if ((pid_t) sess != session)
                        continue;

                /* count only running, no sleeping processes */
                if (state != 'R')
                        continue;

                running++;
                if (limit > 0 && running >= limit)
                        break;
        }
        closedir(dir);

        return running;
}
451
452 static int compare_devpath(const char *running, const char *waiting)
453 {
454         int i;
455
456         for (i = 0; i < PATH_SIZE; i++) {
457                 /* identical device event found */
458                 if (running[i] == '\0' && waiting[i] == '\0')
459                         return 1;
460
461                 /* parent device event found */
462                 if (running[i] == '\0' && waiting[i] == '/')
463                         return 2;
464
465                 /* child device event found */
466                 if (running[i] == '/' && waiting[i] == '\0')
467                         return 3;
468
469                 /* no matching event */
470                 if (running[i] != waiting[i])
471                         break;
472         }
473
474         return 0;
475 }
476
477 /* lookup event for identical, parent, child, or physical device */
478 static int devpath_busy(struct udevd_uevent_msg *msg, int limit)
479 {
480         struct udevd_uevent_msg *loop_msg;
481         int childs_count = 0;
482
483         /* check exec-queue which may still contain delayed events we depend on */
484         list_for_each_entry(loop_msg, &exec_list, node) {
485                 /* skip ourself and all later events */
486                 if (loop_msg->seqnum >= msg->seqnum)
487                         break;
488
489                 /* check our old name */
490                 if (msg->devpath_old != NULL)
491                         if (strcmp(loop_msg->devpath , msg->devpath_old) == 0)
492                                 return 2;
493
494                 /* check identical, parent, or child device event */
495                 if (compare_devpath(loop_msg->devpath, msg->devpath) != 0) {
496                         dbg(msg->udev, "%llu, device event still pending %llu (%s)\n",
497                             msg->seqnum, loop_msg->seqnum, loop_msg->devpath);
498                         return 3;
499                 }
500
501                 /* check for our major:minor number */
502                 if (msg->devt && loop_msg->devt == msg->devt &&
503                     strcmp(msg->subsystem, loop_msg->subsystem) == 0) {
504                         dbg(msg->udev, "%llu, device event still pending %llu (%d:%d)\n", msg->seqnum,
505                             loop_msg->seqnum, major(loop_msg->devt), minor(loop_msg->devt));
506                         return 4;
507                 }
508
509                 /* check physical device event (special case of parent) */
510                 if (msg->physdevpath && msg->action && strcmp(msg->action, "add") == 0)
511                         if (compare_devpath(loop_msg->devpath, msg->physdevpath) != 0) {
512                                 dbg(msg->udev, "%llu, physical device event still pending %llu (%s)\n",
513                                     msg->seqnum, loop_msg->seqnum, loop_msg->devpath);
514                                 return 5;
515                         }
516         }
517
518         /* check run queue for still running events */
519         list_for_each_entry(loop_msg, &running_list, node) {
520                 if (limit && childs_count++ > limit) {
521                         dbg(msg->udev, "%llu, maximum number (%i) of childs reached\n", msg->seqnum, childs_count);
522                         return 1;
523                 }
524
525                 /* check our old name */
526                 if (msg->devpath_old != NULL)
527                         if (strcmp(loop_msg->devpath , msg->devpath_old) == 0)
528                                 return 2;
529
530                 /* check identical, parent, or child device event */
531                 if (compare_devpath(loop_msg->devpath, msg->devpath) != 0) {
532                         dbg(msg->udev, "%llu, device event still running %llu (%s)\n",
533                             msg->seqnum, loop_msg->seqnum, loop_msg->devpath);
534                         return 3;
535                 }
536
537                 /* check for our major:minor number */
538                 if (msg->devt && loop_msg->devt == msg->devt &&
539                     strcmp(msg->subsystem, loop_msg->subsystem) == 0) {
540                         dbg(msg->udev, "%llu, device event still running %llu (%d:%d)\n", msg->seqnum,
541                             loop_msg->seqnum, major(loop_msg->devt), minor(loop_msg->devt));
542                         return 4;
543                 }
544
545                 /* check physical device event (special case of parent) */
546                 if (msg->physdevpath && msg->action && strcmp(msg->action, "add") == 0)
547                         if (compare_devpath(loop_msg->devpath, msg->physdevpath) != 0) {
548                                 dbg(msg->udev, "%llu, physical device event still running %llu (%s)\n",
549                                     msg->seqnum, loop_msg->seqnum, loop_msg->devpath);
550                                 return 5;
551                         }
552         }
553         return 0;
554 }
555
556 /* serializes events for the identical and parent and child devices */
557 static void msg_queue_manager(struct udev *udev)
558 {
559         struct udevd_uevent_msg *loop_msg;
560         struct udevd_uevent_msg *tmp_msg;
561         int running;
562
563         if (list_empty(&exec_list))
564                 return;
565
566         running = running_processes();
567         dbg(udev, "%d processes runnning on system\n", running);
568         if (running < 0)
569                 running = max_childs_running;
570
571         list_for_each_entry_safe(loop_msg, tmp_msg, &exec_list, node) {
572                 /* check running processes in our session and possibly throttle */
573                 if (running >= max_childs_running) {
574                         running = running_processes_in_session(sid, max_childs_running+10);
575                         dbg(udev, "at least %d processes running in session\n", running);
576                         if (running >= max_childs_running) {
577                                 dbg(udev, "delay seq %llu, too many processes already running\n", loop_msg->seqnum);
578                                 return;
579                         }
580                 }
581
582                 /* serialize and wait for parent or child events */
583                 if (devpath_busy(loop_msg, max_childs) != 0) {
584                         dbg(udev, "delay seq %llu (%s)\n", loop_msg->seqnum, loop_msg->devpath);
585                         continue;
586                 }
587
588                 /* move event to run list */
589                 list_move_tail(&loop_msg->node, &running_list);
590                 udev_event_run(loop_msg);
591                 running++;
592                 dbg(udev, "moved seq %llu to running list\n", loop_msg->seqnum);
593         }
594 }
595
596 static struct udevd_uevent_msg *get_msg_from_envbuf(struct udev *udev, const char *buf, int buf_size)
597 {
598         int bufpos;
599         int i;
600         struct udevd_uevent_msg *msg;
601         char *physdevdriver_key = NULL;
602         int maj = 0;
603         int min = 0;
604
605         msg = malloc(sizeof(struct udevd_uevent_msg) + buf_size);
606         if (msg == NULL)
607                 return NULL;
608         memset(msg, 0x00, sizeof(struct udevd_uevent_msg) + buf_size);
609         msg->udev = udev;
610
611         /* copy environment buffer and reconstruct envp */
612         memcpy(msg->envbuf, buf, buf_size);
613         bufpos = 0;
614         for (i = 0; (bufpos < buf_size) && (i < UEVENT_NUM_ENVP-2); i++) {
615                 int keylen;
616                 char *key;
617
618                 key = &msg->envbuf[bufpos];
619                 keylen = strlen(key);
620                 msg->envp[i] = key;
621                 bufpos += keylen + 1;
622                 dbg(udev, "add '%s' to msg.envp[%i]\n", msg->envp[i], i);
623
624                 /* remember some keys for further processing */
625                 if (strncmp(key, "ACTION=", 7) == 0)
626                         msg->action = &key[7];
627                 else if (strncmp(key, "DEVPATH=", 8) == 0)
628                         msg->devpath = &key[8];
629                 else if (strncmp(key, "SUBSYSTEM=", 10) == 0)
630                         msg->subsystem = &key[10];
631                 else if (strncmp(key, "DRIVER=", 7) == 0)
632                         msg->driver = &key[7];
633                 else if (strncmp(key, "SEQNUM=", 7) == 0)
634                         msg->seqnum = strtoull(&key[7], NULL, 10);
635                 else if (strncmp(key, "DEVPATH_OLD=", 12) == 0)
636                         msg->devpath_old = &key[12];
637                 else if (strncmp(key, "PHYSDEVPATH=", 12) == 0)
638                         msg->physdevpath = &key[12];
639                 else if (strncmp(key, "PHYSDEVDRIVER=", 14) == 0)
640                         physdevdriver_key = key;
641                 else if (strncmp(key, "MAJOR=", 6) == 0)
642                         maj = strtoull(&key[6], NULL, 10);
643                 else if (strncmp(key, "MINOR=", 6) == 0)
644                         min = strtoull(&key[6], NULL, 10);
645                 else if (strncmp(key, "TIMEOUT=", 8) == 0)
646                         msg->timeout = strtoull(&key[8], NULL, 10);
647         }
648         msg->devt = makedev(maj, min);
649         msg->envp[i++] = "UDEVD_EVENT=1";
650
651         if (msg->driver == NULL && msg->physdevpath == NULL && physdevdriver_key != NULL) {
652                 /* for older kernels DRIVER is empty for a bus device, export PHYSDEVDRIVER as DRIVER */
653                 msg->envp[i++] = &physdevdriver_key[7];
654                 msg->driver = &physdevdriver_key[14];
655         }
656
657         msg->envp[i] = NULL;
658
659         if (msg->devpath == NULL || msg->action == NULL) {
660                 info(udev, "DEVPATH or ACTION missing, ignore message\n");
661                 free(msg);
662                 return NULL;
663         }
664         return msg;
665 }
666
667 /* receive the udevd message from userspace */
668 static void get_ctrl_msg(struct udev *udev)
669 {
670         struct udevd_ctrl_msg ctrl_msg;
671         ssize_t size;
672         struct msghdr smsg;
673         struct cmsghdr *cmsg;
674         struct iovec iov;
675         struct ucred *cred;
676         char cred_msg[CMSG_SPACE(sizeof(struct ucred))];
677         char *pos;
678
679         memset(&ctrl_msg, 0x00, sizeof(struct udevd_ctrl_msg));
680         iov.iov_base = &ctrl_msg;
681         iov.iov_len = sizeof(struct udevd_ctrl_msg);
682
683         memset(&smsg, 0x00, sizeof(struct msghdr));
684         smsg.msg_iov = &iov;
685         smsg.msg_iovlen = 1;
686         smsg.msg_control = cred_msg;
687         smsg.msg_controllen = sizeof(cred_msg);
688
689         size = recvmsg(udevd_sock, &smsg, 0);
690         if (size <  0) {
691                 if (errno != EINTR)
692                         err(udev, "unable to receive user udevd message: %s\n", strerror(errno));
693                 return;
694         }
695         cmsg = CMSG_FIRSTHDR(&smsg);
696         cred = (struct ucred *) CMSG_DATA(cmsg);
697
698         if (cmsg == NULL || cmsg->cmsg_type != SCM_CREDENTIALS) {
699                 err(udev, "no sender credentials received, message ignored\n");
700                 return;
701         }
702
703         if (cred->uid != 0) {
704                 err(udev, "sender uid=%i, message ignored\n", cred->uid);
705                 return;
706         }
707
708         if (strncmp(ctrl_msg.magic, UDEVD_CTRL_MAGIC, sizeof(UDEVD_CTRL_MAGIC)) != 0 ) {
709                 err(udev, "message magic '%s' doesn't match, ignore it\n", ctrl_msg.magic);
710                 return;
711         }
712
713         switch (ctrl_msg.type) {
714         case UDEVD_CTRL_ENV:
715                 pos = strchr(ctrl_msg.buf, '=');
716                 if (pos == NULL) {
717                         err(udev, "wrong key format '%s'\n", ctrl_msg.buf);
718                         break;
719                 }
720                 pos[0] = '\0';
721                 if (pos[1] == '\0') {
722                         info(udev, "udevd message (ENV) received, unset '%s'\n", ctrl_msg.buf);
723                         unsetenv(ctrl_msg.buf);
724                 } else {
725                         info(udev, "udevd message (ENV) received, set '%s=%s'\n", ctrl_msg.buf, &pos[1]);
726                         setenv(ctrl_msg.buf, &pos[1], 1);
727                 }
728                 break;
729         case UDEVD_CTRL_STOP_EXEC_QUEUE:
730                 info(udev, "udevd message (STOP_EXEC_QUEUE) received\n");
731                 stop_exec_q = 1;
732                 break;
733         case UDEVD_CTRL_START_EXEC_QUEUE:
734                 info(udev, "udevd message (START_EXEC_QUEUE) received\n");
735                 stop_exec_q = 0;
736                 msg_queue_manager(udev);
737                 break;
738         case UDEVD_CTRL_SET_LOG_LEVEL:
739                 info(udev, "udevd message (SET_LOG_PRIORITY) received, log_priority=%i\n", ctrl_msg.intval);
740                 udev_set_log_priority(udev, ctrl_msg.intval);
741                 sprintf(udev_log_env, "UDEV_LOG=%i", udev_get_log_priority(udev));
742                 putenv(udev_log_env);
743                 break;
744         case UDEVD_CTRL_SET_MAX_CHILDS:
745                 info(udev, "udevd message (UDEVD_SET_MAX_CHILDS) received, max_childs=%i\n", ctrl_msg.intval);
746                 max_childs = ctrl_msg.intval;
747                 break;
748         case UDEVD_CTRL_SET_MAX_CHILDS_RUNNING:
749                 info(udev, "udevd message (UDEVD_SET_MAX_CHILDS_RUNNING) received, max_childs_running=%i\n", ctrl_msg.intval);
750                 max_childs_running = ctrl_msg.intval;
751                 break;
752         case UDEVD_CTRL_RELOAD_RULES:
753                 info(udev, "udevd message (RELOAD_RULES) received\n");
754                 reload_config = 1;
755                 break;
756         default:
757                 err(udev, "unknown control message type\n");
758         }
759 }
760
761 /* receive the kernel user event message and do some sanity checks */
762 static struct udevd_uevent_msg *get_netlink_msg(struct udev *udev)
763 {
764         struct udevd_uevent_msg *msg;
765         int bufpos;
766         ssize_t size;
767         static char buffer[UEVENT_BUFFER_SIZE+512];
768         char *pos;
769
770         size = recv(uevent_netlink_sock, &buffer, sizeof(buffer), 0);
771         if (size <  0) {
772                 if (errno != EINTR)
773                         err(udev, "unable to receive kernel netlink message: %s\n", strerror(errno));
774                 return NULL;
775         }
776
777         if ((size_t)size > sizeof(buffer)-1)
778                 size = sizeof(buffer)-1;
779         buffer[size] = '\0';
780         dbg(udev, "uevent_size=%zi\n", size);
781
782         /* start of event payload */
783         bufpos = strlen(buffer)+1;
784         msg = get_msg_from_envbuf(udev, &buffer[bufpos], size-bufpos);
785         if (msg == NULL)
786                 return NULL;
787
788         /* validate message */
789         pos = strchr(buffer, '@');
790         if (pos == NULL) {
791                 err(udev, "invalid uevent '%s'\n", buffer);
792                 free(msg);
793                 return NULL;
794         }
795         pos[0] = '\0';
796
797         if (msg->action == NULL) {
798                 info(udev, "no ACTION in payload found, skip event '%s'\n", buffer);
799                 free(msg);
800                 return NULL;
801         }
802
803         if (strcmp(msg->action, buffer) != 0) {
804                 err(udev, "ACTION in payload does not match uevent, skip event '%s'\n", buffer);
805                 free(msg);
806                 return NULL;
807         }
808
809         return msg;
810 }
811
812 static void asmlinkage sig_handler(int signum)
813 {
814         switch (signum) {
815                 case SIGINT:
816                 case SIGTERM:
817                         udev_exit = 1;
818                         break;
819                 case SIGCHLD:
820                         /* set flag, then write to pipe if needed */
821                         sigchilds_waiting = 1;
822                         break;
823                 case SIGHUP:
824                         reload_config = 1;
825                         break;
826         }
827
828         /* write to pipe, which will wakeup select() in our mainloop */
829         write(signal_pipe[WRITE_END], "", 1);
830 }
831
832 static void udev_done(int pid, int exitstatus)
833 {
834         /* find msg associated with pid and delete it */
835         struct udevd_uevent_msg *msg;
836
837         list_for_each_entry(msg, &running_list, node) {
838                 if (msg->pid == pid) {
839                         info(msg->udev, "seq %llu, pid [%d] exit with %i, %ld seconds old\n", msg->seqnum, msg->pid,
840                              exitstatus, time(NULL) - msg->queue_time);
841                         msg->exitstatus = exitstatus;
842                         msg_queue_delete(msg);
843
844                         /* there may be events waiting with the same devpath */
845                         run_exec_q = 1;
846                         return;
847                 }
848         }
849 }
850
/*
 * Collect every child that has changed state, without blocking, and report
 * each one to udev_done().
 *
 * The status passed on is the exit code for a normal exit, 128 plus the
 * signal number for a child killed by a signal, and 0 otherwise.
 */
static void reap_sigchilds(void)
{
        int wstatus;
        pid_t child;

        /* stop as soon as waitpid() reports nothing more to reap, or an error */
        while ((child = waitpid(-1, &wstatus, WNOHANG)) > 0) {
                int result = 0;

                if (WIFEXITED(wstatus))
                        result = WEXITSTATUS(wstatus);
                else if (WIFSIGNALED(wstatus))
                        result = WTERMSIG(wstatus) + 128;

                udev_done(child, result);
        }
}
869
870 static int init_udevd_socket(struct udev *udev)
871 {
872         struct sockaddr_un saddr;
873         socklen_t addrlen;
874         const int feature_on = 1;
875         int retval;
876
877         memset(&saddr, 0x00, sizeof(saddr));
878         saddr.sun_family = AF_LOCAL;
879         strcpy(saddr.sun_path, UDEVD_CTRL_SOCK_PATH);
880         addrlen = offsetof(struct sockaddr_un, sun_path) + strlen(saddr.sun_path);
881         /* translate leading '@' to abstract namespace */
882         if (saddr.sun_path[0] == '@')
883                 saddr.sun_path[0] = '\0';
884
885         udevd_sock = socket(AF_LOCAL, SOCK_DGRAM, 0);
886         if (udevd_sock == -1) {
887                 err(udev, "error getting socket: %s\n", strerror(errno));
888                 return -1;
889         }
890
891         /* the bind takes care of ensuring only one copy running */
892         retval = bind(udevd_sock, (struct sockaddr *) &saddr, addrlen);
893         if (retval < 0) {
894                 err(udev, "bind failed: %s\n", strerror(errno));
895                 close(udevd_sock);
896                 udevd_sock = -1;
897                 return -1;
898         }
899
900         /* enable receiving of the sender credentials */
901         setsockopt(udevd_sock, SOL_SOCKET, SO_PASSCRED, &feature_on, sizeof(feature_on));
902
903         return 0;
904 }
905
906 static int init_uevent_netlink_sock(struct udev *udev)
907 {
908         struct sockaddr_nl snl;
909         const int buffersize = 16 * 1024 * 1024;
910         int retval;
911
912         memset(&snl, 0x00, sizeof(struct sockaddr_nl));
913         snl.nl_family = AF_NETLINK;
914         snl.nl_pid = getpid();
915         snl.nl_groups = 1;
916
917         uevent_netlink_sock = socket(PF_NETLINK, SOCK_DGRAM, NETLINK_KOBJECT_UEVENT);
918         if (uevent_netlink_sock == -1) {
919                 err(udev, "error getting socket: %s\n", strerror(errno));
920                 return -1;
921         }
922
923         /* set receive buffersize */
924         setsockopt(uevent_netlink_sock, SOL_SOCKET, SO_RCVBUFFORCE, &buffersize, sizeof(buffersize));
925
926         retval = bind(uevent_netlink_sock, (struct sockaddr *) &snl, sizeof(struct sockaddr_nl));
927         if (retval < 0) {
928                 err(udev, "bind failed: %s\n", strerror(errno));
929                 close(uevent_netlink_sock);
930                 uevent_netlink_sock = -1;
931                 return -1;
932         }
933         return 0;
934 }
935
936 static void export_initial_seqnum(struct udev *udev)
937 {
938         char filename[PATH_SIZE];
939         int fd;
940         char seqnum[32];
941         ssize_t len = 0;
942
943         strlcpy(filename, udev_get_sys_path(udev), sizeof(filename));
944         strlcat(filename, "/kernel/uevent_seqnum", sizeof(filename));
945         fd = open(filename, O_RDONLY);
946         if (fd >= 0) {
947                 len = read(fd, seqnum, sizeof(seqnum)-1);
948                 close(fd);
949         }
950         if (len <= 0) {
951                 strcpy(seqnum, "0\n");
952                 len = 3;
953         }
954         strlcpy(filename, udev_get_dev_path(udev), sizeof(filename));
955         strlcat(filename, "/.udev/uevent_seqnum", sizeof(filename));
956         create_path(udev, filename);
957         fd = open(filename, O_WRONLY|O_TRUNC|O_CREAT, 0644);
958         if (fd >= 0) {
959                 write(fd, seqnum, len);
960                 close(fd);
961         }
962 }
963
964 int main(int argc, char *argv[])
965 {
966         struct udev *udev;
967         int retval;
968         int fd;
969         struct sigaction act;
970         fd_set readfds;
971         const char *value;
972         int daemonize = 0;
973         static const struct option options[] = {
974                 { "daemon", 0, NULL, 'd' },
975                 { "debug-trace", 0, NULL, 't' },
976                 { "debug", 0, NULL, 'D' },
977                 { "help", 0, NULL, 'h' },
978                 { "version", 0, NULL, 'V' },
979                 {}
980         };
981         int rc = 1;
982         int maxfd;
983
984         udev = udev_new();
985         if (udev == NULL)
986                 goto exit;
987
988         logging_init("udevd");
989         udev_set_log_fn(udev, log_fn);
990
991         selinux_init(udev);
992         dbg(udev, "version %s\n", VERSION);
993
994         while (1) {
995                 int option;
996
997                 option = getopt_long(argc, argv, "dDthV", options, NULL);
998                 if (option == -1)
999                         break;
1000
1001                 switch (option) {
1002                 case 'd':
1003                         daemonize = 1;
1004                         break;
1005                 case 't':
1006                         debug_trace = 1;
1007                         break;
1008                 case 'D':
1009                         debug = 1;
1010                         if (udev_get_log_priority(udev) < LOG_INFO)
1011                                 udev_set_log_priority(udev, LOG_INFO);
1012                         break;
1013                 case 'h':
1014                         printf("Usage: udevd [--help] [--daemon] [--debug-trace] [--debug] [--version]\n");
1015                         goto exit;
1016                 case 'V':
1017                         printf("%s\n", VERSION);
1018                         goto exit;
1019                 default:
1020                         goto exit;
1021                 }
1022         }
1023
1024         if (getuid() != 0) {
1025                 fprintf(stderr, "root privileges required\n");
1026                 err(udev, "root privileges required\n");
1027                 goto exit;
1028         }
1029
1030         /* make sure std{in,out,err} fd's are in a sane state */
1031         fd = open("/dev/null", O_RDWR);
1032         if (fd < 0) {
1033                 fprintf(stderr, "cannot open /dev/null\n");
1034                 err(udev, "cannot open /dev/null\n");
1035         }
1036         if (fd > STDIN_FILENO)
1037                 dup2(fd, STDIN_FILENO);
1038         if (write(STDOUT_FILENO, 0, 0) < 0)
1039                 dup2(fd, STDOUT_FILENO);
1040         if (write(STDERR_FILENO, 0, 0) < 0)
1041                 dup2(fd, STDERR_FILENO);
1042
1043         /* init sockets to receive events */
1044         if (init_udevd_socket(udev) < 0) {
1045                 if (errno == EADDRINUSE) {
1046                         fprintf(stderr, "another udev daemon already running\n");
1047                         err(udev, "another udev daemon already running\n");
1048                         rc = 1;
1049                 } else {
1050                         fprintf(stderr, "error initializing udevd socket\n");
1051                         err(udev, "error initializing udevd socket\n");
1052                         rc = 2;
1053                 }
1054                 goto exit;
1055         }
1056
1057         if (init_uevent_netlink_sock(udev) < 0) {
1058                 fprintf(stderr, "error initializing netlink socket\n");
1059                 err(udev, "error initializing netlink socket\n");
1060                 rc = 3;
1061                 goto exit;
1062         }
1063
1064         /* setup signal handler pipe */
1065         retval = pipe(signal_pipe);
1066         if (retval < 0) {
1067                 err(udev, "error getting pipes: %s\n", strerror(errno));
1068                 goto exit;
1069         }
1070
1071         retval = fcntl(signal_pipe[READ_END], F_GETFL, 0);
1072         if (retval < 0) {
1073                 err(udev, "error fcntl on read pipe: %s\n", strerror(errno));
1074                 goto exit;
1075         }
1076         retval = fcntl(signal_pipe[READ_END], F_SETFL, retval | O_NONBLOCK);
1077         if (retval < 0) {
1078                 err(udev, "error fcntl on read pipe: %s\n", strerror(errno));
1079                 goto exit;
1080         }
1081
1082         retval = fcntl(signal_pipe[WRITE_END], F_GETFL, 0);
1083         if (retval < 0) {
1084                 err(udev, "error fcntl on write pipe: %s\n", strerror(errno));
1085                 goto exit;
1086         }
1087         retval = fcntl(signal_pipe[WRITE_END], F_SETFL, retval | O_NONBLOCK);
1088         if (retval < 0) {
1089                 err(udev, "error fcntl on write pipe: %s\n", strerror(errno));
1090                 goto exit;
1091         }
1092
1093         /* parse the rules and keep them in memory */
1094         sysfs_init();
1095         udev_rules_init(udev, &rules, 1);
1096
1097         export_initial_seqnum(udev);
1098
1099         if (daemonize) {
1100                 pid_t pid;
1101
1102                 pid = fork();
1103                 switch (pid) {
1104                 case 0:
1105                         dbg(udev, "daemonized fork running\n");
1106                         break;
1107                 case -1:
1108                         err(udev, "fork of daemon failed: %s\n", strerror(errno));
1109                         rc = 4;
1110                         goto exit;
1111                 default:
1112                         dbg(udev, "child [%u] running, parent exits\n", pid);
1113                         rc = 0;
1114                         goto exit;
1115                 }
1116         }
1117
1118         /* redirect std{out,err} fd's */
1119         if (!debug)
1120                 dup2(fd, STDOUT_FILENO);
1121         dup2(fd, STDERR_FILENO);
1122         if (fd > STDERR_FILENO)
1123                 close(fd);
1124
1125         /* set scheduling priority for the daemon */
1126         setpriority(PRIO_PROCESS, 0, UDEVD_PRIORITY);
1127
1128         chdir("/");
1129         umask(022);
1130
1131         /* become session leader */
1132         sid = setsid();
1133         dbg(udev, "our session is %d\n", sid);
1134
1135         /* OOM_DISABLE == -17 */
1136         fd = open("/proc/self/oom_adj", O_RDWR);
1137         if (fd < 0)
1138                 err(udev, "error disabling OOM: %s\n", strerror(errno));
1139         else {
1140                 write(fd, "-17", 3);
1141                 close(fd);
1142         }
1143
1144         fd = open("/dev/kmsg", O_WRONLY);
1145         if (fd > 0) {
1146                 const char *str = "<6>udevd version " VERSION " started\n";
1147
1148                 write(fd, str, strlen(str));
1149                 close(fd);
1150         }
1151
1152         /* set signal handlers */
1153         memset(&act, 0x00, sizeof(struct sigaction));
1154         act.sa_handler = (void (*)(int)) sig_handler;
1155         sigemptyset(&act.sa_mask);
1156         act.sa_flags = SA_RESTART;
1157         sigaction(SIGINT, &act, NULL);
1158         sigaction(SIGTERM, &act, NULL);
1159         sigaction(SIGCHLD, &act, NULL);
1160         sigaction(SIGHUP, &act, NULL);
1161
1162         /* watch rules directory */
1163         inotify_fd = inotify_init();
1164         if (inotify_fd >= 0) {
1165                 if (udev_get_rules_path(udev) != NULL) {
1166                         inotify_add_watch(inotify_fd, udev_get_rules_path(udev),
1167                                           IN_CREATE | IN_DELETE | IN_MOVE | IN_CLOSE_WRITE);
1168                 } else {
1169                         char filename[PATH_MAX];
1170
1171                         inotify_add_watch(inotify_fd, UDEV_PREFIX "/lib/udev/rules.d",
1172                                           IN_CREATE | IN_DELETE | IN_MOVE | IN_CLOSE_WRITE);
1173                         inotify_add_watch(inotify_fd, SYSCONFDIR "/udev/rules.d",
1174                                           IN_CREATE | IN_DELETE | IN_MOVE | IN_CLOSE_WRITE);
1175
1176                         /* watch dynamic rules directory */
1177                         strlcpy(filename, udev_get_dev_path(udev), sizeof(filename));
1178                         strlcat(filename, "/.udev/rules.d", sizeof(filename));
1179                         inotify_add_watch(inotify_fd, filename,
1180                                           IN_CREATE | IN_DELETE | IN_MOVE | IN_CLOSE_WRITE);
1181                 }
1182         } else if (errno == ENOSYS)
1183                 err(udev, "the kernel does not support inotify, udevd can't monitor rules file changes\n");
1184         else
1185                 err(udev, "inotify_init failed: %s\n", strerror(errno));
1186
1187         /* maximum limit of forked childs */
1188         value = getenv("UDEVD_MAX_CHILDS");
1189         if (value)
1190                 max_childs = strtoul(value, NULL, 10);
1191         else {
1192                 int memsize = mem_size_mb();
1193                 if (memsize > 0)
1194                         max_childs = 128 + (memsize / 4);
1195                 else
1196                         max_childs = UDEVD_MAX_CHILDS;
1197         }
1198         info(udev, "initialize max_childs to %u\n", max_childs);
1199
1200         /* start to throttle forking if maximum number of _running_ childs is reached */
1201         value = getenv("UDEVD_MAX_CHILDS_RUNNING");
1202         if (value)
1203                 max_childs_running = strtoull(value, NULL, 10);
1204         else {
1205                 int cpus = cpu_count();
1206                 if (cpus > 0)
1207                         max_childs_running = 8 + (8 * cpus);
1208                 else
1209                         max_childs_running = UDEVD_MAX_CHILDS_RUNNING;
1210         }
1211         info(udev, "initialize max_childs_running to %u\n", max_childs_running);
1212
1213         /* clear environment for forked event processes */
1214         clearenv();
1215
1216         /* export log_priority , as called programs may want to follow that setting */
1217         sprintf(udev_log_env, "UDEV_LOG=%i", udev_get_log_priority(udev));
1218         putenv(udev_log_env);
1219         if (debug_trace)
1220                 putenv("DEBUG=1");
1221
1222         maxfd = udevd_sock;
1223         maxfd = UDEV_MAX(maxfd, uevent_netlink_sock);
1224         maxfd = UDEV_MAX(maxfd, signal_pipe[READ_END]);
1225         maxfd = UDEV_MAX(maxfd, inotify_fd);
1226
1227         while (!udev_exit) {
1228                 struct udevd_uevent_msg *msg;
1229                 int fdcount;
1230
1231                 FD_ZERO(&readfds);
1232                 FD_SET(signal_pipe[READ_END], &readfds);
1233                 FD_SET(udevd_sock, &readfds);
1234                 FD_SET(uevent_netlink_sock, &readfds);
1235                 if (inotify_fd >= 0)
1236                         FD_SET(inotify_fd, &readfds);
1237
1238                 fdcount = select(maxfd+1, &readfds, NULL, NULL, NULL);
1239                 if (fdcount < 0) {
1240                         if (errno != EINTR)
1241                                 err(udev, "error in select: %s\n", strerror(errno));
1242                         continue;
1243                 }
1244
1245                 /* get control message */
1246                 if (FD_ISSET(udevd_sock, &readfds))
1247                         get_ctrl_msg(udev);
1248
1249                 /* get netlink message */
1250                 if (FD_ISSET(uevent_netlink_sock, &readfds)) {
1251                         msg = get_netlink_msg(udev);
1252                         if (msg)
1253                                 msg_queue_insert(msg);
1254                 }
1255
1256                 /* received a signal, clear our notification pipe */
1257                 if (FD_ISSET(signal_pipe[READ_END], &readfds)) {
1258                         char buf[256];
1259
1260                         read(signal_pipe[READ_END], &buf, sizeof(buf));
1261                 }
1262
1263                 /* rules directory inotify watch */
1264                 if ((inotify_fd >= 0) && FD_ISSET(inotify_fd, &readfds)) {
1265                         int nbytes;
1266
1267                         /* discard all possible events, we can just reload the config */
1268                         if ((ioctl(inotify_fd, FIONREAD, &nbytes) == 0) && nbytes > 0) {
1269                                 char *buf;
1270
1271                                 reload_config = 1;
1272                                 buf = malloc(nbytes);
1273                                 if (buf == NULL) {
1274                                         err(udev, "error getting buffer for inotify, disable watching\n");
1275                                         close(inotify_fd);
1276                                         inotify_fd = -1;
1277                                 }
1278                                 read(inotify_fd, buf, nbytes);
1279                                 free(buf);
1280                         }
1281                 }
1282
1283                 /* rules changed, set by inotify or a HUP signal */
1284                 if (reload_config) {
1285                         reload_config = 0;
1286                         udev_rules_cleanup(&rules);
1287                         udev_rules_init(udev, &rules, 1);
1288                 }
1289
1290                 /* forked child has returned */
1291                 if (sigchilds_waiting) {
1292                         sigchilds_waiting = 0;
1293                         reap_sigchilds();
1294                 }
1295
1296                 if (run_exec_q) {
1297                         run_exec_q = 0;
1298                         if (!stop_exec_q)
1299                                 msg_queue_manager(udev);
1300                 }
1301         }
1302         rc = 0;
1303
1304 exit:
1305         udev_rules_cleanup(&rules);
1306         sysfs_cleanup();
1307         selinux_exit(udev);
1308
1309         if (signal_pipe[READ_END] >= 0)
1310                 close(signal_pipe[READ_END]);
1311         if (signal_pipe[WRITE_END] >= 0)
1312                 close(signal_pipe[WRITE_END]);
1313
1314         if (udevd_sock >= 0)
1315                 close(udevd_sock);
1316         if (inotify_fd >= 0)
1317                 close(inotify_fd);
1318         if (uevent_netlink_sock >= 0)
1319                 close(uevent_netlink_sock);
1320
1321         logging_close();
1322         return rc;
1323 }