chiark / gitweb /
path: simplify recheck logic
[elogind.git] / src / socket.c
1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
2
3 /***
4   This file is part of systemd.
5
6   Copyright 2010 Lennart Poettering
7
8   systemd is free software; you can redistribute it and/or modify it
9   under the terms of the GNU General Public License as published by
10   the Free Software Foundation; either version 2 of the License, or
11   (at your option) any later version.
12
13   systemd is distributed in the hope that it will be useful, but
14   WITHOUT ANY WARRANTY; without even the implied warranty of
15   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16   General Public License for more details.
17
18   You should have received a copy of the GNU General Public License
19   along with systemd; If not, see <http://www.gnu.org/licenses/>.
20 ***/
21
22 #include <sys/types.h>
23 #include <sys/stat.h>
24 #include <unistd.h>
25 #include <errno.h>
26 #include <fcntl.h>
27 #include <sys/epoll.h>
28 #include <signal.h>
29 #include <arpa/inet.h>
30
31 #include "unit.h"
32 #include "socket.h"
33 #include "netinet/tcp.h"
34 #include "log.h"
35 #include "load-dropin.h"
36 #include "load-fragment.h"
37 #include "strv.h"
38 #include "unit-name.h"
39 #include "dbus-socket.h"
40 #include "missing.h"
41 #include "special.h"
42 #include "bus-errors.h"
43 #include "label.h"
44 #include "exit-status.h"
45 #include "def.h"
46
47 static const UnitActiveState state_translation_table[_SOCKET_STATE_MAX] = {
48         [SOCKET_DEAD] = UNIT_INACTIVE,
49         [SOCKET_START_PRE] = UNIT_ACTIVATING,
50         [SOCKET_START_POST] = UNIT_ACTIVATING,
51         [SOCKET_LISTENING] = UNIT_ACTIVE,
52         [SOCKET_RUNNING] = UNIT_ACTIVE,
53         [SOCKET_STOP_PRE] = UNIT_DEACTIVATING,
54         [SOCKET_STOP_PRE_SIGTERM] = UNIT_DEACTIVATING,
55         [SOCKET_STOP_PRE_SIGKILL] = UNIT_DEACTIVATING,
56         [SOCKET_STOP_POST] = UNIT_DEACTIVATING,
57         [SOCKET_FINAL_SIGTERM] = UNIT_DEACTIVATING,
58         [SOCKET_FINAL_SIGKILL] = UNIT_DEACTIVATING,
59         [SOCKET_FAILED] = UNIT_FAILED
60 };
61
62 static void socket_init(Unit *u) {
63         Socket *s = SOCKET(u);
64
65         assert(u);
66         assert(u->meta.load_state == UNIT_STUB);
67
68         s->backlog = SOMAXCONN;
69         s->timeout_usec = DEFAULT_TIMEOUT_USEC;
70         s->directory_mode = 0755;
71         s->socket_mode = 0777;
72
73         s->max_connections = 64;
74
75         s->priority = -1;
76         s->ip_tos = -1;
77         s->ip_ttl = -1;
78         s->mark = -1;
79
80         exec_context_init(&s->exec_context);
81         s->exec_context.std_output = u->meta.manager->default_std_output;
82         s->exec_context.std_error = u->meta.manager->default_std_error;
83
84         s->control_command_id = _SOCKET_EXEC_COMMAND_INVALID;
85 }
86
87 static void socket_unwatch_control_pid(Socket *s) {
88         assert(s);
89
90         if (s->control_pid <= 0)
91                 return;
92
93         unit_unwatch_pid(UNIT(s), s->control_pid);
94         s->control_pid = 0;
95 }
96
97 static void socket_done(Unit *u) {
98         Socket *s = SOCKET(u);
99         SocketPort *p;
100         Meta *i;
101
102         assert(s);
103
104         while ((p = s->ports)) {
105                 LIST_REMOVE(SocketPort, port, s->ports, p);
106
107                 if (p->fd >= 0) {
108                         unit_unwatch_fd(UNIT(s), &p->fd_watch);
109                         close_nointr_nofail(p->fd);
110                 }
111
112                 free(p->path);
113                 free(p);
114         }
115
116         exec_context_done(&s->exec_context);
117         exec_command_free_array(s->exec_command, _SOCKET_EXEC_COMMAND_MAX);
118         s->control_command = NULL;
119
120         socket_unwatch_control_pid(s);
121
122         s->service = NULL;
123
124         free(s->tcp_congestion);
125         s->tcp_congestion = NULL;
126
127         free(s->bind_to_device);
128         s->bind_to_device = NULL;
129
130         unit_unwatch_timer(u, &s->timer_watch);
131
132         /* Make sure no service instance refers to us anymore. */
133         LIST_FOREACH(units_per_type, i, u->meta.manager->units_per_type[UNIT_SERVICE]) {
134                 Service *service = (Service *) i;
135
136                 if (service->accept_socket == s)
137                         service->accept_socket = NULL;
138
139                 set_remove(service->configured_sockets, s);
140         }
141 }
142
143 static int socket_instantiate_service(Socket *s) {
144         char *prefix, *name;
145         int r;
146         Unit *u;
147
148         assert(s);
149
150         /* This fills in s->service if it isn't filled in yet. For
151          * Accept=yes sockets we create the next connection service
152          * here. For Accept=no this is mostly a NOP since the service
153          * is figured out at load time anyway. */
154
155         if (s->service)
156                 return 0;
157
158         assert(s->accept);
159
160         if (!(prefix = unit_name_to_prefix(s->meta.id)))
161                 return -ENOMEM;
162
163         r = asprintf(&name, "%s@%u.service", prefix, s->n_accepted);
164         free(prefix);
165
166         if (r < 0)
167                 return -ENOMEM;
168
169         r = manager_load_unit(s->meta.manager, name, NULL, NULL, &u);
170         free(name);
171
172         if (r < 0)
173                 return r;
174
175 #ifdef HAVE_SYSV_COMPAT
176         if (SERVICE(u)->sysv_path) {
177                 log_error("Using SysV services for socket activation is not supported. Refusing.");
178                 return -ENOENT;
179         }
180 #endif
181
182         u->meta.no_gc = true;
183         s->service = SERVICE(u);
184         return 0;
185 }
186
187 static bool have_non_accept_socket(Socket *s) {
188         SocketPort *p;
189
190         assert(s);
191
192         if (!s->accept)
193                 return true;
194
195         LIST_FOREACH(port, p, s->ports) {
196
197                 if (p->type != SOCKET_SOCKET)
198                         return true;
199
200                 if (!socket_address_can_accept(&p->address))
201                         return true;
202         }
203
204         return false;
205 }
206
207 static int socket_verify(Socket *s) {
208         assert(s);
209
210         if (s->meta.load_state != UNIT_LOADED)
211                 return 0;
212
213         if (!s->ports) {
214                 log_error("%s lacks Listen setting. Refusing.", s->meta.id);
215                 return -EINVAL;
216         }
217
218         if (s->accept && have_non_accept_socket(s)) {
219                 log_error("%s configured for accepting sockets, but sockets are non-accepting. Refusing.", s->meta.id);
220                 return -EINVAL;
221         }
222
223         if (s->accept && s->max_connections <= 0) {
224                 log_error("%s's MaxConnection setting too small. Refusing.", s->meta.id);
225                 return -EINVAL;
226         }
227
228         if (s->accept && s->service) {
229                 log_error("Explicit service configuration for accepting sockets not supported on %s. Refusing.", s->meta.id);
230                 return -EINVAL;
231         }
232
233         if (s->exec_context.pam_name && s->exec_context.kill_mode != KILL_CONTROL_GROUP) {
234                 log_error("%s has PAM enabled. Kill mode must be set to 'control-group'. Refusing.", s->meta.id);
235                 return -EINVAL;
236         }
237
238         return 0;
239 }
240
241 static bool socket_needs_mount(Socket *s, const char *prefix) {
242         SocketPort *p;
243
244         assert(s);
245
246         LIST_FOREACH(port, p, s->ports) {
247
248                 if (p->type == SOCKET_SOCKET) {
249                         if (socket_address_needs_mount(&p->address, prefix))
250                                 return true;
251                 } else {
252                         assert(p->type == SOCKET_FIFO || p->type == SOCKET_SPECIAL);
253                         if (path_startswith(p->path, prefix))
254                                 return true;
255                 }
256         }
257
258         return false;
259 }
260
261 int socket_add_one_mount_link(Socket *s, Mount *m) {
262         int r;
263
264         assert(s);
265         assert(m);
266
267         if (s->meta.load_state != UNIT_LOADED ||
268             m->meta.load_state != UNIT_LOADED)
269                 return 0;
270
271         if (!socket_needs_mount(s, m->where))
272                 return 0;
273
274         if ((r = unit_add_two_dependencies(UNIT(s), UNIT_AFTER, UNIT_REQUIRES, UNIT(m), true)) < 0)
275                 return r;
276
277         return 0;
278 }
279
280 static int socket_add_mount_links(Socket *s) {
281         Meta *other;
282         int r;
283
284         assert(s);
285
286         LIST_FOREACH(units_per_type, other, s->meta.manager->units_per_type[UNIT_MOUNT])
287                 if ((r = socket_add_one_mount_link(s, (Mount*) other)) < 0)
288                         return r;
289
290         return 0;
291 }
292
293 static int socket_add_device_link(Socket *s) {
294         char *t;
295         int r;
296
297         assert(s);
298
299         if (!s->bind_to_device)
300                 return 0;
301
302         if (asprintf(&t, "/sys/subsystem/net/devices/%s", s->bind_to_device) < 0)
303                 return -ENOMEM;
304
305         r = unit_add_node_link(UNIT(s), t, false);
306         free(t);
307
308         return r;
309 }
310
311 static int socket_add_default_dependencies(Socket *s) {
312         int r;
313         assert(s);
314
315         if (s->meta.manager->running_as == MANAGER_SYSTEM) {
316                 if ((r = unit_add_dependency_by_name(UNIT(s), UNIT_BEFORE, SPECIAL_SOCKETS_TARGET, NULL, true)) < 0)
317                         return r;
318
319                 if ((r = unit_add_two_dependencies_by_name(UNIT(s), UNIT_AFTER, UNIT_REQUIRES, SPECIAL_SYSINIT_TARGET, NULL, true)) < 0)
320                         return r;
321         }
322
323         return unit_add_two_dependencies_by_name(UNIT(s), UNIT_BEFORE, UNIT_CONFLICTS, SPECIAL_SHUTDOWN_TARGET, NULL, true);
324 }
325
326 static int socket_load(Unit *u) {
327         Socket *s = SOCKET(u);
328         int r;
329
330         assert(u);
331         assert(u->meta.load_state == UNIT_STUB);
332
333         if ((r = unit_load_fragment_and_dropin(u)) < 0)
334                 return r;
335
336         /* This is a new unit? Then let's add in some extras */
337         if (u->meta.load_state == UNIT_LOADED) {
338
339                 if (have_non_accept_socket(s)) {
340
341                         if (!s->service)
342                                 if ((r = unit_load_related_unit(u, ".service", (Unit**) &s->service)) < 0)
343                                         return r;
344
345                         if ((r = unit_add_dependency(u, UNIT_BEFORE, UNIT(s->service), true)) < 0)
346                                 return r;
347                 }
348
349                 if ((r = socket_add_mount_links(s)) < 0)
350                         return r;
351
352                 if ((r = socket_add_device_link(s)) < 0)
353                         return r;
354
355                 if ((r = unit_add_exec_dependencies(u, &s->exec_context)) < 0)
356                         return r;
357
358                 if ((r = unit_add_default_cgroups(u)) < 0)
359                         return r;
360
361                 if (s->meta.default_dependencies)
362                         if ((r = socket_add_default_dependencies(s)) < 0)
363                                 return r;
364         }
365
366         return socket_verify(s);
367 }
368
/* Returns the name of the Listen* setting that matches the given
 * address family and socket type. Netlink takes precedence over the
 * socket type. Any other type than stream, datagram or seqpacket is a
 * programming error. */
static const char* listen_lookup(int family, int type) {

        if (family == AF_NETLINK)
                return "ListenNetlink";

        switch (type) {

        case SOCK_STREAM:
                return "ListenStream";

        case SOCK_DGRAM:
                return "ListenDatagram";

        case SOCK_SEQPACKET:
                return "ListenSequentialPacket";

        default:
                break;
        }

        assert_not_reached("Unknown socket type");
        return NULL;
}
384
385 static void socket_dump(Unit *u, FILE *f, const char *prefix) {
386
387         SocketExecCommand c;
388         Socket *s = SOCKET(u);
389         SocketPort *p;
390         const char *prefix2;
391         char *p2;
392
393         assert(s);
394         assert(f);
395
396         p2 = strappend(prefix, "\t");
397         prefix2 = p2 ? p2 : prefix;
398
399         fprintf(f,
400                 "%sSocket State: %s\n"
401                 "%sBindIPv6Only: %s\n"
402                 "%sBacklog: %u\n"
403                 "%sSocketMode: %04o\n"
404                 "%sDirectoryMode: %04o\n"
405                 "%sKeepAlive: %s\n"
406                 "%sFreeBind: %s\n"
407                 "%sTCPCongestion: %s\n",
408                 prefix, socket_state_to_string(s->state),
409                 prefix, socket_address_bind_ipv6_only_to_string(s->bind_ipv6_only),
410                 prefix, s->backlog,
411                 prefix, s->socket_mode,
412                 prefix, s->directory_mode,
413                 prefix, yes_no(s->keep_alive),
414                 prefix, yes_no(s->free_bind),
415                 prefix, strna(s->tcp_congestion));
416
417         if (s->control_pid > 0)
418                 fprintf(f,
419                         "%sControl PID: %lu\n",
420                         prefix, (unsigned long) s->control_pid);
421
422         if (s->bind_to_device)
423                 fprintf(f,
424                         "%sBindToDevice: %s\n",
425                         prefix, s->bind_to_device);
426
427         if (s->accept)
428                 fprintf(f,
429                         "%sAccepted: %u\n"
430                         "%sNConnections: %u\n"
431                         "%sMaxConnections: %u\n",
432                         prefix, s->n_accepted,
433                         prefix, s->n_connections,
434                         prefix, s->max_connections);
435
436         if (s->priority >= 0)
437                 fprintf(f,
438                         "%sPriority: %i\n",
439                         prefix, s->priority);
440
441         if (s->receive_buffer > 0)
442                 fprintf(f,
443                         "%sReceiveBuffer: %zu\n",
444                         prefix, s->receive_buffer);
445
446         if (s->send_buffer > 0)
447                 fprintf(f,
448                         "%sSendBuffer: %zu\n",
449                         prefix, s->send_buffer);
450
451         if (s->ip_tos >= 0)
452                 fprintf(f,
453                         "%sIPTOS: %i\n",
454                         prefix, s->ip_tos);
455
456         if (s->ip_ttl >= 0)
457                 fprintf(f,
458                         "%sIPTTL: %i\n",
459                         prefix, s->ip_ttl);
460
461         if (s->pipe_size > 0)
462                 fprintf(f,
463                         "%sPipeSize: %zu\n",
464                         prefix, s->pipe_size);
465
466         if (s->mark >= 0)
467                 fprintf(f,
468                         "%sMark: %i\n",
469                         prefix, s->mark);
470
471         LIST_FOREACH(port, p, s->ports) {
472
473                 if (p->type == SOCKET_SOCKET) {
474                         const char *t;
475                         int r;
476                         char *k = NULL;
477
478                         if ((r = socket_address_print(&p->address, &k)) < 0)
479                                 t = strerror(-r);
480                         else
481                                 t = k;
482
483                         fprintf(f, "%s%s: %s\n", prefix, listen_lookup(socket_address_family(&p->address), p->address.type), t);
484                         free(k);
485                 } else if (p->type == SOCKET_SPECIAL)
486                         fprintf(f, "%sListenSpecial: %s\n", prefix, p->path);
487                 else
488                         fprintf(f, "%sListenFIFO: %s\n", prefix, p->path);
489         }
490
491         exec_context_dump(&s->exec_context, f, prefix);
492
493         for (c = 0; c < _SOCKET_EXEC_COMMAND_MAX; c++) {
494                 if (!s->exec_command[c])
495                         continue;
496
497                 fprintf(f, "%s-> %s:\n",
498                         prefix, socket_exec_command_to_string(c));
499
500                 exec_command_dump_list(s->exec_command[c], f, prefix2);
501         }
502
503         free(p2);
504 }
505
506 static int instance_from_socket(int fd, unsigned nr, char **instance) {
507         socklen_t l;
508         char *r;
509         union {
510                 struct sockaddr sa;
511                 struct sockaddr_un un;
512                 struct sockaddr_in in;
513                 struct sockaddr_in6 in6;
514                 struct sockaddr_storage storage;
515         } local, remote;
516
517         assert(fd >= 0);
518         assert(instance);
519
520         l = sizeof(local);
521         if (getsockname(fd, &local.sa, &l) < 0)
522                 return -errno;
523
524         l = sizeof(remote);
525         if (getpeername(fd, &remote.sa, &l) < 0)
526                 return -errno;
527
528         switch (local.sa.sa_family) {
529
530         case AF_INET: {
531                 uint32_t
532                         a = ntohl(local.in.sin_addr.s_addr),
533                         b = ntohl(remote.in.sin_addr.s_addr);
534
535                 if (asprintf(&r,
536                              "%u.%u.%u.%u:%u-%u.%u.%u.%u:%u",
537                              a >> 24, (a >> 16) & 0xFF, (a >> 8) & 0xFF, a & 0xFF,
538                              ntohs(local.in.sin_port),
539                              b >> 24, (b >> 16) & 0xFF, (b >> 8) & 0xFF, b & 0xFF,
540                              ntohs(remote.in.sin_port)) < 0)
541                         return -ENOMEM;
542
543                 break;
544         }
545
546         case AF_INET6: {
547                 static const char ipv4_prefix[] = {
548                         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0xFF, 0xFF
549                 };
550
551                 if (memcmp(&local.in6.sin6_addr, ipv4_prefix, sizeof(ipv4_prefix)) == 0 &&
552                     memcmp(&remote.in6.sin6_addr, ipv4_prefix, sizeof(ipv4_prefix)) == 0) {
553                         const uint8_t
554                                 *a = local.in6.sin6_addr.s6_addr+12,
555                                 *b = remote.in6.sin6_addr.s6_addr+12;
556
557                         if (asprintf(&r,
558                                      "%u.%u.%u.%u:%u-%u.%u.%u.%u:%u",
559                                      a[0], a[1], a[2], a[3],
560                                      ntohs(local.in6.sin6_port),
561                                      b[0], b[1], b[2], b[3],
562                                      ntohs(remote.in6.sin6_port)) < 0)
563                                 return -ENOMEM;
564                 } else {
565                         char a[INET6_ADDRSTRLEN], b[INET6_ADDRSTRLEN];
566
567                         if (asprintf(&r,
568                                      "%s:%u-%s:%u",
569                                      inet_ntop(AF_INET6, &local.in6.sin6_addr, a, sizeof(a)),
570                                      ntohs(local.in6.sin6_port),
571                                      inet_ntop(AF_INET6, &remote.in6.sin6_addr, b, sizeof(b)),
572                                      ntohs(remote.in6.sin6_port)) < 0)
573                                 return -ENOMEM;
574                 }
575
576                 break;
577         }
578
579         case AF_UNIX: {
580                 struct ucred ucred;
581
582                 l = sizeof(ucred);
583                 if (getsockopt(fd, SOL_SOCKET, SO_PEERCRED, &ucred, &l) < 0)
584                         return -errno;
585
586                 if (asprintf(&r,
587                              "%u-%lu-%lu",
588                              nr,
589                              (unsigned long) ucred.pid,
590                              (unsigned long) ucred.uid) < 0)
591                         return -ENOMEM;
592
593                 break;
594         }
595
596         default:
597                 assert_not_reached("Unhandled socket type.");
598         }
599
600         *instance = r;
601         return 0;
602 }
603
604 static void socket_close_fds(Socket *s) {
605         SocketPort *p;
606
607         assert(s);
608
609         LIST_FOREACH(port, p, s->ports) {
610                 if (p->fd < 0)
611                         continue;
612
613                 unit_unwatch_fd(UNIT(s), &p->fd_watch);
614                 close_nointr_nofail(p->fd);
615
616                 /* One little note: we should never delete any sockets
617                  * in the file system here! After all some other
618                  * process we spawned might still have a reference of
619                  * this fd and wants to continue to use it. Therefore
620                  * we delete sockets in the file system before we
621                  * create a new one, not after we stopped using
622                  * one! */
623
624                 p->fd = -1;
625         }
626 }
627
628 static void socket_apply_socket_options(Socket *s, int fd) {
629         assert(s);
630         assert(fd >= 0);
631
632         if (s->keep_alive) {
633                 int b = s->keep_alive;
634                 if (setsockopt(fd, SOL_SOCKET, SO_KEEPALIVE, &b, sizeof(b)) < 0)
635                         log_warning("SO_KEEPALIVE failed: %m");
636         }
637
638         if (s->priority >= 0)
639                 if (setsockopt(fd, SOL_SOCKET, SO_PRIORITY, &s->priority, sizeof(s->priority)) < 0)
640                         log_warning("SO_PRIORITY failed: %m");
641
642         if (s->receive_buffer > 0) {
643                 int value = (int) s->receive_buffer;
644                 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, sizeof(value)) < 0)
645                         log_warning("SO_RCVBUF failed: %m");
646         }
647
648         if (s->send_buffer > 0) {
649                 int value = (int) s->send_buffer;
650                 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, sizeof(value)) < 0)
651                         log_warning("SO_SNDBUF failed: %m");
652         }
653
654         if (s->mark >= 0)
655                 if (setsockopt(fd, SOL_SOCKET, SO_MARK, &s->mark, sizeof(s->mark)) < 0)
656                         log_warning("SO_MARK failed: %m");
657
658         if (s->ip_tos >= 0)
659                 if (setsockopt(fd, IPPROTO_IP, IP_TOS, &s->ip_tos, sizeof(s->ip_tos)) < 0)
660                         log_warning("IP_TOS failed: %m");
661
662         if (s->ip_ttl >= 0) {
663                 int r, x;
664
665                 r = setsockopt(fd, IPPROTO_IP, IP_TTL, &s->ip_ttl, sizeof(s->ip_ttl));
666
667                 if (socket_ipv6_is_supported())
668                         x = setsockopt(fd, IPPROTO_IPV6, IPV6_UNICAST_HOPS, &s->ip_ttl, sizeof(s->ip_ttl));
669                 else {
670                         x = -1;
671                         errno = EAFNOSUPPORT;
672                 }
673
674                 if (r < 0 && x < 0)
675                         log_warning("IP_TTL/IPV6_UNICAST_HOPS failed: %m");
676         }
677
678         if (s->tcp_congestion)
679                 if (setsockopt(fd, SOL_TCP, TCP_CONGESTION, s->tcp_congestion, strlen(s->tcp_congestion)+1) < 0)
680                         log_warning("TCP_CONGESTION failed: %m");
681 }
682
683 static void socket_apply_fifo_options(Socket *s, int fd) {
684         assert(s);
685         assert(fd >= 0);
686
687         if (s->pipe_size > 0)
688                 if (fcntl(fd, F_SETPIPE_SZ, s->pipe_size) < 0)
689                         log_warning("F_SETPIPE_SZ: %m");
690 }
691
692 static int fifo_address_create(
693                 const char *path,
694                 mode_t directory_mode,
695                 mode_t socket_mode,
696                 int *_fd) {
697
698         int fd = -1, r = 0;
699         struct stat st;
700         mode_t old_mask;
701
702         assert(path);
703         assert(_fd);
704
705         mkdir_parents(path, directory_mode);
706
707         if ((r = label_fifofile_set(path)) < 0)
708                 goto fail;
709
710         /* Enforce the right access mode for the fifo */
711         old_mask = umask(~ socket_mode);
712
713         /* Include the original umask in our mask */
714         umask(~socket_mode | old_mask);
715
716         r = mkfifo(path, socket_mode);
717         umask(old_mask);
718
719         if (r < 0 && errno != EEXIST) {
720                 r = -errno;
721                 goto fail;
722         }
723
724         if ((fd = open(path, O_RDWR|O_CLOEXEC|O_NOCTTY|O_NONBLOCK|O_NOFOLLOW)) < 0) {
725                 r = -errno;
726                 goto fail;
727         }
728
729         label_file_clear();
730
731         if (fstat(fd, &st) < 0) {
732                 r = -errno;
733                 goto fail;
734         }
735
736         if (!S_ISFIFO(st.st_mode) ||
737             (st.st_mode & 0777) != (socket_mode & ~old_mask) ||
738             st.st_uid != getuid() ||
739             st.st_gid != getgid()) {
740
741                 r = -EEXIST;
742                 goto fail;
743         }
744
745         *_fd = fd;
746         return 0;
747
748 fail:
749         label_file_clear();
750
751         if (fd >= 0)
752                 close_nointr_nofail(fd);
753
754         return r;
755 }
756
757 static int special_address_create(
758                 const char *path,
759                 int *_fd) {
760
761         int fd = -1, r = 0;
762         struct stat st;
763
764         assert(path);
765         assert(_fd);
766
767         if ((fd = open(path, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NONBLOCK|O_NOFOLLOW)) < 0) {
768                 r = -errno;
769                 goto fail;
770         }
771
772         if (fstat(fd, &st) < 0) {
773                 r = -errno;
774                 goto fail;
775         }
776
777         /* Check whether this is a /proc, /sys or /dev file or char device */
778         if (!S_ISREG(st.st_mode) && !S_ISCHR(st.st_mode)) {
779                 r = -EEXIST;
780                 goto fail;
781         }
782
783         *_fd = fd;
784         return 0;
785
786 fail:
787         if (fd >= 0)
788                 close_nointr_nofail(fd);
789
790         return r;
791 }
792
793 static int socket_open_fds(Socket *s) {
794         SocketPort *p;
795         int r;
796         char *label = NULL;
797         bool know_label = false;
798
799         assert(s);
800
801         LIST_FOREACH(port, p, s->ports) {
802
803                 if (p->fd >= 0)
804                         continue;
805
806                 if (p->type == SOCKET_SOCKET) {
807
808                         if (!know_label) {
809
810                                 if ((r = socket_instantiate_service(s)) < 0)
811                                         return r;
812
813                                 if (s->service && s->service->exec_command[SERVICE_EXEC_START])
814                                         if ((r = label_get_socket_label_from_exe(s->service->exec_command[SERVICE_EXEC_START]->path, &label)) < 0) {
815                                                 if (r != -EPERM)
816                                                         return r;
817                                         }
818
819                                 know_label = true;
820                         }
821
822                         if ((r = socket_address_listen(
823                                              &p->address,
824                                              s->backlog,
825                                              s->bind_ipv6_only,
826                                              s->bind_to_device,
827                                              s->free_bind,
828                                              s->directory_mode,
829                                              s->socket_mode,
830                                              label,
831                                              &p->fd)) < 0)
832                                 goto rollback;
833
834                         socket_apply_socket_options(s, p->fd);
835
836                 } else  if (p->type == SOCKET_SPECIAL) {
837
838                         if ((r = special_address_create(
839                                              p->path,
840                                              &p->fd)) < 0)
841                                 goto rollback;
842
843                 } else  if (p->type == SOCKET_FIFO) {
844
845                         if ((r = fifo_address_create(
846                                              p->path,
847                                              s->directory_mode,
848                                              s->socket_mode,
849                                              &p->fd)) < 0)
850                                 goto rollback;
851
852                         socket_apply_fifo_options(s, p->fd);
853
854                 } else
855                         assert_not_reached("Unknown port type");
856         }
857
858         label_free(label);
859         return 0;
860
861 rollback:
862         socket_close_fds(s);
863         label_free(label);
864         return r;
865 }
866
867 static void socket_unwatch_fds(Socket *s) {
868         SocketPort *p;
869
870         assert(s);
871
872         LIST_FOREACH(port, p, s->ports) {
873                 if (p->fd < 0)
874                         continue;
875
876                 unit_unwatch_fd(UNIT(s), &p->fd_watch);
877         }
878 }
879
880 static int socket_watch_fds(Socket *s) {
881         SocketPort *p;
882         int r;
883
884         assert(s);
885
886         LIST_FOREACH(port, p, s->ports) {
887                 if (p->fd < 0)
888                         continue;
889
890                 p->fd_watch.socket_accept =
891                         s->accept &&
892                         p->type == SOCKET_SOCKET &&
893                         socket_address_can_accept(&p->address);
894
895                 if ((r = unit_watch_fd(UNIT(s), p->fd, EPOLLIN, &p->fd_watch)) < 0)
896                         goto fail;
897         }
898
899         return 0;
900
901 fail:
902         socket_unwatch_fds(s);
903         return r;
904 }
905
906 static void socket_set_state(Socket *s, SocketState state) {
907         SocketState old_state;
908         assert(s);
909
910         old_state = s->state;
911         s->state = state;
912
913         if (state != SOCKET_START_PRE &&
914             state != SOCKET_START_POST &&
915             state != SOCKET_STOP_PRE &&
916             state != SOCKET_STOP_PRE_SIGTERM &&
917             state != SOCKET_STOP_PRE_SIGKILL &&
918             state != SOCKET_STOP_POST &&
919             state != SOCKET_FINAL_SIGTERM &&
920             state != SOCKET_FINAL_SIGKILL) {
921                 unit_unwatch_timer(UNIT(s), &s->timer_watch);
922                 socket_unwatch_control_pid(s);
923                 s->control_command = NULL;
924                 s->control_command_id = _SOCKET_EXEC_COMMAND_INVALID;
925         }
926
927         if (state != SOCKET_LISTENING)
928                 socket_unwatch_fds(s);
929
930         if (state != SOCKET_START_POST &&
931             state != SOCKET_LISTENING &&
932             state != SOCKET_RUNNING &&
933             state != SOCKET_STOP_PRE &&
934             state != SOCKET_STOP_PRE_SIGTERM &&
935             state != SOCKET_STOP_PRE_SIGKILL)
936                 socket_close_fds(s);
937
938         if (state != old_state)
939                 log_debug("%s changed %s -> %s",
940                           s->meta.id,
941                           socket_state_to_string(old_state),
942                           socket_state_to_string(state));
943
944         unit_notify(UNIT(s), state_translation_table[old_state], state_translation_table[state], true);
945 }
946
947 static int socket_coldplug(Unit *u) {
948         Socket *s = SOCKET(u);
949         int r;
950
951         assert(s);
952         assert(s->state == SOCKET_DEAD);
953
954         if (s->deserialized_state != s->state) {
955
956                 if (s->deserialized_state == SOCKET_START_PRE ||
957                     s->deserialized_state == SOCKET_START_POST ||
958                     s->deserialized_state == SOCKET_STOP_PRE ||
959                     s->deserialized_state == SOCKET_STOP_PRE_SIGTERM ||
960                     s->deserialized_state == SOCKET_STOP_PRE_SIGKILL ||
961                     s->deserialized_state == SOCKET_STOP_POST ||
962                     s->deserialized_state == SOCKET_FINAL_SIGTERM ||
963                     s->deserialized_state == SOCKET_FINAL_SIGKILL) {
964
965                         if (s->control_pid <= 0)
966                                 return -EBADMSG;
967
968                         if ((r = unit_watch_pid(UNIT(s), s->control_pid)) < 0)
969                                 return r;
970
971                         if ((r = unit_watch_timer(UNIT(s), s->timeout_usec, &s->timer_watch)) < 0)
972                                 return r;
973                 }
974
975                 if (s->deserialized_state == SOCKET_START_POST ||
976                     s->deserialized_state == SOCKET_LISTENING ||
977                     s->deserialized_state == SOCKET_RUNNING ||
978                     s->deserialized_state == SOCKET_STOP_PRE ||
979                     s->deserialized_state == SOCKET_STOP_PRE_SIGTERM ||
980                     s->deserialized_state == SOCKET_STOP_PRE_SIGKILL)
981                         if ((r = socket_open_fds(s)) < 0)
982                                 return r;
983
984                 if (s->deserialized_state == SOCKET_LISTENING)
985                         if ((r = socket_watch_fds(s)) < 0)
986                                 return r;
987
988                 socket_set_state(s, s->deserialized_state);
989         }
990
991         return 0;
992 }
993
994 static int socket_spawn(Socket *s, ExecCommand *c, pid_t *_pid) {
995         pid_t pid;
996         int r;
997         char **argv;
998
999         assert(s);
1000         assert(c);
1001         assert(_pid);
1002
1003         if ((r = unit_watch_timer(UNIT(s), s->timeout_usec, &s->timer_watch)) < 0)
1004                 goto fail;
1005
1006         if (!(argv = unit_full_printf_strv(UNIT(s), c->argv))) {
1007                 r = -ENOMEM;
1008                 goto fail;
1009         }
1010
1011         r = exec_spawn(c,
1012                        argv,
1013                        &s->exec_context,
1014                        NULL, 0,
1015                        s->meta.manager->environment,
1016                        true,
1017                        true,
1018                        true,
1019                        s->meta.manager->confirm_spawn,
1020                        s->meta.cgroup_bondings,
1021                        &pid);
1022
1023         strv_free(argv);
1024         if (r < 0)
1025                 goto fail;
1026
1027         if ((r = unit_watch_pid(UNIT(s), pid)) < 0)
1028                 /* FIXME: we need to do something here */
1029                 goto fail;
1030
1031         *_pid = pid;
1032
1033         return 0;
1034
1035 fail:
1036         unit_unwatch_timer(UNIT(s), &s->timer_watch);
1037
1038         return r;
1039 }
1040
1041 static void socket_enter_dead(Socket *s, bool success) {
1042         assert(s);
1043
1044         if (!success)
1045                 s->failure = true;
1046
1047         socket_set_state(s, s->failure ? SOCKET_FAILED : SOCKET_DEAD);
1048 }
1049
1050 static void socket_enter_signal(Socket *s, SocketState state, bool success);
1051
1052 static void socket_enter_stop_post(Socket *s, bool success) {
1053         int r;
1054         assert(s);
1055
1056         if (!success)
1057                 s->failure = true;
1058
1059         socket_unwatch_control_pid(s);
1060
1061         s->control_command_id = SOCKET_EXEC_STOP_POST;
1062
1063         if ((s->control_command = s->exec_command[SOCKET_EXEC_STOP_POST])) {
1064                 if ((r = socket_spawn(s, s->control_command, &s->control_pid)) < 0)
1065                         goto fail;
1066
1067                 socket_set_state(s, SOCKET_STOP_POST);
1068         } else
1069                 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, true);
1070
1071         return;
1072
1073 fail:
1074         log_warning("%s failed to run 'stop-post' task: %s", s->meta.id, strerror(-r));
1075         socket_enter_signal(s, SOCKET_FINAL_SIGTERM, false);
1076 }
1077
1078 static void socket_enter_signal(Socket *s, SocketState state, bool success) {
1079         int r;
1080         Set *pid_set = NULL;
1081         bool wait_for_exit = false;
1082
1083         assert(s);
1084
1085         if (!success)
1086                 s->failure = true;
1087
1088         if (s->exec_context.kill_mode != KILL_NONE) {
1089                 int sig = (state == SOCKET_STOP_PRE_SIGTERM || state == SOCKET_FINAL_SIGTERM) ? s->exec_context.kill_signal : SIGKILL;
1090
1091                 if (s->control_pid > 0) {
1092                         if (kill_and_sigcont(s->control_pid, sig) < 0 && errno != ESRCH)
1093
1094                                 log_warning("Failed to kill control process %li: %m", (long) s->control_pid);
1095                         else
1096                                 wait_for_exit = true;
1097                 }
1098
1099                 if (s->exec_context.kill_mode == KILL_CONTROL_GROUP) {
1100
1101                         if (!(pid_set = set_new(trivial_hash_func, trivial_compare_func))) {
1102                                 r = -ENOMEM;
1103                                 goto fail;
1104                         }
1105
1106                         /* Exclude the control pid from being killed via the cgroup */
1107                         if (s->control_pid > 0)
1108                                 if ((r = set_put(pid_set, LONG_TO_PTR(s->control_pid))) < 0)
1109                                         goto fail;
1110
1111                         if ((r = cgroup_bonding_kill_list(s->meta.cgroup_bondings, sig, true, pid_set)) < 0) {
1112                                 if (r != -EAGAIN && r != -ESRCH && r != -ENOENT)
1113                                         log_warning("Failed to kill control group: %s", strerror(-r));
1114                         } else if (r > 0)
1115                                 wait_for_exit = true;
1116
1117                         set_free(pid_set);
1118                         pid_set = NULL;
1119                 }
1120         }
1121
1122         if (wait_for_exit) {
1123                 if ((r = unit_watch_timer(UNIT(s), s->timeout_usec, &s->timer_watch)) < 0)
1124                         goto fail;
1125
1126                 socket_set_state(s, state);
1127         } else if (state == SOCKET_STOP_PRE_SIGTERM || state == SOCKET_STOP_PRE_SIGKILL)
1128                 socket_enter_stop_post(s, true);
1129         else
1130                 socket_enter_dead(s, true);
1131
1132         return;
1133
1134 fail:
1135         log_warning("%s failed to kill processes: %s", s->meta.id, strerror(-r));
1136
1137         if (state == SOCKET_STOP_PRE_SIGTERM || state == SOCKET_STOP_PRE_SIGKILL)
1138                 socket_enter_stop_post(s, false);
1139         else
1140                 socket_enter_dead(s, false);
1141
1142         if (pid_set)
1143                 set_free(pid_set);
1144 }
1145
1146 static void socket_enter_stop_pre(Socket *s, bool success) {
1147         int r;
1148         assert(s);
1149
1150         if (!success)
1151                 s->failure = true;
1152
1153         socket_unwatch_control_pid(s);
1154
1155         s->control_command_id = SOCKET_EXEC_STOP_PRE;
1156
1157         if ((s->control_command = s->exec_command[SOCKET_EXEC_STOP_PRE])) {
1158                 if ((r = socket_spawn(s, s->control_command, &s->control_pid)) < 0)
1159                         goto fail;
1160
1161                 socket_set_state(s, SOCKET_STOP_PRE);
1162         } else
1163                 socket_enter_stop_post(s, true);
1164
1165         return;
1166
1167 fail:
1168         log_warning("%s failed to run 'stop-pre' task: %s", s->meta.id, strerror(-r));
1169         socket_enter_stop_post(s, false);
1170 }
1171
1172 static void socket_enter_listening(Socket *s) {
1173         int r;
1174         assert(s);
1175
1176         if ((r = socket_watch_fds(s)) < 0) {
1177                 log_warning("%s failed to watch sockets: %s", s->meta.id, strerror(-r));
1178                 goto fail;
1179         }
1180
1181         socket_set_state(s, SOCKET_LISTENING);
1182         return;
1183
1184 fail:
1185         socket_enter_stop_pre(s, false);
1186 }
1187
1188 static void socket_enter_start_post(Socket *s) {
1189         int r;
1190         assert(s);
1191
1192         if ((r = socket_open_fds(s)) < 0) {
1193                 log_warning("%s failed to listen on sockets: %s", s->meta.id, strerror(-r));
1194                 goto fail;
1195         }
1196
1197         socket_unwatch_control_pid(s);
1198
1199         s->control_command_id = SOCKET_EXEC_START_POST;
1200
1201         if ((s->control_command = s->exec_command[SOCKET_EXEC_START_POST])) {
1202                 if ((r = socket_spawn(s, s->control_command, &s->control_pid)) < 0) {
1203                         log_warning("%s failed to run 'start-post' task: %s", s->meta.id, strerror(-r));
1204                         goto fail;
1205                 }
1206
1207                 socket_set_state(s, SOCKET_START_POST);
1208         } else
1209                 socket_enter_listening(s);
1210
1211         return;
1212
1213 fail:
1214         socket_enter_stop_pre(s, false);
1215 }
1216
1217 static void socket_enter_start_pre(Socket *s) {
1218         int r;
1219         assert(s);
1220
1221         socket_unwatch_control_pid(s);
1222
1223         s->control_command_id = SOCKET_EXEC_START_PRE;
1224
1225         if ((s->control_command = s->exec_command[SOCKET_EXEC_START_PRE])) {
1226                 if ((r = socket_spawn(s, s->control_command, &s->control_pid)) < 0)
1227                         goto fail;
1228
1229                 socket_set_state(s, SOCKET_START_PRE);
1230         } else
1231                 socket_enter_start_post(s);
1232
1233         return;
1234
1235 fail:
1236         log_warning("%s failed to run 'start-pre' task: %s", s->meta.id, strerror(-r));
1237         socket_enter_dead(s, false);
1238 }
1239
1240 static void socket_enter_running(Socket *s, int cfd) {
1241         int r;
1242         DBusError error;
1243
1244         assert(s);
1245         dbus_error_init(&error);
1246
1247         /* We don't take connections anymore if we are supposed to
1248          * shut down anyway */
1249         if (unit_pending_inactive(UNIT(s))) {
1250                 log_debug("Suppressing connection request on %s since unit stop is scheduled.", s->meta.id);
1251
1252                 if (cfd >= 0)
1253                         close_nointr_nofail(cfd);
1254                 else  {
1255                         /* Flush all sockets by closing and reopening them */
1256                         socket_close_fds(s);
1257
1258                         if ((r = socket_watch_fds(s)) < 0) {
1259                                 log_warning("%s failed to watch sockets: %s", s->meta.id, strerror(-r));
1260                                 socket_enter_stop_pre(s, false);
1261                         }
1262                 }
1263
1264                 return;
1265         }
1266
1267         if (cfd < 0) {
1268                 bool pending = false;
1269                 Meta *i;
1270
1271                 /* If there's already a start pending don't bother to
1272                  * do anything */
1273                 LIST_FOREACH(units_per_type, i, s->meta.manager->units_per_type[UNIT_SERVICE]) {
1274                         Service *service = (Service *) i;
1275
1276                         if (!set_get(service->configured_sockets, s))
1277                                 continue;
1278
1279                         if (!unit_pending_active(UNIT(service)))
1280                                 continue;
1281
1282                         pending = true;
1283                         break;
1284                 }
1285
1286                 if (!pending)
1287                         if ((r = manager_add_job(s->meta.manager, JOB_START, UNIT(s->service), JOB_REPLACE, true, &error, NULL)) < 0)
1288                                 goto fail;
1289
1290                 socket_set_state(s, SOCKET_RUNNING);
1291         } else {
1292                 char *prefix, *instance = NULL, *name;
1293                 Service *service;
1294
1295                 if (s->n_connections >= s->max_connections) {
1296                         log_warning("Too many incoming connections (%u)", s->n_connections);
1297                         close_nointr_nofail(cfd);
1298                         return;
1299                 }
1300
1301                 if ((r = socket_instantiate_service(s)) < 0)
1302                         goto fail;
1303
1304                 if ((r = instance_from_socket(cfd, s->n_accepted, &instance)) < 0)
1305                         goto fail;
1306
1307                 if (!(prefix = unit_name_to_prefix(s->meta.id))) {
1308                         free(instance);
1309                         r = -ENOMEM;
1310                         goto fail;
1311                 }
1312
1313                 name = unit_name_build(prefix, instance, ".service");
1314                 free(prefix);
1315                 free(instance);
1316
1317                 if (!name) {
1318                         r = -ENOMEM;
1319                         goto fail;
1320                 }
1321
1322                 if ((r = unit_add_name(UNIT(s->service), name)) < 0) {
1323                         free(name);
1324                         goto fail;
1325                 }
1326
1327                 service = s->service;
1328                 s->service = NULL;
1329                 s->n_accepted ++;
1330
1331                 service->meta.no_gc = false;
1332
1333                 unit_choose_id(UNIT(service), name);
1334                 free(name);
1335
1336                 if ((r = service_set_socket_fd(service, cfd, s)) < 0)
1337                         goto fail;
1338
1339                 cfd = -1;
1340                 s->n_connections ++;
1341
1342                 if ((r = manager_add_job(s->meta.manager, JOB_START, UNIT(service), JOB_REPLACE, true, &error, NULL)) < 0)
1343                         goto fail;
1344
1345                 /* Notify clients about changed counters */
1346                 unit_add_to_dbus_queue(UNIT(s));
1347         }
1348
1349         return;
1350
1351 fail:
1352         log_warning("%s failed to queue socket startup job: %s", s->meta.id, bus_error(&error, r));
1353         socket_enter_stop_pre(s, false);
1354
1355         if (cfd >= 0)
1356                 close_nointr_nofail(cfd);
1357
1358         dbus_error_free(&error);
1359 }
1360
1361 static void socket_run_next(Socket *s, bool success) {
1362         int r;
1363
1364         assert(s);
1365         assert(s->control_command);
1366         assert(s->control_command->command_next);
1367
1368         if (!success)
1369                 s->failure = true;
1370
1371         socket_unwatch_control_pid(s);
1372
1373         s->control_command = s->control_command->command_next;
1374
1375         if ((r = socket_spawn(s, s->control_command, &s->control_pid)) < 0)
1376                 goto fail;
1377
1378         return;
1379
1380 fail:
1381         log_warning("%s failed to run next task: %s", s->meta.id, strerror(-r));
1382
1383         if (s->state == SOCKET_START_POST)
1384                 socket_enter_stop_pre(s, false);
1385         else if (s->state == SOCKET_STOP_POST)
1386                 socket_enter_dead(s, false);
1387         else
1388                 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, false);
1389 }
1390
1391 static int socket_start(Unit *u) {
1392         Socket *s = SOCKET(u);
1393
1394         assert(s);
1395
1396         /* We cannot fulfill this request right now, try again later
1397          * please! */
1398         if (s->state == SOCKET_STOP_PRE ||
1399             s->state == SOCKET_STOP_PRE_SIGKILL ||
1400             s->state == SOCKET_STOP_PRE_SIGTERM ||
1401             s->state == SOCKET_STOP_POST ||
1402             s->state == SOCKET_FINAL_SIGTERM ||
1403             s->state == SOCKET_FINAL_SIGKILL)
1404                 return -EAGAIN;
1405
1406         if (s->state == SOCKET_START_PRE ||
1407             s->state == SOCKET_START_POST)
1408                 return 0;
1409
1410         /* Cannot run this without the service being around */
1411         if (s->service) {
1412                 if (s->service->meta.load_state != UNIT_LOADED) {
1413                         log_error("Socket service %s not loaded, refusing.", s->service->meta.id);
1414                         return -ENOENT;
1415                 }
1416
1417                 /* If the service is already active we cannot start the
1418                  * socket */
1419                 if (s->service->state != SERVICE_DEAD &&
1420                     s->service->state != SERVICE_FAILED &&
1421                     s->service->state != SERVICE_AUTO_RESTART) {
1422                         log_error("Socket service %s already active, refusing.", s->service->meta.id);
1423                         return -EBUSY;
1424                 }
1425
1426 #ifdef HAVE_SYSV_COMPAT
1427                 if (s->service->sysv_path) {
1428                         log_error("Using SysV services for socket activation is not supported. Refusing.");
1429                         return -ENOENT;
1430                 }
1431 #endif
1432         }
1433
1434         assert(s->state == SOCKET_DEAD || s->state == SOCKET_FAILED);
1435
1436         s->failure = false;
1437         socket_enter_start_pre(s);
1438         return 0;
1439 }
1440
1441 static int socket_stop(Unit *u) {
1442         Socket *s = SOCKET(u);
1443
1444         assert(s);
1445
1446         /* Already on it */
1447         if (s->state == SOCKET_STOP_PRE ||
1448             s->state == SOCKET_STOP_PRE_SIGTERM ||
1449             s->state == SOCKET_STOP_PRE_SIGKILL ||
1450             s->state == SOCKET_STOP_POST ||
1451             s->state == SOCKET_FINAL_SIGTERM ||
1452             s->state == SOCKET_FINAL_SIGKILL)
1453                 return 0;
1454
1455         /* If there's already something running we go directly into
1456          * kill mode. */
1457         if (s->state == SOCKET_START_PRE ||
1458             s->state == SOCKET_START_POST) {
1459                 socket_enter_signal(s, SOCKET_STOP_PRE_SIGTERM, true);
1460                 return -EAGAIN;
1461         }
1462
1463         assert(s->state == SOCKET_LISTENING || s->state == SOCKET_RUNNING);
1464
1465         socket_enter_stop_pre(s, true);
1466         return 0;
1467 }
1468
1469 static int socket_serialize(Unit *u, FILE *f, FDSet *fds) {
1470         Socket *s = SOCKET(u);
1471         SocketPort *p;
1472         int r;
1473
1474         assert(u);
1475         assert(f);
1476         assert(fds);
1477
1478         unit_serialize_item(u, f, "state", socket_state_to_string(s->state));
1479         unit_serialize_item(u, f, "failure", yes_no(s->failure));
1480         unit_serialize_item_format(u, f, "n-accepted", "%u", s->n_accepted);
1481
1482         if (s->control_pid > 0)
1483                 unit_serialize_item_format(u, f, "control-pid", "%lu", (unsigned long) s->control_pid);
1484
1485         if (s->control_command_id >= 0)
1486                 unit_serialize_item(u, f, "control-command", socket_exec_command_to_string(s->control_command_id));
1487
1488         LIST_FOREACH(port, p, s->ports) {
1489                 int copy;
1490
1491                 if (p->fd < 0)
1492                         continue;
1493
1494                 if ((copy = fdset_put_dup(fds, p->fd)) < 0)
1495                         return copy;
1496
1497                 if (p->type == SOCKET_SOCKET) {
1498                         char *t;
1499
1500                         if ((r = socket_address_print(&p->address, &t)) < 0)
1501                                 return r;
1502
1503                         if (socket_address_family(&p->address) == AF_NETLINK)
1504                                 unit_serialize_item_format(u, f, "netlink", "%i %s", copy, t);
1505                         else
1506                                 unit_serialize_item_format(u, f, "socket", "%i %i %s", copy, p->address.type, t);
1507                         free(t);
1508                 } else if (p->type == SOCKET_SPECIAL)
1509                         unit_serialize_item_format(u, f, "special", "%i %s", copy, p->path);
1510                 else {
1511                         assert(p->type == SOCKET_FIFO);
1512                         unit_serialize_item_format(u, f, "fifo", "%i %s", copy, p->path);
1513                 }
1514         }
1515
1516         return 0;
1517 }
1518
1519 static int socket_deserialize_item(Unit *u, const char *key, const char *value, FDSet *fds) {
1520         Socket *s = SOCKET(u);
1521
1522         assert(u);
1523         assert(key);
1524         assert(value);
1525         assert(fds);
1526
1527         if (streq(key, "state")) {
1528                 SocketState state;
1529
1530                 if ((state = socket_state_from_string(value)) < 0)
1531                         log_debug("Failed to parse state value %s", value);
1532                 else
1533                         s->deserialized_state = state;
1534         } else if (streq(key, "failure")) {
1535                 int b;
1536
1537                 if ((b = parse_boolean(value)) < 0)
1538                         log_debug("Failed to parse failure value %s", value);
1539                 else
1540                         s->failure = b || s->failure;
1541
1542         } else if (streq(key, "n-accepted")) {
1543                 unsigned k;
1544
1545                 if (safe_atou(value, &k) < 0)
1546                         log_debug("Failed to parse n-accepted value %s", value);
1547                 else
1548                         s->n_accepted += k;
1549         } else if (streq(key, "control-pid")) {
1550                 pid_t pid;
1551
1552                 if (parse_pid(value, &pid) < 0)
1553                         log_debug("Failed to parse control-pid value %s", value);
1554                 else
1555                         s->control_pid = pid;
1556         } else if (streq(key, "control-command")) {
1557                 SocketExecCommand id;
1558
1559                 if ((id = socket_exec_command_from_string(value)) < 0)
1560                         log_debug("Failed to parse exec-command value %s", value);
1561                 else {
1562                         s->control_command_id = id;
1563                         s->control_command = s->exec_command[id];
1564                 }
1565         } else if (streq(key, "fifo")) {
1566                 int fd, skip = 0;
1567                 SocketPort *p;
1568
1569                 if (sscanf(value, "%i %n", &fd, &skip) < 1 || fd < 0 || !fdset_contains(fds, fd))
1570                         log_debug("Failed to parse fifo value %s", value);
1571                 else {
1572
1573                         LIST_FOREACH(port, p, s->ports)
1574                                 if (p->type == SOCKET_FIFO &&
1575                                     streq_ptr(p->path, value+skip))
1576                                         break;
1577
1578                         if (p) {
1579                                 if (p->fd >= 0)
1580                                         close_nointr_nofail(p->fd);
1581                                 p->fd = fdset_remove(fds, fd);
1582                         }
1583                 }
1584
1585         } else if (streq(key, "special")) {
1586                 int fd, skip = 0;
1587                 SocketPort *p;
1588
1589                 if (sscanf(value, "%i %n", &fd, &skip) < 1 || fd < 0 || !fdset_contains(fds, fd))
1590                         log_debug("Failed to parse special value %s", value);
1591                 else {
1592
1593                         LIST_FOREACH(port, p, s->ports)
1594                                 if (p->type == SOCKET_SPECIAL &&
1595                                     streq_ptr(p->path, value+skip))
1596                                         break;
1597
1598                         if (p) {
1599                                 if (p->fd >= 0)
1600                                         close_nointr_nofail(p->fd);
1601                                 p->fd = fdset_remove(fds, fd);
1602                         }
1603                 }
1604
1605         } else if (streq(key, "socket")) {
1606                 int fd, type, skip = 0;
1607                 SocketPort *p;
1608
1609                 if (sscanf(value, "%i %i %n", &fd, &type, &skip) < 2 || fd < 0 || type < 0 || !fdset_contains(fds, fd))
1610                         log_debug("Failed to parse socket value %s", value);
1611                 else {
1612
1613                         LIST_FOREACH(port, p, s->ports)
1614                                 if (socket_address_is(&p->address, value+skip, type))
1615                                         break;
1616
1617                         if (p) {
1618                                 if (p->fd >= 0)
1619                                         close_nointr_nofail(p->fd);
1620                                 p->fd = fdset_remove(fds, fd);
1621                         }
1622                 }
1623
1624         } else if (streq(key, "netlink")) {
1625                 int fd, skip = 0;
1626                 SocketPort *p;
1627
1628                 if (sscanf(value, "%i %n", &fd, &skip) < 1 || fd < 0 || !fdset_contains(fds, fd))
1629                         log_debug("Failed to parse socket value %s", value);
1630                 else {
1631
1632                         LIST_FOREACH(port, p, s->ports)
1633                                 if (socket_address_is_netlink(&p->address, value+skip))
1634                                         break;
1635
1636                         if (p) {
1637                                 if (p->fd >= 0)
1638                                         close_nointr_nofail(p->fd);
1639                                 p->fd = fdset_remove(fds, fd);
1640                         }
1641                 }
1642
1643         } else
1644                 log_debug("Unknown serialization key '%s'", key);
1645
1646         return 0;
1647 }
1648
1649 static UnitActiveState socket_active_state(Unit *u) {
1650         assert(u);
1651
1652         return state_translation_table[SOCKET(u)->state];
1653 }
1654
1655 static const char *socket_sub_state_to_string(Unit *u) {
1656         assert(u);
1657
1658         return socket_state_to_string(SOCKET(u)->state);
1659 }
1660
1661 static bool socket_check_gc(Unit *u) {
1662         Socket *s = SOCKET(u);
1663
1664         assert(u);
1665
1666         return s->n_connections > 0;
1667 }
1668
1669 static void socket_fd_event(Unit *u, int fd, uint32_t events, Watch *w) {
1670         Socket *s = SOCKET(u);
1671         int cfd = -1;
1672
1673         assert(s);
1674         assert(fd >= 0);
1675
1676         if (s->state != SOCKET_LISTENING)
1677                 return;
1678
1679         log_debug("Incoming traffic on %s", u->meta.id);
1680
1681         if (events != EPOLLIN) {
1682
1683                 if (events & EPOLLHUP)
1684                         log_error("%s: Got POLLHUP on a listening socket. The service probably invoked shutdown() on it, and should better not do that.", u->meta.id);
1685                 else
1686                         log_error("%s: Got unexpected poll event (0x%x) on socket.", u->meta.id, events);
1687
1688                 goto fail;
1689         }
1690
1691         if (w->socket_accept) {
1692                 for (;;) {
1693
1694                         if ((cfd = accept4(fd, NULL, NULL, SOCK_NONBLOCK)) < 0) {
1695
1696                                 if (errno == EINTR)
1697                                         continue;
1698
1699                                 log_error("Failed to accept socket: %m");
1700                                 goto fail;
1701                         }
1702
1703                         break;
1704                 }
1705
1706                 socket_apply_socket_options(s, cfd);
1707         }
1708
1709         socket_enter_running(s, cfd);
1710         return;
1711
1712 fail:
1713         socket_enter_stop_pre(s, false);
1714 }
1715
1716 static void socket_sigchld_event(Unit *u, pid_t pid, int code, int status) {
1717         Socket *s = SOCKET(u);
1718         bool success;
1719
1720         assert(s);
1721         assert(pid >= 0);
1722
1723         if (pid != s->control_pid)
1724                 return;
1725
1726         s->control_pid = 0;
1727
1728         success = is_clean_exit(code, status);
1729
1730         if (s->control_command) {
1731                 exec_status_exit(&s->control_command->exec_status, pid, code, status, s->exec_context.utmp_id);
1732
1733                 if (s->control_command->ignore)
1734                         success = true;
1735         }
1736
1737         log_full(success ? LOG_DEBUG : LOG_NOTICE,
1738                  "%s control process exited, code=%s status=%i", u->meta.id, sigchld_code_to_string(code), status);
1739         s->failure = s->failure || !success;
1740
1741         if (s->control_command && s->control_command->command_next && success) {
1742                 log_debug("%s running next command for state %s", u->meta.id, socket_state_to_string(s->state));
1743                 socket_run_next(s, success);
1744         } else {
1745                 s->control_command = NULL;
1746                 s->control_command_id = _SOCKET_EXEC_COMMAND_INVALID;
1747
1748                 /* No further commands for this step, so let's figure
1749                  * out what to do next */
1750
1751                 log_debug("%s got final SIGCHLD for state %s", u->meta.id, socket_state_to_string(s->state));
1752
1753                 switch (s->state) {
1754
1755                 case SOCKET_START_PRE:
1756                         if (success)
1757                                 socket_enter_start_post(s);
1758                         else
1759                                 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, false);
1760                         break;
1761
1762                 case SOCKET_START_POST:
1763                         if (success)
1764                                 socket_enter_listening(s);
1765                         else
1766                                 socket_enter_stop_pre(s, false);
1767                         break;
1768
1769                 case SOCKET_STOP_PRE:
1770                 case SOCKET_STOP_PRE_SIGTERM:
1771                 case SOCKET_STOP_PRE_SIGKILL:
1772                         socket_enter_stop_post(s, success);
1773                         break;
1774
1775                 case SOCKET_STOP_POST:
1776                 case SOCKET_FINAL_SIGTERM:
1777                 case SOCKET_FINAL_SIGKILL:
1778                         socket_enter_dead(s, success);
1779                         break;
1780
1781                 default:
1782                         assert_not_reached("Uh, control process died at wrong time.");
1783                 }
1784         }
1785
1786         /* Notify clients about changed exit status */
1787         unit_add_to_dbus_queue(u);
1788 }
1789
1790 static void socket_timer_event(Unit *u, uint64_t elapsed, Watch *w) {
1791         Socket *s = SOCKET(u);
1792
1793         assert(s);
1794         assert(elapsed == 1);
1795         assert(w == &s->timer_watch);
1796
1797         switch (s->state) {
1798
1799         case SOCKET_START_PRE:
1800                 log_warning("%s starting timed out. Terminating.", u->meta.id);
1801                 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, false);
1802                 break;
1803
1804         case SOCKET_START_POST:
1805                 log_warning("%s starting timed out. Stopping.", u->meta.id);
1806                 socket_enter_stop_pre(s, false);
1807                 break;
1808
1809         case SOCKET_STOP_PRE:
1810                 log_warning("%s stopping timed out. Terminating.", u->meta.id);
1811                 socket_enter_signal(s, SOCKET_STOP_PRE_SIGTERM, false);
1812                 break;
1813
1814         case SOCKET_STOP_PRE_SIGTERM:
1815                 if (s->exec_context.send_sigkill) {
1816                         log_warning("%s stopping timed out. Killing.", u->meta.id);
1817                         socket_enter_signal(s, SOCKET_STOP_PRE_SIGKILL, false);
1818                 } else {
1819                         log_warning("%s stopping timed out. Skipping SIGKILL. Ignoring.", u->meta.id);
1820                         socket_enter_stop_post(s, false);
1821                 }
1822                 break;
1823
1824         case SOCKET_STOP_PRE_SIGKILL:
1825                 log_warning("%s still around after SIGKILL. Ignoring.", u->meta.id);
1826                 socket_enter_stop_post(s, false);
1827                 break;
1828
1829         case SOCKET_STOP_POST:
1830                 log_warning("%s stopping timed out (2). Terminating.", u->meta.id);
1831                 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, false);
1832                 break;
1833
1834         case SOCKET_FINAL_SIGTERM:
1835                 if (s->exec_context.send_sigkill) {
1836                         log_warning("%s stopping timed out (2). Killing.", u->meta.id);
1837                         socket_enter_signal(s, SOCKET_FINAL_SIGKILL, false);
1838                 } else {
1839                         log_warning("%s stopping timed out (2). Skipping SIGKILL. Ignoring.", u->meta.id);
1840                         socket_enter_dead(s, false);
1841                 }
1842                 break;
1843
1844         case SOCKET_FINAL_SIGKILL:
1845                 log_warning("%s still around after SIGKILL (2). Entering failed mode.", u->meta.id);
1846                 socket_enter_dead(s, false);
1847                 break;
1848
1849         default:
1850                 assert_not_reached("Timeout at wrong time.");
1851         }
1852 }
1853
1854 int socket_collect_fds(Socket *s, int **fds, unsigned *n_fds) {
1855         int *rfds;
1856         unsigned rn_fds, k;
1857         SocketPort *p;
1858
1859         assert(s);
1860         assert(fds);
1861         assert(n_fds);
1862
1863         /* Called from the service code for requesting our fds */
1864
1865         rn_fds = 0;
1866         LIST_FOREACH(port, p, s->ports)
1867                 if (p->fd >= 0)
1868                         rn_fds++;
1869
1870         if (!(rfds = new(int, rn_fds)))
1871                 return -ENOMEM;
1872
1873         k = 0;
1874         LIST_FOREACH(port, p, s->ports)
1875                 if (p->fd >= 0)
1876                         rfds[k++] = p->fd;
1877
1878         assert(k == rn_fds);
1879
1880         *fds = rfds;
1881         *n_fds = rn_fds;
1882
1883         return 0;
1884 }
1885
1886 void socket_notify_service_dead(Socket *s) {
1887         assert(s);
1888
1889         /* The service is dead. Dang!
1890          *
1891          * This is strictly for one-instance-for-all-connections
1892          * services. */
1893
1894         if (s->state == SOCKET_RUNNING) {
1895                 log_debug("%s got notified about service death.", s->meta.id);
1896                 socket_enter_listening(s);
1897         }
1898 }
1899
1900 void socket_connection_unref(Socket *s) {
1901         assert(s);
1902
1903         /* The service is dead. Yay!
1904          *
1905          * This is strictly for one-instance-per-connection
1906          * services. */
1907
1908         assert(s->n_connections > 0);
1909         s->n_connections--;
1910
1911         log_debug("%s: One connection closed, %u left.", s->meta.id, s->n_connections);
1912 }
1913
1914 static void socket_reset_failed(Unit *u) {
1915         Socket *s = SOCKET(u);
1916
1917         assert(s);
1918
1919         if (s->state == SOCKET_FAILED)
1920                 socket_set_state(s, SOCKET_DEAD);
1921
1922         s->failure = false;
1923 }
1924
1925 static int socket_kill(Unit *u, KillWho who, KillMode mode, int signo, DBusError *error) {
1926         Socket *s = SOCKET(u);
1927         int r = 0;
1928         Set *pid_set = NULL;
1929
1930         assert(s);
1931
1932         if (who == KILL_MAIN) {
1933                 dbus_set_error(error, BUS_ERROR_NO_SUCH_PROCESS, "Socket units have no main processes");
1934                 return -EINVAL;
1935         }
1936
1937         if (s->control_pid <= 0 && who == KILL_CONTROL) {
1938                 dbus_set_error(error, BUS_ERROR_NO_SUCH_PROCESS, "No control process to kill");
1939                 return -ENOENT;
1940         }
1941
1942         if (s->control_pid > 0)
1943                 if (kill(s->control_pid, signo) < 0)
1944                         r = -errno;
1945
1946         if (mode == KILL_CONTROL_GROUP) {
1947                 int q;
1948
1949                 if (!(pid_set = set_new(trivial_hash_func, trivial_compare_func)))
1950                         return -ENOMEM;
1951
1952                 /* Exclude the control pid from being killed via the cgroup */
1953                 if (s->control_pid > 0)
1954                         if ((q = set_put(pid_set, LONG_TO_PTR(s->control_pid))) < 0) {
1955                                 r = q;
1956                                 goto finish;
1957                         }
1958
1959                 if ((q = cgroup_bonding_kill_list(s->meta.cgroup_bondings, signo, false, pid_set)) < 0)
1960                         if (r != -EAGAIN && r != -ESRCH && r != -ENOENT)
1961                                 r = q;
1962         }
1963
1964 finish:
1965         if (pid_set)
1966                 set_free(pid_set);
1967
1968         return r;
1969 }
1970
1971 static const char* const socket_state_table[_SOCKET_STATE_MAX] = {
1972         [SOCKET_DEAD] = "dead",
1973         [SOCKET_START_PRE] = "start-pre",
1974         [SOCKET_START_POST] = "start-post",
1975         [SOCKET_LISTENING] = "listening",
1976         [SOCKET_RUNNING] = "running",
1977         [SOCKET_STOP_PRE] = "stop-pre",
1978         [SOCKET_STOP_PRE_SIGTERM] = "stop-pre-sigterm",
1979         [SOCKET_STOP_PRE_SIGKILL] = "stop-pre-sigkill",
1980         [SOCKET_STOP_POST] = "stop-post",
1981         [SOCKET_FINAL_SIGTERM] = "final-sigterm",
1982         [SOCKET_FINAL_SIGKILL] = "final-sigkill",
1983         [SOCKET_FAILED] = "failed"
1984 };
1985
1986 DEFINE_STRING_TABLE_LOOKUP(socket_state, SocketState);
1987
1988 static const char* const socket_exec_command_table[_SOCKET_EXEC_COMMAND_MAX] = {
1989         [SOCKET_EXEC_START_PRE] = "StartPre",
1990         [SOCKET_EXEC_START_POST] = "StartPost",
1991         [SOCKET_EXEC_STOP_PRE] = "StopPre",
1992         [SOCKET_EXEC_STOP_POST] = "StopPost"
1993 };
1994
1995 DEFINE_STRING_TABLE_LOOKUP(socket_exec_command, SocketExecCommand);
1996
1997 const UnitVTable socket_vtable = {
1998         .suffix = ".socket",
1999
2000         .init = socket_init,
2001         .done = socket_done,
2002         .load = socket_load,
2003
2004         .kill = socket_kill,
2005
2006         .coldplug = socket_coldplug,
2007
2008         .dump = socket_dump,
2009
2010         .start = socket_start,
2011         .stop = socket_stop,
2012
2013         .serialize = socket_serialize,
2014         .deserialize_item = socket_deserialize_item,
2015
2016         .active_state = socket_active_state,
2017         .sub_state_to_string = socket_sub_state_to_string,
2018
2019         .check_gc = socket_check_gc,
2020
2021         .fd_event = socket_fd_event,
2022         .sigchld_event = socket_sigchld_event,
2023         .timer_event = socket_timer_event,
2024
2025         .reset_failed = socket_reset_failed,
2026
2027         .bus_interface = "org.freedesktop.systemd1.Socket",
2028         .bus_message_handler = bus_socket_message_handler,
2029         .bus_invalidating_properties =  bus_socket_invalidating_properties
2030 };