chiark / gitweb /
socket: only add dependency on kmsg socket to socket units which have any kind of...
[elogind.git] / src / socket.c
1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
2
3 /***
4   This file is part of systemd.
5
6   Copyright 2010 Lennart Poettering
7
8   systemd is free software; you can redistribute it and/or modify it
9   under the terms of the GNU General Public License as published by
10   the Free Software Foundation; either version 2 of the License, or
11   (at your option) any later version.
12
13   systemd is distributed in the hope that it will be useful, but
14   WITHOUT ANY WARRANTY; without even the implied warranty of
15   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16   General Public License for more details.
17
18   You should have received a copy of the GNU General Public License
19   along with systemd; If not, see <http://www.gnu.org/licenses/>.
20 ***/
21
22 #include <sys/types.h>
23 #include <sys/stat.h>
24 #include <unistd.h>
25 #include <errno.h>
26 #include <fcntl.h>
27 #include <sys/epoll.h>
28 #include <signal.h>
29 #include <arpa/inet.h>
30 #include <mqueue.h>
31
32 #include "unit.h"
33 #include "socket.h"
34 #include "netinet/tcp.h"
35 #include "log.h"
36 #include "load-dropin.h"
37 #include "load-fragment.h"
38 #include "strv.h"
39 #include "unit-name.h"
40 #include "dbus-socket.h"
41 #include "missing.h"
42 #include "special.h"
43 #include "bus-errors.h"
44 #include "label.h"
45 #include "exit-status.h"
46 #include "def.h"
47
48 static const UnitActiveState state_translation_table[_SOCKET_STATE_MAX] = {
49         [SOCKET_DEAD] = UNIT_INACTIVE,
50         [SOCKET_START_PRE] = UNIT_ACTIVATING,
51         [SOCKET_START_POST] = UNIT_ACTIVATING,
52         [SOCKET_LISTENING] = UNIT_ACTIVE,
53         [SOCKET_RUNNING] = UNIT_ACTIVE,
54         [SOCKET_STOP_PRE] = UNIT_DEACTIVATING,
55         [SOCKET_STOP_PRE_SIGTERM] = UNIT_DEACTIVATING,
56         [SOCKET_STOP_PRE_SIGKILL] = UNIT_DEACTIVATING,
57         [SOCKET_STOP_POST] = UNIT_DEACTIVATING,
58         [SOCKET_FINAL_SIGTERM] = UNIT_DEACTIVATING,
59         [SOCKET_FINAL_SIGKILL] = UNIT_DEACTIVATING,
60         [SOCKET_FAILED] = UNIT_FAILED
61 };
62
63 static void socket_init(Unit *u) {
64         Socket *s = SOCKET(u);
65
66         assert(u);
67         assert(u->meta.load_state == UNIT_STUB);
68
69         s->backlog = SOMAXCONN;
70         s->timeout_usec = DEFAULT_TIMEOUT_USEC;
71         s->directory_mode = 0755;
72         s->socket_mode = 0666;
73
74         s->max_connections = 64;
75
76         s->priority = -1;
77         s->ip_tos = -1;
78         s->ip_ttl = -1;
79         s->mark = -1;
80
81         exec_context_init(&s->exec_context);
82         s->exec_context.std_output = u->meta.manager->default_std_output;
83         s->exec_context.std_error = u->meta.manager->default_std_error;
84
85         s->control_command_id = _SOCKET_EXEC_COMMAND_INVALID;
86 }
87
88 static void socket_unwatch_control_pid(Socket *s) {
89         assert(s);
90
91         if (s->control_pid <= 0)
92                 return;
93
94         unit_unwatch_pid(UNIT(s), s->control_pid);
95         s->control_pid = 0;
96 }
97
98 static void socket_done(Unit *u) {
99         Socket *s = SOCKET(u);
100         SocketPort *p;
101         Meta *i;
102
103         assert(s);
104
105         while ((p = s->ports)) {
106                 LIST_REMOVE(SocketPort, port, s->ports, p);
107
108                 if (p->fd >= 0) {
109                         unit_unwatch_fd(UNIT(s), &p->fd_watch);
110                         close_nointr_nofail(p->fd);
111                 }
112
113                 free(p->path);
114                 free(p);
115         }
116
117         exec_context_done(&s->exec_context);
118         exec_command_free_array(s->exec_command, _SOCKET_EXEC_COMMAND_MAX);
119         s->control_command = NULL;
120
121         socket_unwatch_control_pid(s);
122
123         s->service = NULL;
124
125         free(s->tcp_congestion);
126         s->tcp_congestion = NULL;
127
128         free(s->bind_to_device);
129         s->bind_to_device = NULL;
130
131         unit_unwatch_timer(u, &s->timer_watch);
132
133         /* Make sure no service instance refers to us anymore. */
134         LIST_FOREACH(units_by_type, i, u->meta.manager->units_by_type[UNIT_SERVICE]) {
135                 Service *service = (Service *) i;
136
137                 if (service->accept_socket == s)
138                         service->accept_socket = NULL;
139
140                 set_remove(service->configured_sockets, s);
141         }
142 }
143
144 static int socket_instantiate_service(Socket *s) {
145         char *prefix, *name;
146         int r;
147         Unit *u;
148
149         assert(s);
150
151         /* This fills in s->service if it isn't filled in yet. For
152          * Accept=yes sockets we create the next connection service
153          * here. For Accept=no this is mostly a NOP since the service
154          * is figured out at load time anyway. */
155
156         if (s->service)
157                 return 0;
158
159         assert(s->accept);
160
161         if (!(prefix = unit_name_to_prefix(s->meta.id)))
162                 return -ENOMEM;
163
164         r = asprintf(&name, "%s@%u.service", prefix, s->n_accepted);
165         free(prefix);
166
167         if (r < 0)
168                 return -ENOMEM;
169
170         r = manager_load_unit(s->meta.manager, name, NULL, NULL, &u);
171         free(name);
172
173         if (r < 0)
174                 return r;
175
176 #ifdef HAVE_SYSV_COMPAT
177         if (SERVICE(u)->sysv_path) {
178                 log_error("Using SysV services for socket activation is not supported. Refusing.");
179                 return -ENOENT;
180         }
181 #endif
182
183         u->meta.no_gc = true;
184         s->service = SERVICE(u);
185         return 0;
186 }
187
188 static bool have_non_accept_socket(Socket *s) {
189         SocketPort *p;
190
191         assert(s);
192
193         if (!s->accept)
194                 return true;
195
196         LIST_FOREACH(port, p, s->ports) {
197
198                 if (p->type != SOCKET_SOCKET)
199                         return true;
200
201                 if (!socket_address_can_accept(&p->address))
202                         return true;
203         }
204
205         return false;
206 }
207
208 static int socket_verify(Socket *s) {
209         assert(s);
210
211         if (s->meta.load_state != UNIT_LOADED)
212                 return 0;
213
214         if (!s->ports) {
215                 log_error("%s lacks Listen setting. Refusing.", s->meta.id);
216                 return -EINVAL;
217         }
218
219         if (s->accept && have_non_accept_socket(s)) {
220                 log_error("%s configured for accepting sockets, but sockets are non-accepting. Refusing.", s->meta.id);
221                 return -EINVAL;
222         }
223
224         if (s->accept && s->max_connections <= 0) {
225                 log_error("%s's MaxConnection setting too small. Refusing.", s->meta.id);
226                 return -EINVAL;
227         }
228
229         if (s->accept && s->service) {
230                 log_error("Explicit service configuration for accepting sockets not supported on %s. Refusing.", s->meta.id);
231                 return -EINVAL;
232         }
233
234         if (s->exec_context.pam_name && s->exec_context.kill_mode != KILL_CONTROL_GROUP) {
235                 log_error("%s has PAM enabled. Kill mode must be set to 'control-group'. Refusing.", s->meta.id);
236                 return -EINVAL;
237         }
238
239         return 0;
240 }
241
242 static bool socket_needs_mount(Socket *s, const char *prefix) {
243         SocketPort *p;
244
245         assert(s);
246
247         LIST_FOREACH(port, p, s->ports) {
248
249                 if (p->type == SOCKET_SOCKET) {
250                         if (socket_address_needs_mount(&p->address, prefix))
251                                 return true;
252                 } else if (p->type == SOCKET_FIFO || p->type == SOCKET_SPECIAL) {
253                         if (path_startswith(p->path, prefix))
254                                 return true;
255                 }
256         }
257
258         return false;
259 }
260
261 int socket_add_one_mount_link(Socket *s, Mount *m) {
262         int r;
263
264         assert(s);
265         assert(m);
266
267         if (s->meta.load_state != UNIT_LOADED ||
268             m->meta.load_state != UNIT_LOADED)
269                 return 0;
270
271         if (!socket_needs_mount(s, m->where))
272                 return 0;
273
274         if ((r = unit_add_two_dependencies(UNIT(s), UNIT_AFTER, UNIT_REQUIRES, UNIT(m), true)) < 0)
275                 return r;
276
277         return 0;
278 }
279
280 static int socket_add_mount_links(Socket *s) {
281         Meta *other;
282         int r;
283
284         assert(s);
285
286         LIST_FOREACH(units_by_type, other, s->meta.manager->units_by_type[UNIT_MOUNT])
287                 if ((r = socket_add_one_mount_link(s, (Mount*) other)) < 0)
288                         return r;
289
290         return 0;
291 }
292
293 static int socket_add_device_link(Socket *s) {
294         char *t;
295         int r;
296
297         assert(s);
298
299         if (!s->bind_to_device)
300                 return 0;
301
302         if (asprintf(&t, "/sys/subsystem/net/devices/%s", s->bind_to_device) < 0)
303                 return -ENOMEM;
304
305         r = unit_add_node_link(UNIT(s), t, false);
306         free(t);
307
308         return r;
309 }
310
311 static int socket_add_default_dependencies(Socket *s) {
312         int r;
313         assert(s);
314
315         if (s->meta.manager->running_as == MANAGER_SYSTEM) {
316                 if ((r = unit_add_dependency_by_name(UNIT(s), UNIT_BEFORE, SPECIAL_SOCKETS_TARGET, NULL, true)) < 0)
317                         return r;
318
319                 if ((r = unit_add_two_dependencies_by_name(UNIT(s), UNIT_AFTER, UNIT_REQUIRES, SPECIAL_SYSINIT_TARGET, NULL, true)) < 0)
320                         return r;
321         }
322
323         return unit_add_two_dependencies_by_name(UNIT(s), UNIT_BEFORE, UNIT_CONFLICTS, SPECIAL_SHUTDOWN_TARGET, NULL, true);
324 }
325
326 static bool socket_has_exec(Socket *s) {
327         unsigned i;
328         assert(s);
329
330         for (i = 0; i < _SOCKET_EXEC_COMMAND_MAX; i++)
331                 if (s->exec_command[i])
332                         return true;
333
334         return false;
335 }
336
337 static int socket_load(Unit *u) {
338         Socket *s = SOCKET(u);
339         int r;
340
341         assert(u);
342         assert(u->meta.load_state == UNIT_STUB);
343
344         if ((r = unit_load_fragment_and_dropin(u)) < 0)
345                 return r;
346
347         /* This is a new unit? Then let's add in some extras */
348         if (u->meta.load_state == UNIT_LOADED) {
349
350                 if (have_non_accept_socket(s)) {
351
352                         if (!s->service)
353                                 if ((r = unit_load_related_unit(u, ".service", (Unit**) &s->service)) < 0)
354                                         return r;
355
356                         if ((r = unit_add_dependency(u, UNIT_BEFORE, UNIT(s->service), true)) < 0)
357                                 return r;
358                 }
359
360                 if ((r = socket_add_mount_links(s)) < 0)
361                         return r;
362
363                 if ((r = socket_add_device_link(s)) < 0)
364                         return r;
365
366                 if (socket_has_exec(s))
367                         if ((r = unit_add_exec_dependencies(u, &s->exec_context)) < 0)
368                                 return r;
369
370                 if ((r = unit_add_default_cgroups(u)) < 0)
371                         return r;
372
373                 if (s->meta.default_dependencies)
374                         if ((r = socket_add_default_dependencies(s)) < 0)
375                                 return r;
376         }
377
378         return socket_verify(s);
379 }
380
/* Returns the name of the Listen* setting that corresponds to a socket
 * of the given address family and socket type. The netlink family
 * takes precedence over the type. Any other type than stream, datagram
 * or sequential packet is a programming error. */
static const char* listen_lookup(int family, int type) {

        if (family == AF_NETLINK)
                return "ListenNetlink";

        switch (type) {

        case SOCK_STREAM:
                return "ListenStream";

        case SOCK_DGRAM:
                return "ListenDatagram";

        case SOCK_SEQPACKET:
                return "ListenSequentialPacket";

        default:
                break;
        }

        assert_not_reached("Unknown socket type");
        return NULL;
}
396
397 static void socket_dump(Unit *u, FILE *f, const char *prefix) {
398
399         SocketExecCommand c;
400         Socket *s = SOCKET(u);
401         SocketPort *p;
402         const char *prefix2;
403         char *p2;
404
405         assert(s);
406         assert(f);
407
408         p2 = strappend(prefix, "\t");
409         prefix2 = p2 ? p2 : prefix;
410
411         fprintf(f,
412                 "%sSocket State: %s\n"
413                 "%sBindIPv6Only: %s\n"
414                 "%sBacklog: %u\n"
415                 "%sSocketMode: %04o\n"
416                 "%sDirectoryMode: %04o\n"
417                 "%sKeepAlive: %s\n"
418                 "%sFreeBind: %s\n"
419                 "%sTransparent: %s\n"
420                 "%sBroadcast: %s\n"
421                 "%sPassCrededentials: %s\n"
422                 "%sTCPCongestion: %s\n",
423                 prefix, socket_state_to_string(s->state),
424                 prefix, socket_address_bind_ipv6_only_to_string(s->bind_ipv6_only),
425                 prefix, s->backlog,
426                 prefix, s->socket_mode,
427                 prefix, s->directory_mode,
428                 prefix, yes_no(s->keep_alive),
429                 prefix, yes_no(s->free_bind),
430                 prefix, yes_no(s->transparent),
431                 prefix, yes_no(s->broadcast),
432                 prefix, yes_no(s->pass_cred),
433                 prefix, strna(s->tcp_congestion));
434
435         if (s->control_pid > 0)
436                 fprintf(f,
437                         "%sControl PID: %lu\n",
438                         prefix, (unsigned long) s->control_pid);
439
440         if (s->bind_to_device)
441                 fprintf(f,
442                         "%sBindToDevice: %s\n",
443                         prefix, s->bind_to_device);
444
445         if (s->accept)
446                 fprintf(f,
447                         "%sAccepted: %u\n"
448                         "%sNConnections: %u\n"
449                         "%sMaxConnections: %u\n",
450                         prefix, s->n_accepted,
451                         prefix, s->n_connections,
452                         prefix, s->max_connections);
453
454         if (s->priority >= 0)
455                 fprintf(f,
456                         "%sPriority: %i\n",
457                         prefix, s->priority);
458
459         if (s->receive_buffer > 0)
460                 fprintf(f,
461                         "%sReceiveBuffer: %zu\n",
462                         prefix, s->receive_buffer);
463
464         if (s->send_buffer > 0)
465                 fprintf(f,
466                         "%sSendBuffer: %zu\n",
467                         prefix, s->send_buffer);
468
469         if (s->ip_tos >= 0)
470                 fprintf(f,
471                         "%sIPTOS: %i\n",
472                         prefix, s->ip_tos);
473
474         if (s->ip_ttl >= 0)
475                 fprintf(f,
476                         "%sIPTTL: %i\n",
477                         prefix, s->ip_ttl);
478
479         if (s->pipe_size > 0)
480                 fprintf(f,
481                         "%sPipeSize: %zu\n",
482                         prefix, s->pipe_size);
483
484         if (s->mark >= 0)
485                 fprintf(f,
486                         "%sMark: %i\n",
487                         prefix, s->mark);
488
489         if (s->mq_maxmsg > 0)
490                 fprintf(f,
491                         "%sMessageQueueMaxMessages: %li\n",
492                         prefix, s->mq_maxmsg);
493
494         if (s->mq_msgsize > 0)
495                 fprintf(f,
496                         "%sMessageQueueMessageSize: %li\n",
497                         prefix, s->mq_msgsize);
498
499         LIST_FOREACH(port, p, s->ports) {
500
501                 if (p->type == SOCKET_SOCKET) {
502                         const char *t;
503                         int r;
504                         char *k = NULL;
505
506                         if ((r = socket_address_print(&p->address, &k)) < 0)
507                                 t = strerror(-r);
508                         else
509                                 t = k;
510
511                         fprintf(f, "%s%s: %s\n", prefix, listen_lookup(socket_address_family(&p->address), p->address.type), t);
512                         free(k);
513                 } else if (p->type == SOCKET_SPECIAL)
514                         fprintf(f, "%sListenSpecial: %s\n", prefix, p->path);
515                 else if (p->type == SOCKET_MQUEUE)
516                         fprintf(f, "%sListenMessageQueue: %s\n", prefix, p->path);
517                 else
518                         fprintf(f, "%sListenFIFO: %s\n", prefix, p->path);
519         }
520
521         exec_context_dump(&s->exec_context, f, prefix);
522
523         for (c = 0; c < _SOCKET_EXEC_COMMAND_MAX; c++) {
524                 if (!s->exec_command[c])
525                         continue;
526
527                 fprintf(f, "%s-> %s:\n",
528                         prefix, socket_exec_command_to_string(c));
529
530                 exec_command_dump_list(s->exec_command[c], f, prefix2);
531         }
532
533         free(p2);
534 }
535
536 static int instance_from_socket(int fd, unsigned nr, char **instance) {
537         socklen_t l;
538         char *r;
539         union {
540                 struct sockaddr sa;
541                 struct sockaddr_un un;
542                 struct sockaddr_in in;
543                 struct sockaddr_in6 in6;
544                 struct sockaddr_storage storage;
545         } local, remote;
546
547         assert(fd >= 0);
548         assert(instance);
549
550         l = sizeof(local);
551         if (getsockname(fd, &local.sa, &l) < 0)
552                 return -errno;
553
554         l = sizeof(remote);
555         if (getpeername(fd, &remote.sa, &l) < 0)
556                 return -errno;
557
558         switch (local.sa.sa_family) {
559
560         case AF_INET: {
561                 uint32_t
562                         a = ntohl(local.in.sin_addr.s_addr),
563                         b = ntohl(remote.in.sin_addr.s_addr);
564
565                 if (asprintf(&r,
566                              "%u.%u.%u.%u:%u-%u.%u.%u.%u:%u",
567                              a >> 24, (a >> 16) & 0xFF, (a >> 8) & 0xFF, a & 0xFF,
568                              ntohs(local.in.sin_port),
569                              b >> 24, (b >> 16) & 0xFF, (b >> 8) & 0xFF, b & 0xFF,
570                              ntohs(remote.in.sin_port)) < 0)
571                         return -ENOMEM;
572
573                 break;
574         }
575
576         case AF_INET6: {
577                 static const char ipv4_prefix[] = {
578                         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0xFF, 0xFF
579                 };
580
581                 if (memcmp(&local.in6.sin6_addr, ipv4_prefix, sizeof(ipv4_prefix)) == 0 &&
582                     memcmp(&remote.in6.sin6_addr, ipv4_prefix, sizeof(ipv4_prefix)) == 0) {
583                         const uint8_t
584                                 *a = local.in6.sin6_addr.s6_addr+12,
585                                 *b = remote.in6.sin6_addr.s6_addr+12;
586
587                         if (asprintf(&r,
588                                      "%u.%u.%u.%u:%u-%u.%u.%u.%u:%u",
589                                      a[0], a[1], a[2], a[3],
590                                      ntohs(local.in6.sin6_port),
591                                      b[0], b[1], b[2], b[3],
592                                      ntohs(remote.in6.sin6_port)) < 0)
593                                 return -ENOMEM;
594                 } else {
595                         char a[INET6_ADDRSTRLEN], b[INET6_ADDRSTRLEN];
596
597                         if (asprintf(&r,
598                                      "%s:%u-%s:%u",
599                                      inet_ntop(AF_INET6, &local.in6.sin6_addr, a, sizeof(a)),
600                                      ntohs(local.in6.sin6_port),
601                                      inet_ntop(AF_INET6, &remote.in6.sin6_addr, b, sizeof(b)),
602                                      ntohs(remote.in6.sin6_port)) < 0)
603                                 return -ENOMEM;
604                 }
605
606                 break;
607         }
608
609         case AF_UNIX: {
610                 struct ucred ucred;
611
612                 l = sizeof(ucred);
613                 if (getsockopt(fd, SOL_SOCKET, SO_PEERCRED, &ucred, &l) < 0)
614                         return -errno;
615
616                 if (asprintf(&r,
617                              "%u-%lu-%lu",
618                              nr,
619                              (unsigned long) ucred.pid,
620                              (unsigned long) ucred.uid) < 0)
621                         return -ENOMEM;
622
623                 break;
624         }
625
626         default:
627                 assert_not_reached("Unhandled socket type.");
628         }
629
630         *instance = r;
631         return 0;
632 }
633
634 static void socket_close_fds(Socket *s) {
635         SocketPort *p;
636
637         assert(s);
638
639         LIST_FOREACH(port, p, s->ports) {
640                 if (p->fd < 0)
641                         continue;
642
643                 unit_unwatch_fd(UNIT(s), &p->fd_watch);
644                 close_nointr_nofail(p->fd);
645
646                 /* One little note: we should never delete any sockets
647                  * in the file system here! After all some other
648                  * process we spawned might still have a reference of
649                  * this fd and wants to continue to use it. Therefore
650                  * we delete sockets in the file system before we
651                  * create a new one, not after we stopped using
652                  * one! */
653
654                 p->fd = -1;
655         }
656 }
657
658 static void socket_apply_socket_options(Socket *s, int fd) {
659         assert(s);
660         assert(fd >= 0);
661
662         if (s->keep_alive) {
663                 int b = s->keep_alive;
664                 if (setsockopt(fd, SOL_SOCKET, SO_KEEPALIVE, &b, sizeof(b)) < 0)
665                         log_warning("SO_KEEPALIVE failed: %m");
666         }
667
668         if (s->broadcast) {
669                 int one = 1;
670                 if (setsockopt(fd, SOL_SOCKET, SO_BROADCAST, &one, sizeof(one)) < 0)
671                         log_warning("SO_BROADCAST failed: %m");
672         }
673
674         if (s->pass_cred) {
675                 int one = 1;
676                 if (setsockopt(fd, SOL_SOCKET, SO_PASSCRED, &one, sizeof(one)) < 0)
677                         log_warning("SO_PASSCRED failed: %m");
678         }
679
680         if (s->priority >= 0)
681                 if (setsockopt(fd, SOL_SOCKET, SO_PRIORITY, &s->priority, sizeof(s->priority)) < 0)
682                         log_warning("SO_PRIORITY failed: %m");
683
684         if (s->receive_buffer > 0) {
685                 int value = (int) s->receive_buffer;
686                 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUFFORCE, &value, sizeof(value)) < 0)
687                         log_warning("SO_RCVBUFFORCE failed: %m");
688         }
689
690         if (s->send_buffer > 0) {
691                 int value = (int) s->send_buffer;
692                 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUFFORCE, &value, sizeof(value)) < 0)
693                         log_warning("SO_SNDBUFFORCE failed: %m");
694         }
695
696         if (s->mark >= 0)
697                 if (setsockopt(fd, SOL_SOCKET, SO_MARK, &s->mark, sizeof(s->mark)) < 0)
698                         log_warning("SO_MARK failed: %m");
699
700         if (s->ip_tos >= 0)
701                 if (setsockopt(fd, IPPROTO_IP, IP_TOS, &s->ip_tos, sizeof(s->ip_tos)) < 0)
702                         log_warning("IP_TOS failed: %m");
703
704         if (s->ip_ttl >= 0) {
705                 int r, x;
706
707                 r = setsockopt(fd, IPPROTO_IP, IP_TTL, &s->ip_ttl, sizeof(s->ip_ttl));
708
709                 if (socket_ipv6_is_supported())
710                         x = setsockopt(fd, IPPROTO_IPV6, IPV6_UNICAST_HOPS, &s->ip_ttl, sizeof(s->ip_ttl));
711                 else {
712                         x = -1;
713                         errno = EAFNOSUPPORT;
714                 }
715
716                 if (r < 0 && x < 0)
717                         log_warning("IP_TTL/IPV6_UNICAST_HOPS failed: %m");
718         }
719
720         if (s->tcp_congestion)
721                 if (setsockopt(fd, SOL_TCP, TCP_CONGESTION, s->tcp_congestion, strlen(s->tcp_congestion)+1) < 0)
722                         log_warning("TCP_CONGESTION failed: %m");
723 }
724
725 static void socket_apply_fifo_options(Socket *s, int fd) {
726         assert(s);
727         assert(fd >= 0);
728
729         if (s->pipe_size > 0)
730                 if (fcntl(fd, F_SETPIPE_SZ, s->pipe_size) < 0)
731                         log_warning("F_SETPIPE_SZ: %m");
732 }
733
734 static int fifo_address_create(
735                 const char *path,
736                 mode_t directory_mode,
737                 mode_t socket_mode,
738                 int *_fd) {
739
740         int fd = -1, r = 0;
741         struct stat st;
742         mode_t old_mask;
743
744         assert(path);
745         assert(_fd);
746
747         mkdir_parents(path, directory_mode);
748
749         if ((r = label_fifofile_set(path)) < 0)
750                 goto fail;
751
752         /* Enforce the right access mode for the fifo */
753         old_mask = umask(~ socket_mode);
754
755         /* Include the original umask in our mask */
756         umask(~socket_mode | old_mask);
757
758         r = mkfifo(path, socket_mode);
759         umask(old_mask);
760
761         if (r < 0 && errno != EEXIST) {
762                 r = -errno;
763                 goto fail;
764         }
765
766         if ((fd = open(path, O_RDWR|O_CLOEXEC|O_NOCTTY|O_NONBLOCK|O_NOFOLLOW)) < 0) {
767                 r = -errno;
768                 goto fail;
769         }
770
771         label_file_clear();
772
773         if (fstat(fd, &st) < 0) {
774                 r = -errno;
775                 goto fail;
776         }
777
778         if (!S_ISFIFO(st.st_mode) ||
779             (st.st_mode & 0777) != (socket_mode & ~old_mask) ||
780             st.st_uid != getuid() ||
781             st.st_gid != getgid()) {
782
783                 r = -EEXIST;
784                 goto fail;
785         }
786
787         *_fd = fd;
788         return 0;
789
790 fail:
791         label_file_clear();
792
793         if (fd >= 0)
794                 close_nointr_nofail(fd);
795
796         return r;
797 }
798
799 static int special_address_create(
800                 const char *path,
801                 int *_fd) {
802
803         int fd = -1, r = 0;
804         struct stat st;
805
806         assert(path);
807         assert(_fd);
808
809         if ((fd = open(path, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NONBLOCK|O_NOFOLLOW)) < 0) {
810                 r = -errno;
811                 goto fail;
812         }
813
814         if (fstat(fd, &st) < 0) {
815                 r = -errno;
816                 goto fail;
817         }
818
819         /* Check whether this is a /proc, /sys or /dev file or char device */
820         if (!S_ISREG(st.st_mode) && !S_ISCHR(st.st_mode)) {
821                 r = -EEXIST;
822                 goto fail;
823         }
824
825         *_fd = fd;
826         return 0;
827
828 fail:
829         if (fd >= 0)
830                 close_nointr_nofail(fd);
831
832         return r;
833 }
834
835 static int mq_address_create(
836                 const char *path,
837                 mode_t mq_mode,
838                 long maxmsg,
839                 long msgsize,
840                 int *_fd) {
841
842         int fd = -1, r = 0;
843         struct stat st;
844         mode_t old_mask;
845         struct mq_attr _attr, *attr = NULL;
846
847         assert(path);
848         assert(_fd);
849
850         if (maxmsg > 0 && msgsize > 0) {
851                 zero(_attr);
852                 _attr.mq_flags = O_NONBLOCK;
853                 _attr.mq_maxmsg = maxmsg;
854                 _attr.mq_msgsize = msgsize;
855                 attr = &_attr;
856         }
857
858         /* Enforce the right access mode for the mq */
859         old_mask = umask(~ mq_mode);
860
861         /* Include the original umask in our mask */
862         umask(~mq_mode | old_mask);
863
864         fd = mq_open(path, O_RDONLY|O_CLOEXEC|O_NONBLOCK|O_CREAT, mq_mode, attr);
865         umask(old_mask);
866
867         if (fd < 0) {
868                 r = -errno;
869                 goto fail;
870         }
871
872         if (fstat(fd, &st) < 0) {
873                 r = -errno;
874                 goto fail;
875         }
876
877         if ((st.st_mode & 0777) != (mq_mode & ~old_mask) ||
878             st.st_uid != getuid() ||
879             st.st_gid != getgid()) {
880
881                 r = -EEXIST;
882                 goto fail;
883         }
884
885         *_fd = fd;
886         return 0;
887
888 fail:
889         if (fd >= 0)
890                 close_nointr_nofail(fd);
891
892         return r;
893 }
894
895 static int socket_open_fds(Socket *s) {
896         SocketPort *p;
897         int r;
898         char *label = NULL;
899         bool know_label = false;
900
901         assert(s);
902
903         LIST_FOREACH(port, p, s->ports) {
904
905                 if (p->fd >= 0)
906                         continue;
907
908                 if (p->type == SOCKET_SOCKET) {
909
910                         if (!know_label) {
911
912                                 if ((r = socket_instantiate_service(s)) < 0)
913                                         return r;
914
915                                 if (s->service && s->service->exec_command[SERVICE_EXEC_START]) {
916                                         r = label_get_create_label_from_exe(s->service->exec_command[SERVICE_EXEC_START]->path, &label);
917
918                                         if (r < 0) {
919                                                 if (r != -EPERM)
920                                                         return r;
921                                         }
922                                 }
923
924                                 know_label = true;
925                         }
926
927                         if ((r = socket_address_listen(
928                                              &p->address,
929                                              s->backlog,
930                                              s->bind_ipv6_only,
931                                              s->bind_to_device,
932                                              s->free_bind,
933                                              s->transparent,
934                                              s->directory_mode,
935                                              s->socket_mode,
936                                              label,
937                                              &p->fd)) < 0)
938                                 goto rollback;
939
940                         socket_apply_socket_options(s, p->fd);
941
942                 } else  if (p->type == SOCKET_SPECIAL) {
943
944                         if ((r = special_address_create(
945                                              p->path,
946                                              &p->fd)) < 0)
947                                 goto rollback;
948
949                 } else  if (p->type == SOCKET_FIFO) {
950
951                         if ((r = fifo_address_create(
952                                              p->path,
953                                              s->directory_mode,
954                                              s->socket_mode,
955                                              &p->fd)) < 0)
956                                 goto rollback;
957
958                         socket_apply_fifo_options(s, p->fd);
959                 } else if (p->type == SOCKET_MQUEUE) {
960
961                         if ((r = mq_address_create(
962                                              p->path,
963                                              s->socket_mode,
964                                              s->mq_maxmsg,
965                                              s->mq_msgsize,
966                                              &p->fd)) < 0)
967                                 goto rollback;
968                 } else
969                         assert_not_reached("Unknown port type");
970         }
971
972         label_free(label);
973         return 0;
974
975 rollback:
976         socket_close_fds(s);
977         label_free(label);
978         return r;
979 }
980
981 static void socket_unwatch_fds(Socket *s) {
982         SocketPort *p;
983
984         assert(s);
985
986         LIST_FOREACH(port, p, s->ports) {
987                 if (p->fd < 0)
988                         continue;
989
990                 unit_unwatch_fd(UNIT(s), &p->fd_watch);
991         }
992 }
993
994 static int socket_watch_fds(Socket *s) {
995         SocketPort *p;
996         int r;
997
998         assert(s);
999
1000         LIST_FOREACH(port, p, s->ports) {
1001                 if (p->fd < 0)
1002                         continue;
1003
1004                 p->fd_watch.socket_accept =
1005                         s->accept &&
1006                         p->type == SOCKET_SOCKET &&
1007                         socket_address_can_accept(&p->address);
1008
1009                 if ((r = unit_watch_fd(UNIT(s), p->fd, EPOLLIN, &p->fd_watch)) < 0)
1010                         goto fail;
1011         }
1012
1013         return 0;
1014
1015 fail:
1016         socket_unwatch_fds(s);
1017         return r;
1018 }
1019
1020 static void socket_set_state(Socket *s, SocketState state) {
1021         SocketState old_state;
1022         assert(s);
1023
1024         old_state = s->state;
1025         s->state = state;
1026
1027         if (state != SOCKET_START_PRE &&
1028             state != SOCKET_START_POST &&
1029             state != SOCKET_STOP_PRE &&
1030             state != SOCKET_STOP_PRE_SIGTERM &&
1031             state != SOCKET_STOP_PRE_SIGKILL &&
1032             state != SOCKET_STOP_POST &&
1033             state != SOCKET_FINAL_SIGTERM &&
1034             state != SOCKET_FINAL_SIGKILL) {
1035                 unit_unwatch_timer(UNIT(s), &s->timer_watch);
1036                 socket_unwatch_control_pid(s);
1037                 s->control_command = NULL;
1038                 s->control_command_id = _SOCKET_EXEC_COMMAND_INVALID;
1039         }
1040
1041         if (state != SOCKET_LISTENING)
1042                 socket_unwatch_fds(s);
1043
1044         if (state != SOCKET_START_POST &&
1045             state != SOCKET_LISTENING &&
1046             state != SOCKET_RUNNING &&
1047             state != SOCKET_STOP_PRE &&
1048             state != SOCKET_STOP_PRE_SIGTERM &&
1049             state != SOCKET_STOP_PRE_SIGKILL)
1050                 socket_close_fds(s);
1051
1052         if (state != old_state)
1053                 log_debug("%s changed %s -> %s",
1054                           s->meta.id,
1055                           socket_state_to_string(old_state),
1056                           socket_state_to_string(state));
1057
1058         unit_notify(UNIT(s), state_translation_table[old_state], state_translation_table[state], true);
1059 }
1060
1061 static int socket_coldplug(Unit *u) {
1062         Socket *s = SOCKET(u);
1063         int r;
1064
1065         assert(s);
1066         assert(s->state == SOCKET_DEAD);
1067
1068         if (s->deserialized_state != s->state) {
1069
1070                 if (s->deserialized_state == SOCKET_START_PRE ||
1071                     s->deserialized_state == SOCKET_START_POST ||
1072                     s->deserialized_state == SOCKET_STOP_PRE ||
1073                     s->deserialized_state == SOCKET_STOP_PRE_SIGTERM ||
1074                     s->deserialized_state == SOCKET_STOP_PRE_SIGKILL ||
1075                     s->deserialized_state == SOCKET_STOP_POST ||
1076                     s->deserialized_state == SOCKET_FINAL_SIGTERM ||
1077                     s->deserialized_state == SOCKET_FINAL_SIGKILL) {
1078
1079                         if (s->control_pid <= 0)
1080                                 return -EBADMSG;
1081
1082                         if ((r = unit_watch_pid(UNIT(s), s->control_pid)) < 0)
1083                                 return r;
1084
1085                         if ((r = unit_watch_timer(UNIT(s), s->timeout_usec, &s->timer_watch)) < 0)
1086                                 return r;
1087                 }
1088
1089                 if (s->deserialized_state == SOCKET_START_POST ||
1090                     s->deserialized_state == SOCKET_LISTENING ||
1091                     s->deserialized_state == SOCKET_RUNNING ||
1092                     s->deserialized_state == SOCKET_STOP_PRE ||
1093                     s->deserialized_state == SOCKET_STOP_PRE_SIGTERM ||
1094                     s->deserialized_state == SOCKET_STOP_PRE_SIGKILL)
1095                         if ((r = socket_open_fds(s)) < 0)
1096                                 return r;
1097
1098                 if (s->deserialized_state == SOCKET_LISTENING)
1099                         if ((r = socket_watch_fds(s)) < 0)
1100                                 return r;
1101
1102                 socket_set_state(s, s->deserialized_state);
1103         }
1104
1105         return 0;
1106 }
1107
1108 static int socket_spawn(Socket *s, ExecCommand *c, pid_t *_pid) {
1109         pid_t pid;
1110         int r;
1111         char **argv;
1112
1113         assert(s);
1114         assert(c);
1115         assert(_pid);
1116
1117         if ((r = unit_watch_timer(UNIT(s), s->timeout_usec, &s->timer_watch)) < 0)
1118                 goto fail;
1119
1120         if (!(argv = unit_full_printf_strv(UNIT(s), c->argv))) {
1121                 r = -ENOMEM;
1122                 goto fail;
1123         }
1124
1125         r = exec_spawn(c,
1126                        argv,
1127                        &s->exec_context,
1128                        NULL, 0,
1129                        s->meta.manager->environment,
1130                        true,
1131                        true,
1132                        true,
1133                        s->meta.manager->confirm_spawn,
1134                        s->meta.cgroup_bondings,
1135                        s->meta.cgroup_attributes,
1136                        &pid);
1137
1138         strv_free(argv);
1139         if (r < 0)
1140                 goto fail;
1141
1142         if ((r = unit_watch_pid(UNIT(s), pid)) < 0)
1143                 /* FIXME: we need to do something here */
1144                 goto fail;
1145
1146         *_pid = pid;
1147
1148         return 0;
1149
1150 fail:
1151         unit_unwatch_timer(UNIT(s), &s->timer_watch);
1152
1153         return r;
1154 }
1155
1156 static void socket_enter_dead(Socket *s, bool success) {
1157         assert(s);
1158
1159         if (!success)
1160                 s->failure = true;
1161
1162         socket_set_state(s, s->failure ? SOCKET_FAILED : SOCKET_DEAD);
1163 }
1164
1165 static void socket_enter_signal(Socket *s, SocketState state, bool success);
1166
1167 static void socket_enter_stop_post(Socket *s, bool success) {
1168         int r;
1169         assert(s);
1170
1171         if (!success)
1172                 s->failure = true;
1173
1174         socket_unwatch_control_pid(s);
1175
1176         s->control_command_id = SOCKET_EXEC_STOP_POST;
1177
1178         if ((s->control_command = s->exec_command[SOCKET_EXEC_STOP_POST])) {
1179                 if ((r = socket_spawn(s, s->control_command, &s->control_pid)) < 0)
1180                         goto fail;
1181
1182                 socket_set_state(s, SOCKET_STOP_POST);
1183         } else
1184                 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, true);
1185
1186         return;
1187
1188 fail:
1189         log_warning("%s failed to run 'stop-post' task: %s", s->meta.id, strerror(-r));
1190         socket_enter_signal(s, SOCKET_FINAL_SIGTERM, false);
1191 }
1192
1193 static void socket_enter_signal(Socket *s, SocketState state, bool success) {
1194         int r;
1195         Set *pid_set = NULL;
1196         bool wait_for_exit = false;
1197
1198         assert(s);
1199
1200         if (!success)
1201                 s->failure = true;
1202
1203         if (s->exec_context.kill_mode != KILL_NONE) {
1204                 int sig = (state == SOCKET_STOP_PRE_SIGTERM || state == SOCKET_FINAL_SIGTERM) ? s->exec_context.kill_signal : SIGKILL;
1205
1206                 if (s->control_pid > 0) {
1207                         if (kill_and_sigcont(s->control_pid, sig) < 0 && errno != ESRCH)
1208
1209                                 log_warning("Failed to kill control process %li: %m", (long) s->control_pid);
1210                         else
1211                                 wait_for_exit = true;
1212                 }
1213
1214                 if (s->exec_context.kill_mode == KILL_CONTROL_GROUP) {
1215
1216                         if (!(pid_set = set_new(trivial_hash_func, trivial_compare_func))) {
1217                                 r = -ENOMEM;
1218                                 goto fail;
1219                         }
1220
1221                         /* Exclude the control pid from being killed via the cgroup */
1222                         if (s->control_pid > 0)
1223                                 if ((r = set_put(pid_set, LONG_TO_PTR(s->control_pid))) < 0)
1224                                         goto fail;
1225
1226                         if ((r = cgroup_bonding_kill_list(s->meta.cgroup_bondings, sig, true, pid_set)) < 0) {
1227                                 if (r != -EAGAIN && r != -ESRCH && r != -ENOENT)
1228                                         log_warning("Failed to kill control group: %s", strerror(-r));
1229                         } else if (r > 0)
1230                                 wait_for_exit = true;
1231
1232                         set_free(pid_set);
1233                         pid_set = NULL;
1234                 }
1235         }
1236
1237         if (wait_for_exit) {
1238                 if ((r = unit_watch_timer(UNIT(s), s->timeout_usec, &s->timer_watch)) < 0)
1239                         goto fail;
1240
1241                 socket_set_state(s, state);
1242         } else if (state == SOCKET_STOP_PRE_SIGTERM || state == SOCKET_STOP_PRE_SIGKILL)
1243                 socket_enter_stop_post(s, true);
1244         else
1245                 socket_enter_dead(s, true);
1246
1247         return;
1248
1249 fail:
1250         log_warning("%s failed to kill processes: %s", s->meta.id, strerror(-r));
1251
1252         if (state == SOCKET_STOP_PRE_SIGTERM || state == SOCKET_STOP_PRE_SIGKILL)
1253                 socket_enter_stop_post(s, false);
1254         else
1255                 socket_enter_dead(s, false);
1256
1257         if (pid_set)
1258                 set_free(pid_set);
1259 }
1260
1261 static void socket_enter_stop_pre(Socket *s, bool success) {
1262         int r;
1263         assert(s);
1264
1265         if (!success)
1266                 s->failure = true;
1267
1268         socket_unwatch_control_pid(s);
1269
1270         s->control_command_id = SOCKET_EXEC_STOP_PRE;
1271
1272         if ((s->control_command = s->exec_command[SOCKET_EXEC_STOP_PRE])) {
1273                 if ((r = socket_spawn(s, s->control_command, &s->control_pid)) < 0)
1274                         goto fail;
1275
1276                 socket_set_state(s, SOCKET_STOP_PRE);
1277         } else
1278                 socket_enter_stop_post(s, true);
1279
1280         return;
1281
1282 fail:
1283         log_warning("%s failed to run 'stop-pre' task: %s", s->meta.id, strerror(-r));
1284         socket_enter_stop_post(s, false);
1285 }
1286
1287 static void socket_enter_listening(Socket *s) {
1288         int r;
1289         assert(s);
1290
1291         if ((r = socket_watch_fds(s)) < 0) {
1292                 log_warning("%s failed to watch sockets: %s", s->meta.id, strerror(-r));
1293                 goto fail;
1294         }
1295
1296         socket_set_state(s, SOCKET_LISTENING);
1297         return;
1298
1299 fail:
1300         socket_enter_stop_pre(s, false);
1301 }
1302
1303 static void socket_enter_start_post(Socket *s) {
1304         int r;
1305         assert(s);
1306
1307         if ((r = socket_open_fds(s)) < 0) {
1308                 log_warning("%s failed to listen on sockets: %s", s->meta.id, strerror(-r));
1309                 goto fail;
1310         }
1311
1312         socket_unwatch_control_pid(s);
1313
1314         s->control_command_id = SOCKET_EXEC_START_POST;
1315
1316         if ((s->control_command = s->exec_command[SOCKET_EXEC_START_POST])) {
1317                 if ((r = socket_spawn(s, s->control_command, &s->control_pid)) < 0) {
1318                         log_warning("%s failed to run 'start-post' task: %s", s->meta.id, strerror(-r));
1319                         goto fail;
1320                 }
1321
1322                 socket_set_state(s, SOCKET_START_POST);
1323         } else
1324                 socket_enter_listening(s);
1325
1326         return;
1327
1328 fail:
1329         socket_enter_stop_pre(s, false);
1330 }
1331
1332 static void socket_enter_start_pre(Socket *s) {
1333         int r;
1334         assert(s);
1335
1336         socket_unwatch_control_pid(s);
1337
1338         s->control_command_id = SOCKET_EXEC_START_PRE;
1339
1340         if ((s->control_command = s->exec_command[SOCKET_EXEC_START_PRE])) {
1341                 if ((r = socket_spawn(s, s->control_command, &s->control_pid)) < 0)
1342                         goto fail;
1343
1344                 socket_set_state(s, SOCKET_START_PRE);
1345         } else
1346                 socket_enter_start_post(s);
1347
1348         return;
1349
1350 fail:
1351         log_warning("%s failed to run 'start-pre' task: %s", s->meta.id, strerror(-r));
1352         socket_enter_dead(s, false);
1353 }
1354
1355 static void socket_enter_running(Socket *s, int cfd) {
1356         int r;
1357         DBusError error;
1358
1359         assert(s);
1360         dbus_error_init(&error);
1361
1362         /* We don't take connections anymore if we are supposed to
1363          * shut down anyway */
1364         if (unit_pending_inactive(UNIT(s))) {
1365                 log_debug("Suppressing connection request on %s since unit stop is scheduled.", s->meta.id);
1366
1367                 if (cfd >= 0)
1368                         close_nointr_nofail(cfd);
1369                 else  {
1370                         /* Flush all sockets by closing and reopening them */
1371                         socket_close_fds(s);
1372
1373                         if ((r = socket_watch_fds(s)) < 0) {
1374                                 log_warning("%s failed to watch sockets: %s", s->meta.id, strerror(-r));
1375                                 socket_enter_stop_pre(s, false);
1376                         }
1377                 }
1378
1379                 return;
1380         }
1381
1382         if (cfd < 0) {
1383                 bool pending = false;
1384                 Meta *i;
1385
1386                 /* If there's already a start pending don't bother to
1387                  * do anything */
1388                 LIST_FOREACH(units_by_type, i, s->meta.manager->units_by_type[UNIT_SERVICE]) {
1389                         Service *service = (Service *) i;
1390
1391                         if (!set_get(service->configured_sockets, s))
1392                                 continue;
1393
1394                         if (!unit_pending_active(UNIT(service)))
1395                                 continue;
1396
1397                         pending = true;
1398                         break;
1399                 }
1400
1401                 if (!pending)
1402                         if ((r = manager_add_job(s->meta.manager, JOB_START, UNIT(s->service), JOB_REPLACE, true, &error, NULL)) < 0)
1403                                 goto fail;
1404
1405                 socket_set_state(s, SOCKET_RUNNING);
1406         } else {
1407                 char *prefix, *instance = NULL, *name;
1408                 Service *service;
1409
1410                 if (s->n_connections >= s->max_connections) {
1411                         log_warning("Too many incoming connections (%u)", s->n_connections);
1412                         close_nointr_nofail(cfd);
1413                         return;
1414                 }
1415
1416                 if ((r = socket_instantiate_service(s)) < 0)
1417                         goto fail;
1418
1419                 if ((r = instance_from_socket(cfd, s->n_accepted, &instance)) < 0)
1420                         goto fail;
1421
1422                 if (!(prefix = unit_name_to_prefix(s->meta.id))) {
1423                         free(instance);
1424                         r = -ENOMEM;
1425                         goto fail;
1426                 }
1427
1428                 name = unit_name_build(prefix, instance, ".service");
1429                 free(prefix);
1430                 free(instance);
1431
1432                 if (!name) {
1433                         r = -ENOMEM;
1434                         goto fail;
1435                 }
1436
1437                 if ((r = unit_add_name(UNIT(s->service), name)) < 0) {
1438                         free(name);
1439                         goto fail;
1440                 }
1441
1442                 service = s->service;
1443                 s->service = NULL;
1444                 s->n_accepted ++;
1445
1446                 service->meta.no_gc = false;
1447
1448                 unit_choose_id(UNIT(service), name);
1449                 free(name);
1450
1451                 if ((r = service_set_socket_fd(service, cfd, s)) < 0)
1452                         goto fail;
1453
1454                 cfd = -1;
1455                 s->n_connections ++;
1456
1457                 if ((r = manager_add_job(s->meta.manager, JOB_START, UNIT(service), JOB_REPLACE, true, &error, NULL)) < 0)
1458                         goto fail;
1459
1460                 /* Notify clients about changed counters */
1461                 unit_add_to_dbus_queue(UNIT(s));
1462         }
1463
1464         return;
1465
1466 fail:
1467         log_warning("%s failed to queue socket startup job: %s", s->meta.id, bus_error(&error, r));
1468         socket_enter_stop_pre(s, false);
1469
1470         if (cfd >= 0)
1471                 close_nointr_nofail(cfd);
1472
1473         dbus_error_free(&error);
1474 }
1475
1476 static void socket_run_next(Socket *s, bool success) {
1477         int r;
1478
1479         assert(s);
1480         assert(s->control_command);
1481         assert(s->control_command->command_next);
1482
1483         if (!success)
1484                 s->failure = true;
1485
1486         socket_unwatch_control_pid(s);
1487
1488         s->control_command = s->control_command->command_next;
1489
1490         if ((r = socket_spawn(s, s->control_command, &s->control_pid)) < 0)
1491                 goto fail;
1492
1493         return;
1494
1495 fail:
1496         log_warning("%s failed to run next task: %s", s->meta.id, strerror(-r));
1497
1498         if (s->state == SOCKET_START_POST)
1499                 socket_enter_stop_pre(s, false);
1500         else if (s->state == SOCKET_STOP_POST)
1501                 socket_enter_dead(s, false);
1502         else
1503                 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, false);
1504 }
1505
1506 static int socket_start(Unit *u) {
1507         Socket *s = SOCKET(u);
1508
1509         assert(s);
1510
1511         /* We cannot fulfill this request right now, try again later
1512          * please! */
1513         if (s->state == SOCKET_STOP_PRE ||
1514             s->state == SOCKET_STOP_PRE_SIGKILL ||
1515             s->state == SOCKET_STOP_PRE_SIGTERM ||
1516             s->state == SOCKET_STOP_POST ||
1517             s->state == SOCKET_FINAL_SIGTERM ||
1518             s->state == SOCKET_FINAL_SIGKILL)
1519                 return -EAGAIN;
1520
1521         if (s->state == SOCKET_START_PRE ||
1522             s->state == SOCKET_START_POST)
1523                 return 0;
1524
1525         /* Cannot run this without the service being around */
1526         if (s->service) {
1527                 if (s->service->meta.load_state != UNIT_LOADED) {
1528                         log_error("Socket service %s not loaded, refusing.", s->service->meta.id);
1529                         return -ENOENT;
1530                 }
1531
1532                 /* If the service is already active we cannot start the
1533                  * socket */
1534                 if (s->service->state != SERVICE_DEAD &&
1535                     s->service->state != SERVICE_FAILED &&
1536                     s->service->state != SERVICE_AUTO_RESTART) {
1537                         log_error("Socket service %s already active, refusing.", s->service->meta.id);
1538                         return -EBUSY;
1539                 }
1540
1541 #ifdef HAVE_SYSV_COMPAT
1542                 if (s->service->sysv_path) {
1543                         log_error("Using SysV services for socket activation is not supported. Refusing.");
1544                         return -ENOENT;
1545                 }
1546 #endif
1547         }
1548
1549         assert(s->state == SOCKET_DEAD || s->state == SOCKET_FAILED);
1550
1551         s->failure = false;
1552         socket_enter_start_pre(s);
1553         return 0;
1554 }
1555
1556 static int socket_stop(Unit *u) {
1557         Socket *s = SOCKET(u);
1558
1559         assert(s);
1560
1561         /* Already on it */
1562         if (s->state == SOCKET_STOP_PRE ||
1563             s->state == SOCKET_STOP_PRE_SIGTERM ||
1564             s->state == SOCKET_STOP_PRE_SIGKILL ||
1565             s->state == SOCKET_STOP_POST ||
1566             s->state == SOCKET_FINAL_SIGTERM ||
1567             s->state == SOCKET_FINAL_SIGKILL)
1568                 return 0;
1569
1570         /* If there's already something running we go directly into
1571          * kill mode. */
1572         if (s->state == SOCKET_START_PRE ||
1573             s->state == SOCKET_START_POST) {
1574                 socket_enter_signal(s, SOCKET_STOP_PRE_SIGTERM, true);
1575                 return -EAGAIN;
1576         }
1577
1578         assert(s->state == SOCKET_LISTENING || s->state == SOCKET_RUNNING);
1579
1580         socket_enter_stop_pre(s, true);
1581         return 0;
1582 }
1583
1584 static int socket_serialize(Unit *u, FILE *f, FDSet *fds) {
1585         Socket *s = SOCKET(u);
1586         SocketPort *p;
1587         int r;
1588
1589         assert(u);
1590         assert(f);
1591         assert(fds);
1592
1593         unit_serialize_item(u, f, "state", socket_state_to_string(s->state));
1594         unit_serialize_item(u, f, "failure", yes_no(s->failure));
1595         unit_serialize_item_format(u, f, "n-accepted", "%u", s->n_accepted);
1596
1597         if (s->control_pid > 0)
1598                 unit_serialize_item_format(u, f, "control-pid", "%lu", (unsigned long) s->control_pid);
1599
1600         if (s->control_command_id >= 0)
1601                 unit_serialize_item(u, f, "control-command", socket_exec_command_to_string(s->control_command_id));
1602
1603         LIST_FOREACH(port, p, s->ports) {
1604                 int copy;
1605
1606                 if (p->fd < 0)
1607                         continue;
1608
1609                 if ((copy = fdset_put_dup(fds, p->fd)) < 0)
1610                         return copy;
1611
1612                 if (p->type == SOCKET_SOCKET) {
1613                         char *t;
1614
1615                         if ((r = socket_address_print(&p->address, &t)) < 0)
1616                                 return r;
1617
1618                         if (socket_address_family(&p->address) == AF_NETLINK)
1619                                 unit_serialize_item_format(u, f, "netlink", "%i %s", copy, t);
1620                         else
1621                                 unit_serialize_item_format(u, f, "socket", "%i %i %s", copy, p->address.type, t);
1622                         free(t);
1623                 } else if (p->type == SOCKET_SPECIAL)
1624                         unit_serialize_item_format(u, f, "special", "%i %s", copy, p->path);
1625                 else {
1626                         assert(p->type == SOCKET_FIFO);
1627                         unit_serialize_item_format(u, f, "fifo", "%i %s", copy, p->path);
1628                 }
1629         }
1630
1631         return 0;
1632 }
1633
1634 static int socket_deserialize_item(Unit *u, const char *key, const char *value, FDSet *fds) {
1635         Socket *s = SOCKET(u);
1636
1637         assert(u);
1638         assert(key);
1639         assert(value);
1640         assert(fds);
1641
1642         if (streq(key, "state")) {
1643                 SocketState state;
1644
1645                 if ((state = socket_state_from_string(value)) < 0)
1646                         log_debug("Failed to parse state value %s", value);
1647                 else
1648                         s->deserialized_state = state;
1649         } else if (streq(key, "failure")) {
1650                 int b;
1651
1652                 if ((b = parse_boolean(value)) < 0)
1653                         log_debug("Failed to parse failure value %s", value);
1654                 else
1655                         s->failure = b || s->failure;
1656
1657         } else if (streq(key, "n-accepted")) {
1658                 unsigned k;
1659
1660                 if (safe_atou(value, &k) < 0)
1661                         log_debug("Failed to parse n-accepted value %s", value);
1662                 else
1663                         s->n_accepted += k;
1664         } else if (streq(key, "control-pid")) {
1665                 pid_t pid;
1666
1667                 if (parse_pid(value, &pid) < 0)
1668                         log_debug("Failed to parse control-pid value %s", value);
1669                 else
1670                         s->control_pid = pid;
1671         } else if (streq(key, "control-command")) {
1672                 SocketExecCommand id;
1673
1674                 if ((id = socket_exec_command_from_string(value)) < 0)
1675                         log_debug("Failed to parse exec-command value %s", value);
1676                 else {
1677                         s->control_command_id = id;
1678                         s->control_command = s->exec_command[id];
1679                 }
1680         } else if (streq(key, "fifo")) {
1681                 int fd, skip = 0;
1682                 SocketPort *p;
1683
1684                 if (sscanf(value, "%i %n", &fd, &skip) < 1 || fd < 0 || !fdset_contains(fds, fd))
1685                         log_debug("Failed to parse fifo value %s", value);
1686                 else {
1687
1688                         LIST_FOREACH(port, p, s->ports)
1689                                 if (p->type == SOCKET_FIFO &&
1690                                     streq_ptr(p->path, value+skip))
1691                                         break;
1692
1693                         if (p) {
1694                                 if (p->fd >= 0)
1695                                         close_nointr_nofail(p->fd);
1696                                 p->fd = fdset_remove(fds, fd);
1697                         }
1698                 }
1699
1700         } else if (streq(key, "special")) {
1701                 int fd, skip = 0;
1702                 SocketPort *p;
1703
1704                 if (sscanf(value, "%i %n", &fd, &skip) < 1 || fd < 0 || !fdset_contains(fds, fd))
1705                         log_debug("Failed to parse special value %s", value);
1706                 else {
1707
1708                         LIST_FOREACH(port, p, s->ports)
1709                                 if (p->type == SOCKET_SPECIAL &&
1710                                     streq_ptr(p->path, value+skip))
1711                                         break;
1712
1713                         if (p) {
1714                                 if (p->fd >= 0)
1715                                         close_nointr_nofail(p->fd);
1716                                 p->fd = fdset_remove(fds, fd);
1717                         }
1718                 }
1719
1720         } else if (streq(key, "socket")) {
1721                 int fd, type, skip = 0;
1722                 SocketPort *p;
1723
1724                 if (sscanf(value, "%i %i %n", &fd, &type, &skip) < 2 || fd < 0 || type < 0 || !fdset_contains(fds, fd))
1725                         log_debug("Failed to parse socket value %s", value);
1726                 else {
1727
1728                         LIST_FOREACH(port, p, s->ports)
1729                                 if (socket_address_is(&p->address, value+skip, type))
1730                                         break;
1731
1732                         if (p) {
1733                                 if (p->fd >= 0)
1734                                         close_nointr_nofail(p->fd);
1735                                 p->fd = fdset_remove(fds, fd);
1736                         }
1737                 }
1738
1739         } else if (streq(key, "netlink")) {
1740                 int fd, skip = 0;
1741                 SocketPort *p;
1742
1743                 if (sscanf(value, "%i %n", &fd, &skip) < 1 || fd < 0 || !fdset_contains(fds, fd))
1744                         log_debug("Failed to parse socket value %s", value);
1745                 else {
1746
1747                         LIST_FOREACH(port, p, s->ports)
1748                                 if (socket_address_is_netlink(&p->address, value+skip))
1749                                         break;
1750
1751                         if (p) {
1752                                 if (p->fd >= 0)
1753                                         close_nointr_nofail(p->fd);
1754                                 p->fd = fdset_remove(fds, fd);
1755                         }
1756                 }
1757
1758         } else
1759                 log_debug("Unknown serialization key '%s'", key);
1760
1761         return 0;
1762 }
1763
1764 static UnitActiveState socket_active_state(Unit *u) {
1765         assert(u);
1766
1767         return state_translation_table[SOCKET(u)->state];
1768 }
1769
1770 static const char *socket_sub_state_to_string(Unit *u) {
1771         assert(u);
1772
1773         return socket_state_to_string(SOCKET(u)->state);
1774 }
1775
1776 static bool socket_check_gc(Unit *u) {
1777         Socket *s = SOCKET(u);
1778
1779         assert(u);
1780
1781         return s->n_connections > 0;
1782 }
1783
1784 static void socket_fd_event(Unit *u, int fd, uint32_t events, Watch *w) {
1785         Socket *s = SOCKET(u);
1786         int cfd = -1;
1787
1788         assert(s);
1789         assert(fd >= 0);
1790
1791         if (s->state != SOCKET_LISTENING)
1792                 return;
1793
1794         log_debug("Incoming traffic on %s", u->meta.id);
1795
1796         if (events != EPOLLIN) {
1797
1798                 if (events & EPOLLHUP)
1799                         log_error("%s: Got POLLHUP on a listening socket. The service probably invoked shutdown() on it, and should better not do that.", u->meta.id);
1800                 else
1801                         log_error("%s: Got unexpected poll event (0x%x) on socket.", u->meta.id, events);
1802
1803                 goto fail;
1804         }
1805
1806         if (w->socket_accept) {
1807                 for (;;) {
1808
1809                         if ((cfd = accept4(fd, NULL, NULL, SOCK_NONBLOCK)) < 0) {
1810
1811                                 if (errno == EINTR)
1812                                         continue;
1813
1814                                 log_error("Failed to accept socket: %m");
1815                                 goto fail;
1816                         }
1817
1818                         break;
1819                 }
1820
1821                 socket_apply_socket_options(s, cfd);
1822         }
1823
1824         socket_enter_running(s, cfd);
1825         return;
1826
1827 fail:
1828         socket_enter_stop_pre(s, false);
1829 }
1830
1831 static void socket_sigchld_event(Unit *u, pid_t pid, int code, int status) {
1832         Socket *s = SOCKET(u);
1833         bool success;
1834
1835         assert(s);
1836         assert(pid >= 0);
1837
1838         if (pid != s->control_pid)
1839                 return;
1840
1841         s->control_pid = 0;
1842
1843         success = is_clean_exit(code, status);
1844
1845         if (s->control_command) {
1846                 exec_status_exit(&s->control_command->exec_status, &s->exec_context, pid, code, status);
1847
1848                 if (s->control_command->ignore)
1849                         success = true;
1850         }
1851
1852         log_full(success ? LOG_DEBUG : LOG_NOTICE,
1853                  "%s control process exited, code=%s status=%i", u->meta.id, sigchld_code_to_string(code), status);
1854         s->failure = s->failure || !success;
1855
1856         if (s->control_command && s->control_command->command_next && success) {
1857                 log_debug("%s running next command for state %s", u->meta.id, socket_state_to_string(s->state));
1858                 socket_run_next(s, success);
1859         } else {
1860                 s->control_command = NULL;
1861                 s->control_command_id = _SOCKET_EXEC_COMMAND_INVALID;
1862
1863                 /* No further commands for this step, so let's figure
1864                  * out what to do next */
1865
1866                 log_debug("%s got final SIGCHLD for state %s", u->meta.id, socket_state_to_string(s->state));
1867
1868                 switch (s->state) {
1869
1870                 case SOCKET_START_PRE:
1871                         if (success)
1872                                 socket_enter_start_post(s);
1873                         else
1874                                 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, false);
1875                         break;
1876
1877                 case SOCKET_START_POST:
1878                         if (success)
1879                                 socket_enter_listening(s);
1880                         else
1881                                 socket_enter_stop_pre(s, false);
1882                         break;
1883
1884                 case SOCKET_STOP_PRE:
1885                 case SOCKET_STOP_PRE_SIGTERM:
1886                 case SOCKET_STOP_PRE_SIGKILL:
1887                         socket_enter_stop_post(s, success);
1888                         break;
1889
1890                 case SOCKET_STOP_POST:
1891                 case SOCKET_FINAL_SIGTERM:
1892                 case SOCKET_FINAL_SIGKILL:
1893                         socket_enter_dead(s, success);
1894                         break;
1895
1896                 default:
1897                         assert_not_reached("Uh, control process died at wrong time.");
1898                 }
1899         }
1900
1901         /* Notify clients about changed exit status */
1902         unit_add_to_dbus_queue(u);
1903 }
1904
1905 static void socket_timer_event(Unit *u, uint64_t elapsed, Watch *w) {
1906         Socket *s = SOCKET(u);
1907
1908         assert(s);
1909         assert(elapsed == 1);
1910         assert(w == &s->timer_watch);
1911
1912         switch (s->state) {
1913
1914         case SOCKET_START_PRE:
1915                 log_warning("%s starting timed out. Terminating.", u->meta.id);
1916                 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, false);
1917                 break;
1918
1919         case SOCKET_START_POST:
1920                 log_warning("%s starting timed out. Stopping.", u->meta.id);
1921                 socket_enter_stop_pre(s, false);
1922                 break;
1923
1924         case SOCKET_STOP_PRE:
1925                 log_warning("%s stopping timed out. Terminating.", u->meta.id);
1926                 socket_enter_signal(s, SOCKET_STOP_PRE_SIGTERM, false);
1927                 break;
1928
1929         case SOCKET_STOP_PRE_SIGTERM:
1930                 if (s->exec_context.send_sigkill) {
1931                         log_warning("%s stopping timed out. Killing.", u->meta.id);
1932                         socket_enter_signal(s, SOCKET_STOP_PRE_SIGKILL, false);
1933                 } else {
1934                         log_warning("%s stopping timed out. Skipping SIGKILL. Ignoring.", u->meta.id);
1935                         socket_enter_stop_post(s, false);
1936                 }
1937                 break;
1938
1939         case SOCKET_STOP_PRE_SIGKILL:
1940                 log_warning("%s still around after SIGKILL. Ignoring.", u->meta.id);
1941                 socket_enter_stop_post(s, false);
1942                 break;
1943
1944         case SOCKET_STOP_POST:
1945                 log_warning("%s stopping timed out (2). Terminating.", u->meta.id);
1946                 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, false);
1947                 break;
1948
1949         case SOCKET_FINAL_SIGTERM:
1950                 if (s->exec_context.send_sigkill) {
1951                         log_warning("%s stopping timed out (2). Killing.", u->meta.id);
1952                         socket_enter_signal(s, SOCKET_FINAL_SIGKILL, false);
1953                 } else {
1954                         log_warning("%s stopping timed out (2). Skipping SIGKILL. Ignoring.", u->meta.id);
1955                         socket_enter_dead(s, false);
1956                 }
1957                 break;
1958
1959         case SOCKET_FINAL_SIGKILL:
1960                 log_warning("%s still around after SIGKILL (2). Entering failed mode.", u->meta.id);
1961                 socket_enter_dead(s, false);
1962                 break;
1963
1964         default:
1965                 assert_not_reached("Timeout at wrong time.");
1966         }
1967 }
1968
1969 int socket_collect_fds(Socket *s, int **fds, unsigned *n_fds) {
1970         int *rfds;
1971         unsigned rn_fds, k;
1972         SocketPort *p;
1973
1974         assert(s);
1975         assert(fds);
1976         assert(n_fds);
1977
1978         /* Called from the service code for requesting our fds */
1979
1980         rn_fds = 0;
1981         LIST_FOREACH(port, p, s->ports)
1982                 if (p->fd >= 0)
1983                         rn_fds++;
1984
1985         if (rn_fds <= 0) {
1986                 *fds = NULL;
1987                 *n_fds = 0;
1988                 return 0;
1989         }
1990
1991         if (!(rfds = new(int, rn_fds)))
1992                 return -ENOMEM;
1993
1994         k = 0;
1995         LIST_FOREACH(port, p, s->ports)
1996                 if (p->fd >= 0)
1997                         rfds[k++] = p->fd;
1998
1999         assert(k == rn_fds);
2000
2001         *fds = rfds;
2002         *n_fds = rn_fds;
2003
2004         return 0;
2005 }
2006
2007 void socket_notify_service_dead(Socket *s) {
2008         assert(s);
2009
2010         /* The service is dead. Dang!
2011          *
2012          * This is strictly for one-instance-for-all-connections
2013          * services. */
2014
2015         if (s->state == SOCKET_RUNNING) {
2016                 log_debug("%s got notified about service death.", s->meta.id);
2017                 socket_enter_listening(s);
2018         }
2019 }
2020
2021 void socket_connection_unref(Socket *s) {
2022         assert(s);
2023
2024         /* The service is dead. Yay!
2025          *
2026          * This is strictly for one-instance-per-connection
2027          * services. */
2028
2029         assert(s->n_connections > 0);
2030         s->n_connections--;
2031
2032         log_debug("%s: One connection closed, %u left.", s->meta.id, s->n_connections);
2033 }
2034
2035 static void socket_reset_failed(Unit *u) {
2036         Socket *s = SOCKET(u);
2037
2038         assert(s);
2039
2040         if (s->state == SOCKET_FAILED)
2041                 socket_set_state(s, SOCKET_DEAD);
2042
2043         s->failure = false;
2044 }
2045
2046 static int socket_kill(Unit *u, KillWho who, KillMode mode, int signo, DBusError *error) {
2047         Socket *s = SOCKET(u);
2048         int r = 0;
2049         Set *pid_set = NULL;
2050
2051         assert(s);
2052
2053         if (who == KILL_MAIN) {
2054                 dbus_set_error(error, BUS_ERROR_NO_SUCH_PROCESS, "Socket units have no main processes");
2055                 return -ESRCH;
2056         }
2057
2058         if (s->control_pid <= 0 && who == KILL_CONTROL) {
2059                 dbus_set_error(error, BUS_ERROR_NO_SUCH_PROCESS, "No control process to kill");
2060                 return -ESRCH;
2061         }
2062
2063         if (who == KILL_CONTROL || who == KILL_ALL)
2064                 if (s->control_pid > 0)
2065                         if (kill(s->control_pid, signo) < 0)
2066                                 r = -errno;
2067
2068         if (who == KILL_ALL && mode == KILL_CONTROL_GROUP) {
2069                 int q;
2070
2071                 if (!(pid_set = set_new(trivial_hash_func, trivial_compare_func)))
2072                         return -ENOMEM;
2073
2074                 /* Exclude the control pid from being killed via the cgroup */
2075                 if (s->control_pid > 0)
2076                         if ((q = set_put(pid_set, LONG_TO_PTR(s->control_pid))) < 0) {
2077                                 r = q;
2078                                 goto finish;
2079                         }
2080
2081                 if ((q = cgroup_bonding_kill_list(s->meta.cgroup_bondings, signo, false, pid_set)) < 0)
2082                         if (q != -EAGAIN && q != -ESRCH && q != -ENOENT)
2083                                 r = q;
2084         }
2085
2086 finish:
2087         if (pid_set)
2088                 set_free(pid_set);
2089
2090         return r;
2091 }
2092
2093 static const char* const socket_state_table[_SOCKET_STATE_MAX] = {
2094         [SOCKET_DEAD] = "dead",
2095         [SOCKET_START_PRE] = "start-pre",
2096         [SOCKET_START_POST] = "start-post",
2097         [SOCKET_LISTENING] = "listening",
2098         [SOCKET_RUNNING] = "running",
2099         [SOCKET_STOP_PRE] = "stop-pre",
2100         [SOCKET_STOP_PRE_SIGTERM] = "stop-pre-sigterm",
2101         [SOCKET_STOP_PRE_SIGKILL] = "stop-pre-sigkill",
2102         [SOCKET_STOP_POST] = "stop-post",
2103         [SOCKET_FINAL_SIGTERM] = "final-sigterm",
2104         [SOCKET_FINAL_SIGKILL] = "final-sigkill",
2105         [SOCKET_FAILED] = "failed"
2106 };
2107
2108 DEFINE_STRING_TABLE_LOOKUP(socket_state, SocketState);
2109
2110 static const char* const socket_exec_command_table[_SOCKET_EXEC_COMMAND_MAX] = {
2111         [SOCKET_EXEC_START_PRE] = "StartPre",
2112         [SOCKET_EXEC_START_POST] = "StartPost",
2113         [SOCKET_EXEC_STOP_PRE] = "StopPre",
2114         [SOCKET_EXEC_STOP_POST] = "StopPost"
2115 };
2116
2117 DEFINE_STRING_TABLE_LOOKUP(socket_exec_command, SocketExecCommand);
2118
2119 const UnitVTable socket_vtable = {
2120         .suffix = ".socket",
2121         .sections =
2122                 "Unit\0"
2123                 "Socket\0"
2124                 "Install\0",
2125
2126         .init = socket_init,
2127         .done = socket_done,
2128         .load = socket_load,
2129
2130         .kill = socket_kill,
2131
2132         .coldplug = socket_coldplug,
2133
2134         .dump = socket_dump,
2135
2136         .start = socket_start,
2137         .stop = socket_stop,
2138
2139         .serialize = socket_serialize,
2140         .deserialize_item = socket_deserialize_item,
2141
2142         .active_state = socket_active_state,
2143         .sub_state_to_string = socket_sub_state_to_string,
2144
2145         .check_gc = socket_check_gc,
2146
2147         .fd_event = socket_fd_event,
2148         .sigchld_event = socket_sigchld_event,
2149         .timer_event = socket_timer_event,
2150
2151         .reset_failed = socket_reset_failed,
2152
2153         .bus_interface = "org.freedesktop.systemd1.Socket",
2154         .bus_message_handler = bus_socket_message_handler,
2155         .bus_invalidating_properties =  bus_socket_invalidating_properties
2156 };