chiark / gitweb /
socket: don't fail the socket on ENOTCONN
[elogind.git] / src / socket.c
1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
2
3 /***
4   This file is part of systemd.
5
6   Copyright 2010 Lennart Poettering
7
8   systemd is free software; you can redistribute it and/or modify it
9   under the terms of the GNU General Public License as published by
10   the Free Software Foundation; either version 2 of the License, or
11   (at your option) any later version.
12
13   systemd is distributed in the hope that it will be useful, but
14   WITHOUT ANY WARRANTY; without even the implied warranty of
15   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16   General Public License for more details.
17
18   You should have received a copy of the GNU General Public License
19   along with systemd; If not, see <http://www.gnu.org/licenses/>.
20 ***/
21
22 #include <sys/types.h>
23 #include <sys/stat.h>
24 #include <unistd.h>
25 #include <errno.h>
26 #include <fcntl.h>
27 #include <sys/epoll.h>
28 #include <signal.h>
29 #include <arpa/inet.h>
30 #include <mqueue.h>
31
32 #include "unit.h"
33 #include "socket.h"
34 #include "netinet/tcp.h"
35 #include "log.h"
36 #include "load-dropin.h"
37 #include "load-fragment.h"
38 #include "strv.h"
39 #include "unit-name.h"
40 #include "dbus-socket.h"
41 #include "missing.h"
42 #include "special.h"
43 #include "bus-errors.h"
44 #include "label.h"
45 #include "exit-status.h"
46 #include "def.h"
47
48 static const UnitActiveState state_translation_table[_SOCKET_STATE_MAX] = {
49         [SOCKET_DEAD] = UNIT_INACTIVE,
50         [SOCKET_START_PRE] = UNIT_ACTIVATING,
51         [SOCKET_START_POST] = UNIT_ACTIVATING,
52         [SOCKET_LISTENING] = UNIT_ACTIVE,
53         [SOCKET_RUNNING] = UNIT_ACTIVE,
54         [SOCKET_STOP_PRE] = UNIT_DEACTIVATING,
55         [SOCKET_STOP_PRE_SIGTERM] = UNIT_DEACTIVATING,
56         [SOCKET_STOP_PRE_SIGKILL] = UNIT_DEACTIVATING,
57         [SOCKET_STOP_POST] = UNIT_DEACTIVATING,
58         [SOCKET_FINAL_SIGTERM] = UNIT_DEACTIVATING,
59         [SOCKET_FINAL_SIGKILL] = UNIT_DEACTIVATING,
60         [SOCKET_FAILED] = UNIT_FAILED
61 };
62
63 static void socket_init(Unit *u) {
64         Socket *s = SOCKET(u);
65
66         assert(u);
67         assert(u->load_state == UNIT_STUB);
68
69         s->backlog = SOMAXCONN;
70         s->timeout_usec = DEFAULT_TIMEOUT_USEC;
71         s->directory_mode = 0755;
72         s->socket_mode = 0666;
73
74         s->max_connections = 64;
75
76         s->priority = -1;
77         s->ip_tos = -1;
78         s->ip_ttl = -1;
79         s->mark = -1;
80
81         exec_context_init(&s->exec_context);
82         s->exec_context.std_output = u->manager->default_std_output;
83         s->exec_context.std_error = u->manager->default_std_error;
84
85         s->control_command_id = _SOCKET_EXEC_COMMAND_INVALID;
86 }
87
88 static void socket_unwatch_control_pid(Socket *s) {
89         assert(s);
90
91         if (s->control_pid <= 0)
92                 return;
93
94         unit_unwatch_pid(UNIT(s), s->control_pid);
95         s->control_pid = 0;
96 }
97
98 static void socket_done(Unit *u) {
99         Socket *s = SOCKET(u);
100         SocketPort *p;
101
102         assert(s);
103
104         while ((p = s->ports)) {
105                 LIST_REMOVE(SocketPort, port, s->ports, p);
106
107                 if (p->fd >= 0) {
108                         unit_unwatch_fd(UNIT(s), &p->fd_watch);
109                         close_nointr_nofail(p->fd);
110                 }
111
112                 free(p->path);
113                 free(p);
114         }
115
116         exec_context_done(&s->exec_context);
117         exec_command_free_array(s->exec_command, _SOCKET_EXEC_COMMAND_MAX);
118         s->control_command = NULL;
119
120         socket_unwatch_control_pid(s);
121
122         unit_ref_unset(&s->service);
123
124         free(s->tcp_congestion);
125         s->tcp_congestion = NULL;
126
127         free(s->bind_to_device);
128         s->bind_to_device = NULL;
129
130         unit_unwatch_timer(u, &s->timer_watch);
131 }
132
133 static int socket_instantiate_service(Socket *s) {
134         char *prefix, *name;
135         int r;
136         Unit *u;
137
138         assert(s);
139
140         /* This fills in s->service if it isn't filled in yet. For
141          * Accept=yes sockets we create the next connection service
142          * here. For Accept=no this is mostly a NOP since the service
143          * is figured out at load time anyway. */
144
145         if (UNIT_DEREF(s->service))
146                 return 0;
147
148         assert(s->accept);
149
150         if (!(prefix = unit_name_to_prefix(UNIT(s)->id)))
151                 return -ENOMEM;
152
153         r = asprintf(&name, "%s@%u.service", prefix, s->n_accepted);
154         free(prefix);
155
156         if (r < 0)
157                 return -ENOMEM;
158
159         r = manager_load_unit(UNIT(s)->manager, name, NULL, NULL, &u);
160         free(name);
161
162         if (r < 0)
163                 return r;
164
165 #ifdef HAVE_SYSV_COMPAT
166         if (SERVICE(u)->sysv_path) {
167                 log_error("Using SysV services for socket activation is not supported. Refusing.");
168                 return -ENOENT;
169         }
170 #endif
171
172         u->no_gc = true;
173         unit_ref_set(&s->service, u);
174
175         return unit_add_two_dependencies(UNIT(s), UNIT_BEFORE, UNIT_TRIGGERS, u, false);
176 }
177
178 static bool have_non_accept_socket(Socket *s) {
179         SocketPort *p;
180
181         assert(s);
182
183         if (!s->accept)
184                 return true;
185
186         LIST_FOREACH(port, p, s->ports) {
187
188                 if (p->type != SOCKET_SOCKET)
189                         return true;
190
191                 if (!socket_address_can_accept(&p->address))
192                         return true;
193         }
194
195         return false;
196 }
197
198 static int socket_verify(Socket *s) {
199         assert(s);
200
201         if (UNIT(s)->load_state != UNIT_LOADED)
202                 return 0;
203
204         if (!s->ports) {
205                 log_error("%s lacks Listen setting. Refusing.", UNIT(s)->id);
206                 return -EINVAL;
207         }
208
209         if (s->accept && have_non_accept_socket(s)) {
210                 log_error("%s configured for accepting sockets, but sockets are non-accepting. Refusing.", UNIT(s)->id);
211                 return -EINVAL;
212         }
213
214         if (s->accept && s->max_connections <= 0) {
215                 log_error("%s's MaxConnection setting too small. Refusing.", UNIT(s)->id);
216                 return -EINVAL;
217         }
218
219         if (s->accept && UNIT_DEREF(s->service)) {
220                 log_error("Explicit service configuration for accepting sockets not supported on %s. Refusing.", UNIT(s)->id);
221                 return -EINVAL;
222         }
223
224         if (s->exec_context.pam_name && s->exec_context.kill_mode != KILL_CONTROL_GROUP) {
225                 log_error("%s has PAM enabled. Kill mode must be set to 'control-group'. Refusing.", UNIT(s)->id);
226                 return -EINVAL;
227         }
228
229         return 0;
230 }
231
232 static bool socket_needs_mount(Socket *s, const char *prefix) {
233         SocketPort *p;
234
235         assert(s);
236
237         LIST_FOREACH(port, p, s->ports) {
238
239                 if (p->type == SOCKET_SOCKET) {
240                         if (socket_address_needs_mount(&p->address, prefix))
241                                 return true;
242                 } else if (p->type == SOCKET_FIFO || p->type == SOCKET_SPECIAL) {
243                         if (path_startswith(p->path, prefix))
244                                 return true;
245                 }
246         }
247
248         return false;
249 }
250
251 int socket_add_one_mount_link(Socket *s, Mount *m) {
252         int r;
253
254         assert(s);
255         assert(m);
256
257         if (UNIT(s)->load_state != UNIT_LOADED ||
258             UNIT(m)->load_state != UNIT_LOADED)
259                 return 0;
260
261         if (!socket_needs_mount(s, m->where))
262                 return 0;
263
264         if ((r = unit_add_two_dependencies(UNIT(s), UNIT_AFTER, UNIT_REQUIRES, UNIT(m), true)) < 0)
265                 return r;
266
267         return 0;
268 }
269
270 static int socket_add_mount_links(Socket *s) {
271         Unit *other;
272         int r;
273
274         assert(s);
275
276         LIST_FOREACH(units_by_type, other, UNIT(s)->manager->units_by_type[UNIT_MOUNT])
277                 if ((r = socket_add_one_mount_link(s, MOUNT(other))) < 0)
278                         return r;
279
280         return 0;
281 }
282
283 static int socket_add_device_link(Socket *s) {
284         char *t;
285         int r;
286
287         assert(s);
288
289         if (!s->bind_to_device)
290                 return 0;
291
292         if (asprintf(&t, "/sys/subsystem/net/devices/%s", s->bind_to_device) < 0)
293                 return -ENOMEM;
294
295         r = unit_add_node_link(UNIT(s), t, false);
296         free(t);
297
298         return r;
299 }
300
301 static int socket_add_default_dependencies(Socket *s) {
302         int r;
303         assert(s);
304
305         if (UNIT(s)->manager->running_as == MANAGER_SYSTEM) {
306                 if ((r = unit_add_dependency_by_name(UNIT(s), UNIT_BEFORE, SPECIAL_SOCKETS_TARGET, NULL, true)) < 0)
307                         return r;
308
309                 if ((r = unit_add_two_dependencies_by_name(UNIT(s), UNIT_AFTER, UNIT_REQUIRES, SPECIAL_SYSINIT_TARGET, NULL, true)) < 0)
310                         return r;
311         }
312
313         return unit_add_two_dependencies_by_name(UNIT(s), UNIT_BEFORE, UNIT_CONFLICTS, SPECIAL_SHUTDOWN_TARGET, NULL, true);
314 }
315
316 static bool socket_has_exec(Socket *s) {
317         unsigned i;
318         assert(s);
319
320         for (i = 0; i < _SOCKET_EXEC_COMMAND_MAX; i++)
321                 if (s->exec_command[i])
322                         return true;
323
324         return false;
325 }
326
327 static int socket_load(Unit *u) {
328         Socket *s = SOCKET(u);
329         int r;
330
331         assert(u);
332         assert(u->load_state == UNIT_STUB);
333
334         if ((r = unit_load_fragment_and_dropin(u)) < 0)
335                 return r;
336
337         /* This is a new unit? Then let's add in some extras */
338         if (u->load_state == UNIT_LOADED) {
339
340                 if (have_non_accept_socket(s)) {
341
342                         if (!UNIT_DEREF(s->service)) {
343                                 Unit *x;
344
345                                 r = unit_load_related_unit(u, ".service", &x);
346                                 if (r < 0)
347                                         return r;
348
349                                 unit_ref_set(&s->service, x);
350                         }
351
352                         r = unit_add_two_dependencies(u, UNIT_BEFORE, UNIT_TRIGGERS, UNIT_DEREF(s->service), true);
353                         if (r < 0)
354                                 return r;
355                 }
356
357                 if ((r = socket_add_mount_links(s)) < 0)
358                         return r;
359
360                 if ((r = socket_add_device_link(s)) < 0)
361                         return r;
362
363                 if (socket_has_exec(s))
364                         if ((r = unit_add_exec_dependencies(u, &s->exec_context)) < 0)
365                                 return r;
366
367                 if ((r = unit_add_default_cgroups(u)) < 0)
368                         return r;
369
370                 if (UNIT(s)->default_dependencies)
371                         if ((r = socket_add_default_dependencies(s)) < 0)
372                                 return r;
373         }
374
375         return socket_verify(s);
376 }
377
/* Maps an address family / socket type pair to the name of the
 * corresponding Listen* setting. AF_NETLINK wins regardless of the
 * type; any other family is told apart by type only. An unknown type
 * trips assert_not_reached(). */
static const char* listen_lookup(int family, int type) {

        if (family == AF_NETLINK)
                return "ListenNetlink";

        switch (type) {

        case SOCK_STREAM:
                return "ListenStream";

        case SOCK_DGRAM:
                return "ListenDatagram";

        case SOCK_SEQPACKET:
                return "ListenSequentialPacket";

        default:
                break;
        }

        assert_not_reached("Unknown socket type");
        return NULL;
}
393
394 static void socket_dump(Unit *u, FILE *f, const char *prefix) {
395
396         SocketExecCommand c;
397         Socket *s = SOCKET(u);
398         SocketPort *p;
399         const char *prefix2;
400         char *p2;
401
402         assert(s);
403         assert(f);
404
405         p2 = strappend(prefix, "\t");
406         prefix2 = p2 ? p2 : prefix;
407
408         fprintf(f,
409                 "%sSocket State: %s\n"
410                 "%sBindIPv6Only: %s\n"
411                 "%sBacklog: %u\n"
412                 "%sSocketMode: %04o\n"
413                 "%sDirectoryMode: %04o\n"
414                 "%sKeepAlive: %s\n"
415                 "%sFreeBind: %s\n"
416                 "%sTransparent: %s\n"
417                 "%sBroadcast: %s\n"
418                 "%sPassCrededentials: %s\n"
419                 "%sTCPCongestion: %s\n",
420                 prefix, socket_state_to_string(s->state),
421                 prefix, socket_address_bind_ipv6_only_to_string(s->bind_ipv6_only),
422                 prefix, s->backlog,
423                 prefix, s->socket_mode,
424                 prefix, s->directory_mode,
425                 prefix, yes_no(s->keep_alive),
426                 prefix, yes_no(s->free_bind),
427                 prefix, yes_no(s->transparent),
428                 prefix, yes_no(s->broadcast),
429                 prefix, yes_no(s->pass_cred),
430                 prefix, strna(s->tcp_congestion));
431
432         if (s->control_pid > 0)
433                 fprintf(f,
434                         "%sControl PID: %lu\n",
435                         prefix, (unsigned long) s->control_pid);
436
437         if (s->bind_to_device)
438                 fprintf(f,
439                         "%sBindToDevice: %s\n",
440                         prefix, s->bind_to_device);
441
442         if (s->accept)
443                 fprintf(f,
444                         "%sAccepted: %u\n"
445                         "%sNConnections: %u\n"
446                         "%sMaxConnections: %u\n",
447                         prefix, s->n_accepted,
448                         prefix, s->n_connections,
449                         prefix, s->max_connections);
450
451         if (s->priority >= 0)
452                 fprintf(f,
453                         "%sPriority: %i\n",
454                         prefix, s->priority);
455
456         if (s->receive_buffer > 0)
457                 fprintf(f,
458                         "%sReceiveBuffer: %zu\n",
459                         prefix, s->receive_buffer);
460
461         if (s->send_buffer > 0)
462                 fprintf(f,
463                         "%sSendBuffer: %zu\n",
464                         prefix, s->send_buffer);
465
466         if (s->ip_tos >= 0)
467                 fprintf(f,
468                         "%sIPTOS: %i\n",
469                         prefix, s->ip_tos);
470
471         if (s->ip_ttl >= 0)
472                 fprintf(f,
473                         "%sIPTTL: %i\n",
474                         prefix, s->ip_ttl);
475
476         if (s->pipe_size > 0)
477                 fprintf(f,
478                         "%sPipeSize: %zu\n",
479                         prefix, s->pipe_size);
480
481         if (s->mark >= 0)
482                 fprintf(f,
483                         "%sMark: %i\n",
484                         prefix, s->mark);
485
486         if (s->mq_maxmsg > 0)
487                 fprintf(f,
488                         "%sMessageQueueMaxMessages: %li\n",
489                         prefix, s->mq_maxmsg);
490
491         if (s->mq_msgsize > 0)
492                 fprintf(f,
493                         "%sMessageQueueMessageSize: %li\n",
494                         prefix, s->mq_msgsize);
495
496         LIST_FOREACH(port, p, s->ports) {
497
498                 if (p->type == SOCKET_SOCKET) {
499                         const char *t;
500                         int r;
501                         char *k = NULL;
502
503                         if ((r = socket_address_print(&p->address, &k)) < 0)
504                                 t = strerror(-r);
505                         else
506                                 t = k;
507
508                         fprintf(f, "%s%s: %s\n", prefix, listen_lookup(socket_address_family(&p->address), p->address.type), t);
509                         free(k);
510                 } else if (p->type == SOCKET_SPECIAL)
511                         fprintf(f, "%sListenSpecial: %s\n", prefix, p->path);
512                 else if (p->type == SOCKET_MQUEUE)
513                         fprintf(f, "%sListenMessageQueue: %s\n", prefix, p->path);
514                 else
515                         fprintf(f, "%sListenFIFO: %s\n", prefix, p->path);
516         }
517
518         exec_context_dump(&s->exec_context, f, prefix);
519
520         for (c = 0; c < _SOCKET_EXEC_COMMAND_MAX; c++) {
521                 if (!s->exec_command[c])
522                         continue;
523
524                 fprintf(f, "%s-> %s:\n",
525                         prefix, socket_exec_command_to_string(c));
526
527                 exec_command_dump_list(s->exec_command[c], f, prefix2);
528         }
529
530         free(p2);
531 }
532
533 static int instance_from_socket(int fd, unsigned nr, char **instance) {
534         socklen_t l;
535         char *r;
536         union {
537                 struct sockaddr sa;
538                 struct sockaddr_un un;
539                 struct sockaddr_in in;
540                 struct sockaddr_in6 in6;
541                 struct sockaddr_storage storage;
542         } local, remote;
543
544         assert(fd >= 0);
545         assert(instance);
546
547         l = sizeof(local);
548         if (getsockname(fd, &local.sa, &l) < 0)
549                 return -errno;
550
551         l = sizeof(remote);
552         if (getpeername(fd, &remote.sa, &l) < 0)
553                 return -errno;
554
555         switch (local.sa.sa_family) {
556
557         case AF_INET: {
558                 uint32_t
559                         a = ntohl(local.in.sin_addr.s_addr),
560                         b = ntohl(remote.in.sin_addr.s_addr);
561
562                 if (asprintf(&r,
563                              "%u.%u.%u.%u:%u-%u.%u.%u.%u:%u",
564                              a >> 24, (a >> 16) & 0xFF, (a >> 8) & 0xFF, a & 0xFF,
565                              ntohs(local.in.sin_port),
566                              b >> 24, (b >> 16) & 0xFF, (b >> 8) & 0xFF, b & 0xFF,
567                              ntohs(remote.in.sin_port)) < 0)
568                         return -ENOMEM;
569
570                 break;
571         }
572
573         case AF_INET6: {
574                 static const char ipv4_prefix[] = {
575                         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0xFF, 0xFF
576                 };
577
578                 if (memcmp(&local.in6.sin6_addr, ipv4_prefix, sizeof(ipv4_prefix)) == 0 &&
579                     memcmp(&remote.in6.sin6_addr, ipv4_prefix, sizeof(ipv4_prefix)) == 0) {
580                         const uint8_t
581                                 *a = local.in6.sin6_addr.s6_addr+12,
582                                 *b = remote.in6.sin6_addr.s6_addr+12;
583
584                         if (asprintf(&r,
585                                      "%u.%u.%u.%u:%u-%u.%u.%u.%u:%u",
586                                      a[0], a[1], a[2], a[3],
587                                      ntohs(local.in6.sin6_port),
588                                      b[0], b[1], b[2], b[3],
589                                      ntohs(remote.in6.sin6_port)) < 0)
590                                 return -ENOMEM;
591                 } else {
592                         char a[INET6_ADDRSTRLEN], b[INET6_ADDRSTRLEN];
593
594                         if (asprintf(&r,
595                                      "%s:%u-%s:%u",
596                                      inet_ntop(AF_INET6, &local.in6.sin6_addr, a, sizeof(a)),
597                                      ntohs(local.in6.sin6_port),
598                                      inet_ntop(AF_INET6, &remote.in6.sin6_addr, b, sizeof(b)),
599                                      ntohs(remote.in6.sin6_port)) < 0)
600                                 return -ENOMEM;
601                 }
602
603                 break;
604         }
605
606         case AF_UNIX: {
607                 struct ucred ucred;
608
609                 l = sizeof(ucred);
610                 if (getsockopt(fd, SOL_SOCKET, SO_PEERCRED, &ucred, &l) < 0)
611                         return -errno;
612
613                 if (asprintf(&r,
614                              "%u-%lu-%lu",
615                              nr,
616                              (unsigned long) ucred.pid,
617                              (unsigned long) ucred.uid) < 0)
618                         return -ENOMEM;
619
620                 break;
621         }
622
623         default:
624                 assert_not_reached("Unhandled socket type.");
625         }
626
627         *instance = r;
628         return 0;
629 }
630
631 static void socket_close_fds(Socket *s) {
632         SocketPort *p;
633
634         assert(s);
635
636         LIST_FOREACH(port, p, s->ports) {
637                 if (p->fd < 0)
638                         continue;
639
640                 unit_unwatch_fd(UNIT(s), &p->fd_watch);
641                 close_nointr_nofail(p->fd);
642
643                 /* One little note: we should never delete any sockets
644                  * in the file system here! After all some other
645                  * process we spawned might still have a reference of
646                  * this fd and wants to continue to use it. Therefore
647                  * we delete sockets in the file system before we
648                  * create a new one, not after we stopped using
649                  * one! */
650
651                 p->fd = -1;
652         }
653 }
654
655 static void socket_apply_socket_options(Socket *s, int fd) {
656         assert(s);
657         assert(fd >= 0);
658
659         if (s->keep_alive) {
660                 int b = s->keep_alive;
661                 if (setsockopt(fd, SOL_SOCKET, SO_KEEPALIVE, &b, sizeof(b)) < 0)
662                         log_warning("SO_KEEPALIVE failed: %m");
663         }
664
665         if (s->broadcast) {
666                 int one = 1;
667                 if (setsockopt(fd, SOL_SOCKET, SO_BROADCAST, &one, sizeof(one)) < 0)
668                         log_warning("SO_BROADCAST failed: %m");
669         }
670
671         if (s->pass_cred) {
672                 int one = 1;
673                 if (setsockopt(fd, SOL_SOCKET, SO_PASSCRED, &one, sizeof(one)) < 0)
674                         log_warning("SO_PASSCRED failed: %m");
675         }
676
677         if (s->priority >= 0)
678                 if (setsockopt(fd, SOL_SOCKET, SO_PRIORITY, &s->priority, sizeof(s->priority)) < 0)
679                         log_warning("SO_PRIORITY failed: %m");
680
681         if (s->receive_buffer > 0) {
682                 int value = (int) s->receive_buffer;
683                 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUFFORCE, &value, sizeof(value)) < 0)
684                         log_warning("SO_RCVBUFFORCE failed: %m");
685         }
686
687         if (s->send_buffer > 0) {
688                 int value = (int) s->send_buffer;
689                 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUFFORCE, &value, sizeof(value)) < 0)
690                         log_warning("SO_SNDBUFFORCE failed: %m");
691         }
692
693         if (s->mark >= 0)
694                 if (setsockopt(fd, SOL_SOCKET, SO_MARK, &s->mark, sizeof(s->mark)) < 0)
695                         log_warning("SO_MARK failed: %m");
696
697         if (s->ip_tos >= 0)
698                 if (setsockopt(fd, IPPROTO_IP, IP_TOS, &s->ip_tos, sizeof(s->ip_tos)) < 0)
699                         log_warning("IP_TOS failed: %m");
700
701         if (s->ip_ttl >= 0) {
702                 int r, x;
703
704                 r = setsockopt(fd, IPPROTO_IP, IP_TTL, &s->ip_ttl, sizeof(s->ip_ttl));
705
706                 if (socket_ipv6_is_supported())
707                         x = setsockopt(fd, IPPROTO_IPV6, IPV6_UNICAST_HOPS, &s->ip_ttl, sizeof(s->ip_ttl));
708                 else {
709                         x = -1;
710                         errno = EAFNOSUPPORT;
711                 }
712
713                 if (r < 0 && x < 0)
714                         log_warning("IP_TTL/IPV6_UNICAST_HOPS failed: %m");
715         }
716
717         if (s->tcp_congestion)
718                 if (setsockopt(fd, SOL_TCP, TCP_CONGESTION, s->tcp_congestion, strlen(s->tcp_congestion)+1) < 0)
719                         log_warning("TCP_CONGESTION failed: %m");
720 }
721
722 static void socket_apply_fifo_options(Socket *s, int fd) {
723         assert(s);
724         assert(fd >= 0);
725
726         if (s->pipe_size > 0)
727                 if (fcntl(fd, F_SETPIPE_SZ, s->pipe_size) < 0)
728                         log_warning("F_SETPIPE_SZ: %m");
729 }
730
731 static int fifo_address_create(
732                 const char *path,
733                 mode_t directory_mode,
734                 mode_t socket_mode,
735                 int *_fd) {
736
737         int fd = -1, r = 0;
738         struct stat st;
739         mode_t old_mask;
740
741         assert(path);
742         assert(_fd);
743
744         mkdir_parents(path, directory_mode);
745
746         if ((r = label_fifofile_set(path)) < 0)
747                 goto fail;
748
749         /* Enforce the right access mode for the fifo */
750         old_mask = umask(~ socket_mode);
751
752         /* Include the original umask in our mask */
753         umask(~socket_mode | old_mask);
754
755         r = mkfifo(path, socket_mode);
756         umask(old_mask);
757
758         if (r < 0 && errno != EEXIST) {
759                 r = -errno;
760                 goto fail;
761         }
762
763         if ((fd = open(path, O_RDWR|O_CLOEXEC|O_NOCTTY|O_NONBLOCK|O_NOFOLLOW)) < 0) {
764                 r = -errno;
765                 goto fail;
766         }
767
768         label_file_clear();
769
770         if (fstat(fd, &st) < 0) {
771                 r = -errno;
772                 goto fail;
773         }
774
775         if (!S_ISFIFO(st.st_mode) ||
776             (st.st_mode & 0777) != (socket_mode & ~old_mask) ||
777             st.st_uid != getuid() ||
778             st.st_gid != getgid()) {
779
780                 r = -EEXIST;
781                 goto fail;
782         }
783
784         *_fd = fd;
785         return 0;
786
787 fail:
788         label_file_clear();
789
790         if (fd >= 0)
791                 close_nointr_nofail(fd);
792
793         return r;
794 }
795
796 static int special_address_create(
797                 const char *path,
798                 int *_fd) {
799
800         int fd = -1, r = 0;
801         struct stat st;
802
803         assert(path);
804         assert(_fd);
805
806         if ((fd = open(path, O_RDONLY|O_CLOEXEC|O_NOCTTY|O_NONBLOCK|O_NOFOLLOW)) < 0) {
807                 r = -errno;
808                 goto fail;
809         }
810
811         if (fstat(fd, &st) < 0) {
812                 r = -errno;
813                 goto fail;
814         }
815
816         /* Check whether this is a /proc, /sys or /dev file or char device */
817         if (!S_ISREG(st.st_mode) && !S_ISCHR(st.st_mode)) {
818                 r = -EEXIST;
819                 goto fail;
820         }
821
822         *_fd = fd;
823         return 0;
824
825 fail:
826         if (fd >= 0)
827                 close_nointr_nofail(fd);
828
829         return r;
830 }
831
832 static int mq_address_create(
833                 const char *path,
834                 mode_t mq_mode,
835                 long maxmsg,
836                 long msgsize,
837                 int *_fd) {
838
839         int fd = -1, r = 0;
840         struct stat st;
841         mode_t old_mask;
842         struct mq_attr _attr, *attr = NULL;
843
844         assert(path);
845         assert(_fd);
846
847         if (maxmsg > 0 && msgsize > 0) {
848                 zero(_attr);
849                 _attr.mq_flags = O_NONBLOCK;
850                 _attr.mq_maxmsg = maxmsg;
851                 _attr.mq_msgsize = msgsize;
852                 attr = &_attr;
853         }
854
855         /* Enforce the right access mode for the mq */
856         old_mask = umask(~ mq_mode);
857
858         /* Include the original umask in our mask */
859         umask(~mq_mode | old_mask);
860
861         fd = mq_open(path, O_RDONLY|O_CLOEXEC|O_NONBLOCK|O_CREAT, mq_mode, attr);
862         umask(old_mask);
863
864         if (fd < 0) {
865                 r = -errno;
866                 goto fail;
867         }
868
869         if (fstat(fd, &st) < 0) {
870                 r = -errno;
871                 goto fail;
872         }
873
874         if ((st.st_mode & 0777) != (mq_mode & ~old_mask) ||
875             st.st_uid != getuid() ||
876             st.st_gid != getgid()) {
877
878                 r = -EEXIST;
879                 goto fail;
880         }
881
882         *_fd = fd;
883         return 0;
884
885 fail:
886         if (fd >= 0)
887                 close_nointr_nofail(fd);
888
889         return r;
890 }
891
892 static int socket_open_fds(Socket *s) {
893         SocketPort *p;
894         int r;
895         char *label = NULL;
896         bool know_label = false;
897
898         assert(s);
899
900         LIST_FOREACH(port, p, s->ports) {
901
902                 if (p->fd >= 0)
903                         continue;
904
905                 if (p->type == SOCKET_SOCKET) {
906
907                         if (!know_label) {
908
909                                 if ((r = socket_instantiate_service(s)) < 0)
910                                         return r;
911
912                                 if (UNIT_DEREF(s->service) &&
913                                     SERVICE(UNIT_DEREF(s->service))->exec_command[SERVICE_EXEC_START]) {
914                                         r = label_get_create_label_from_exe(SERVICE(UNIT_DEREF(s->service))->exec_command[SERVICE_EXEC_START]->path, &label);
915
916                                         if (r < 0) {
917                                                 if (r != -EPERM)
918                                                         return r;
919                                         }
920                                 }
921
922                                 know_label = true;
923                         }
924
925                         if ((r = socket_address_listen(
926                                              &p->address,
927                                              s->backlog,
928                                              s->bind_ipv6_only,
929                                              s->bind_to_device,
930                                              s->free_bind,
931                                              s->transparent,
932                                              s->directory_mode,
933                                              s->socket_mode,
934                                              label,
935                                              &p->fd)) < 0)
936                                 goto rollback;
937
938                         socket_apply_socket_options(s, p->fd);
939
940                 } else  if (p->type == SOCKET_SPECIAL) {
941
942                         if ((r = special_address_create(
943                                              p->path,
944                                              &p->fd)) < 0)
945                                 goto rollback;
946
947                 } else  if (p->type == SOCKET_FIFO) {
948
949                         if ((r = fifo_address_create(
950                                              p->path,
951                                              s->directory_mode,
952                                              s->socket_mode,
953                                              &p->fd)) < 0)
954                                 goto rollback;
955
956                         socket_apply_fifo_options(s, p->fd);
957                 } else if (p->type == SOCKET_MQUEUE) {
958
959                         if ((r = mq_address_create(
960                                              p->path,
961                                              s->socket_mode,
962                                              s->mq_maxmsg,
963                                              s->mq_msgsize,
964                                              &p->fd)) < 0)
965                                 goto rollback;
966                 } else
967                         assert_not_reached("Unknown port type");
968         }
969
970         label_free(label);
971         return 0;
972
973 rollback:
974         socket_close_fds(s);
975         label_free(label);
976         return r;
977 }
978
979 static void socket_unwatch_fds(Socket *s) {
980         SocketPort *p;
981
982         assert(s);
983
984         LIST_FOREACH(port, p, s->ports) {
985                 if (p->fd < 0)
986                         continue;
987
988                 unit_unwatch_fd(UNIT(s), &p->fd_watch);
989         }
990 }
991
992 static int socket_watch_fds(Socket *s) {
993         SocketPort *p;
994         int r;
995
996         assert(s);
997
998         LIST_FOREACH(port, p, s->ports) {
999                 if (p->fd < 0)
1000                         continue;
1001
1002                 p->fd_watch.socket_accept =
1003                         s->accept &&
1004                         p->type == SOCKET_SOCKET &&
1005                         socket_address_can_accept(&p->address);
1006
1007                 if ((r = unit_watch_fd(UNIT(s), p->fd, EPOLLIN, &p->fd_watch)) < 0)
1008                         goto fail;
1009         }
1010
1011         return 0;
1012
1013 fail:
1014         socket_unwatch_fds(s);
1015         return r;
1016 }
1017
1018 static void socket_set_state(Socket *s, SocketState state) {
1019         SocketState old_state;
1020         assert(s);
1021
1022         old_state = s->state;
1023         s->state = state;
1024
1025         if (state != SOCKET_START_PRE &&
1026             state != SOCKET_START_POST &&
1027             state != SOCKET_STOP_PRE &&
1028             state != SOCKET_STOP_PRE_SIGTERM &&
1029             state != SOCKET_STOP_PRE_SIGKILL &&
1030             state != SOCKET_STOP_POST &&
1031             state != SOCKET_FINAL_SIGTERM &&
1032             state != SOCKET_FINAL_SIGKILL) {
1033                 unit_unwatch_timer(UNIT(s), &s->timer_watch);
1034                 socket_unwatch_control_pid(s);
1035                 s->control_command = NULL;
1036                 s->control_command_id = _SOCKET_EXEC_COMMAND_INVALID;
1037         }
1038
1039         if (state != SOCKET_LISTENING)
1040                 socket_unwatch_fds(s);
1041
1042         if (state != SOCKET_START_POST &&
1043             state != SOCKET_LISTENING &&
1044             state != SOCKET_RUNNING &&
1045             state != SOCKET_STOP_PRE &&
1046             state != SOCKET_STOP_PRE_SIGTERM &&
1047             state != SOCKET_STOP_PRE_SIGKILL)
1048                 socket_close_fds(s);
1049
1050         if (state != old_state)
1051                 log_debug("%s changed %s -> %s",
1052                           UNIT(s)->id,
1053                           socket_state_to_string(old_state),
1054                           socket_state_to_string(state));
1055
1056         unit_notify(UNIT(s), state_translation_table[old_state], state_translation_table[state], true);
1057 }
1058
1059 static int socket_coldplug(Unit *u) {
1060         Socket *s = SOCKET(u);
1061         int r;
1062
1063         assert(s);
1064         assert(s->state == SOCKET_DEAD);
1065
1066         if (s->deserialized_state != s->state) {
1067
1068                 if (s->deserialized_state == SOCKET_START_PRE ||
1069                     s->deserialized_state == SOCKET_START_POST ||
1070                     s->deserialized_state == SOCKET_STOP_PRE ||
1071                     s->deserialized_state == SOCKET_STOP_PRE_SIGTERM ||
1072                     s->deserialized_state == SOCKET_STOP_PRE_SIGKILL ||
1073                     s->deserialized_state == SOCKET_STOP_POST ||
1074                     s->deserialized_state == SOCKET_FINAL_SIGTERM ||
1075                     s->deserialized_state == SOCKET_FINAL_SIGKILL) {
1076
1077                         if (s->control_pid <= 0)
1078                                 return -EBADMSG;
1079
1080                         if ((r = unit_watch_pid(UNIT(s), s->control_pid)) < 0)
1081                                 return r;
1082
1083                         if ((r = unit_watch_timer(UNIT(s), s->timeout_usec, &s->timer_watch)) < 0)
1084                                 return r;
1085                 }
1086
1087                 if (s->deserialized_state == SOCKET_START_POST ||
1088                     s->deserialized_state == SOCKET_LISTENING ||
1089                     s->deserialized_state == SOCKET_RUNNING ||
1090                     s->deserialized_state == SOCKET_STOP_PRE ||
1091                     s->deserialized_state == SOCKET_STOP_PRE_SIGTERM ||
1092                     s->deserialized_state == SOCKET_STOP_PRE_SIGKILL)
1093                         if ((r = socket_open_fds(s)) < 0)
1094                                 return r;
1095
1096                 if (s->deserialized_state == SOCKET_LISTENING)
1097                         if ((r = socket_watch_fds(s)) < 0)
1098                                 return r;
1099
1100                 socket_set_state(s, s->deserialized_state);
1101         }
1102
1103         return 0;
1104 }
1105
1106 static int socket_spawn(Socket *s, ExecCommand *c, pid_t *_pid) {
1107         pid_t pid;
1108         int r;
1109         char **argv;
1110
1111         assert(s);
1112         assert(c);
1113         assert(_pid);
1114
1115         if ((r = unit_watch_timer(UNIT(s), s->timeout_usec, &s->timer_watch)) < 0)
1116                 goto fail;
1117
1118         if (!(argv = unit_full_printf_strv(UNIT(s), c->argv))) {
1119                 r = -ENOMEM;
1120                 goto fail;
1121         }
1122
1123         r = exec_spawn(c,
1124                        argv,
1125                        &s->exec_context,
1126                        NULL, 0,
1127                        UNIT(s)->manager->environment,
1128                        true,
1129                        true,
1130                        true,
1131                        UNIT(s)->manager->confirm_spawn,
1132                        UNIT(s)->cgroup_bondings,
1133                        UNIT(s)->cgroup_attributes,
1134                        &pid);
1135
1136         strv_free(argv);
1137         if (r < 0)
1138                 goto fail;
1139
1140         if ((r = unit_watch_pid(UNIT(s), pid)) < 0)
1141                 /* FIXME: we need to do something here */
1142                 goto fail;
1143
1144         *_pid = pid;
1145
1146         return 0;
1147
1148 fail:
1149         unit_unwatch_timer(UNIT(s), &s->timer_watch);
1150
1151         return r;
1152 }
1153
1154 static void socket_enter_dead(Socket *s, bool success) {
1155         assert(s);
1156
1157         if (!success)
1158                 s->failure = true;
1159
1160         socket_set_state(s, s->failure ? SOCKET_FAILED : SOCKET_DEAD);
1161 }
1162
1163 static void socket_enter_signal(Socket *s, SocketState state, bool success);
1164
1165 static void socket_enter_stop_post(Socket *s, bool success) {
1166         int r;
1167         assert(s);
1168
1169         if (!success)
1170                 s->failure = true;
1171
1172         socket_unwatch_control_pid(s);
1173
1174         s->control_command_id = SOCKET_EXEC_STOP_POST;
1175
1176         if ((s->control_command = s->exec_command[SOCKET_EXEC_STOP_POST])) {
1177                 if ((r = socket_spawn(s, s->control_command, &s->control_pid)) < 0)
1178                         goto fail;
1179
1180                 socket_set_state(s, SOCKET_STOP_POST);
1181         } else
1182                 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, true);
1183
1184         return;
1185
1186 fail:
1187         log_warning("%s failed to run 'stop-post' task: %s", UNIT(s)->id, strerror(-r));
1188         socket_enter_signal(s, SOCKET_FINAL_SIGTERM, false);
1189 }
1190
1191 static void socket_enter_signal(Socket *s, SocketState state, bool success) {
1192         int r;
1193         Set *pid_set = NULL;
1194         bool wait_for_exit = false;
1195
1196         assert(s);
1197
1198         if (!success)
1199                 s->failure = true;
1200
1201         if (s->exec_context.kill_mode != KILL_NONE) {
1202                 int sig = (state == SOCKET_STOP_PRE_SIGTERM || state == SOCKET_FINAL_SIGTERM) ? s->exec_context.kill_signal : SIGKILL;
1203
1204                 if (s->control_pid > 0) {
1205                         if (kill_and_sigcont(s->control_pid, sig) < 0 && errno != ESRCH)
1206
1207                                 log_warning("Failed to kill control process %li: %m", (long) s->control_pid);
1208                         else
1209                                 wait_for_exit = true;
1210                 }
1211
1212                 if (s->exec_context.kill_mode == KILL_CONTROL_GROUP) {
1213
1214                         if (!(pid_set = set_new(trivial_hash_func, trivial_compare_func))) {
1215                                 r = -ENOMEM;
1216                                 goto fail;
1217                         }
1218
1219                         /* Exclude the control pid from being killed via the cgroup */
1220                         if (s->control_pid > 0)
1221                                 if ((r = set_put(pid_set, LONG_TO_PTR(s->control_pid))) < 0)
1222                                         goto fail;
1223
1224                         if ((r = cgroup_bonding_kill_list(UNIT(s)->cgroup_bondings, sig, true, pid_set)) < 0) {
1225                                 if (r != -EAGAIN && r != -ESRCH && r != -ENOENT)
1226                                         log_warning("Failed to kill control group: %s", strerror(-r));
1227                         } else if (r > 0)
1228                                 wait_for_exit = true;
1229
1230                         set_free(pid_set);
1231                         pid_set = NULL;
1232                 }
1233         }
1234
1235         if (wait_for_exit) {
1236                 if ((r = unit_watch_timer(UNIT(s), s->timeout_usec, &s->timer_watch)) < 0)
1237                         goto fail;
1238
1239                 socket_set_state(s, state);
1240         } else if (state == SOCKET_STOP_PRE_SIGTERM || state == SOCKET_STOP_PRE_SIGKILL)
1241                 socket_enter_stop_post(s, true);
1242         else
1243                 socket_enter_dead(s, true);
1244
1245         return;
1246
1247 fail:
1248         log_warning("%s failed to kill processes: %s", UNIT(s)->id, strerror(-r));
1249
1250         if (state == SOCKET_STOP_PRE_SIGTERM || state == SOCKET_STOP_PRE_SIGKILL)
1251                 socket_enter_stop_post(s, false);
1252         else
1253                 socket_enter_dead(s, false);
1254
1255         if (pid_set)
1256                 set_free(pid_set);
1257 }
1258
1259 static void socket_enter_stop_pre(Socket *s, bool success) {
1260         int r;
1261         assert(s);
1262
1263         if (!success)
1264                 s->failure = true;
1265
1266         socket_unwatch_control_pid(s);
1267
1268         s->control_command_id = SOCKET_EXEC_STOP_PRE;
1269
1270         if ((s->control_command = s->exec_command[SOCKET_EXEC_STOP_PRE])) {
1271                 if ((r = socket_spawn(s, s->control_command, &s->control_pid)) < 0)
1272                         goto fail;
1273
1274                 socket_set_state(s, SOCKET_STOP_PRE);
1275         } else
1276                 socket_enter_stop_post(s, true);
1277
1278         return;
1279
1280 fail:
1281         log_warning("%s failed to run 'stop-pre' task: %s", UNIT(s)->id, strerror(-r));
1282         socket_enter_stop_post(s, false);
1283 }
1284
1285 static void socket_enter_listening(Socket *s) {
1286         int r;
1287         assert(s);
1288
1289         if ((r = socket_watch_fds(s)) < 0) {
1290                 log_warning("%s failed to watch sockets: %s", UNIT(s)->id, strerror(-r));
1291                 goto fail;
1292         }
1293
1294         socket_set_state(s, SOCKET_LISTENING);
1295         return;
1296
1297 fail:
1298         socket_enter_stop_pre(s, false);
1299 }
1300
1301 static void socket_enter_start_post(Socket *s) {
1302         int r;
1303         assert(s);
1304
1305         if ((r = socket_open_fds(s)) < 0) {
1306                 log_warning("%s failed to listen on sockets: %s", UNIT(s)->id, strerror(-r));
1307                 goto fail;
1308         }
1309
1310         socket_unwatch_control_pid(s);
1311
1312         s->control_command_id = SOCKET_EXEC_START_POST;
1313
1314         if ((s->control_command = s->exec_command[SOCKET_EXEC_START_POST])) {
1315                 if ((r = socket_spawn(s, s->control_command, &s->control_pid)) < 0) {
1316                         log_warning("%s failed to run 'start-post' task: %s", UNIT(s)->id, strerror(-r));
1317                         goto fail;
1318                 }
1319
1320                 socket_set_state(s, SOCKET_START_POST);
1321         } else
1322                 socket_enter_listening(s);
1323
1324         return;
1325
1326 fail:
1327         socket_enter_stop_pre(s, false);
1328 }
1329
1330 static void socket_enter_start_pre(Socket *s) {
1331         int r;
1332         assert(s);
1333
1334         socket_unwatch_control_pid(s);
1335
1336         s->control_command_id = SOCKET_EXEC_START_PRE;
1337
1338         if ((s->control_command = s->exec_command[SOCKET_EXEC_START_PRE])) {
1339                 if ((r = socket_spawn(s, s->control_command, &s->control_pid)) < 0)
1340                         goto fail;
1341
1342                 socket_set_state(s, SOCKET_START_PRE);
1343         } else
1344                 socket_enter_start_post(s);
1345
1346         return;
1347
1348 fail:
1349         log_warning("%s failed to run 'start-pre' task: %s", UNIT(s)->id, strerror(-r));
1350         socket_enter_dead(s, false);
1351 }
1352
1353 static void socket_enter_running(Socket *s, int cfd) {
1354         int r;
1355         DBusError error;
1356
1357         assert(s);
1358         dbus_error_init(&error);
1359
1360         /* We don't take connections anymore if we are supposed to
1361          * shut down anyway */
1362         if (unit_pending_inactive(UNIT(s))) {
1363                 log_debug("Suppressing connection request on %s since unit stop is scheduled.", UNIT(s)->id);
1364
1365                 if (cfd >= 0)
1366                         close_nointr_nofail(cfd);
1367                 else  {
1368                         /* Flush all sockets by closing and reopening them */
1369                         socket_close_fds(s);
1370
1371                         r = socket_watch_fds(s);
1372                         if (r < 0) {
1373                                 log_warning("%s failed to watch sockets: %s", UNIT(s)->id, strerror(-r));
1374                                 socket_enter_stop_pre(s, false);
1375                         }
1376                 }
1377
1378                 return;
1379         }
1380
1381         if (cfd < 0) {
1382                 Iterator i;
1383                 Unit *u;
1384                 bool pending = false;
1385
1386                 /* If there's already a start pending don't bother to
1387                  * do anything */
1388                 SET_FOREACH(u, UNIT(s)->dependencies[UNIT_TRIGGERS], i)
1389                         if (unit_pending_active(u)) {
1390                                 pending = true;
1391                                 break;
1392                         }
1393
1394                 if (!pending) {
1395                         r = manager_add_job(UNIT(s)->manager, JOB_START, UNIT_DEREF(s->service), JOB_REPLACE, true, &error, NULL);
1396                         if (r < 0)
1397                                 goto fail;
1398                 }
1399
1400                 socket_set_state(s, SOCKET_RUNNING);
1401         } else {
1402                 char *prefix, *instance = NULL, *name;
1403                 Service *service;
1404
1405                 if (s->n_connections >= s->max_connections) {
1406                         log_warning("Too many incoming connections (%u)", s->n_connections);
1407                         close_nointr_nofail(cfd);
1408                         return;
1409                 }
1410
1411                 r = socket_instantiate_service(s);
1412                 if (r < 0)
1413                         goto fail;
1414
1415                 r = instance_from_socket(cfd, s->n_accepted, &instance);
1416                 if (r < 0) {
1417                         if (r != -ENOTCONN)
1418                                 goto fail;
1419
1420                         /* ENOTCONN is legitimate if TCP RST was received.
1421                          * This connection is over, but the socket unit lives on. */
1422                         close_nointr_nofail(cfd);
1423                         return;
1424                 }
1425
1426                 prefix = unit_name_to_prefix(UNIT(s)->id);
1427                 if (!prefix) {
1428                         free(instance);
1429                         r = -ENOMEM;
1430                         goto fail;
1431                 }
1432
1433                 name = unit_name_build(prefix, instance, ".service");
1434                 free(prefix);
1435                 free(instance);
1436
1437                 if (!name) {
1438                         r = -ENOMEM;
1439                         goto fail;
1440                 }
1441
1442                 r = unit_add_name(UNIT_DEREF(s->service), name);
1443                 if (r < 0) {
1444                         free(name);
1445                         goto fail;
1446                 }
1447
1448                 service = SERVICE(UNIT_DEREF(s->service));
1449                 unit_ref_unset(&s->service);
1450                 s->n_accepted ++;
1451
1452                 UNIT(service)->no_gc = false;
1453
1454                 unit_choose_id(UNIT(service), name);
1455                 free(name);
1456
1457                 r = service_set_socket_fd(service, cfd, s);
1458                 if (r < 0)
1459                         goto fail;
1460
1461                 cfd = -1;
1462                 s->n_connections ++;
1463
1464                 r = manager_add_job(UNIT(s)->manager, JOB_START, UNIT(service), JOB_REPLACE, true, &error, NULL);
1465                 if (r < 0)
1466                         goto fail;
1467
1468                 /* Notify clients about changed counters */
1469                 unit_add_to_dbus_queue(UNIT(s));
1470         }
1471
1472         return;
1473
1474 fail:
1475         log_warning("%s failed to queue socket startup job: %s", UNIT(s)->id, bus_error(&error, r));
1476         socket_enter_stop_pre(s, false);
1477
1478         if (cfd >= 0)
1479                 close_nointr_nofail(cfd);
1480
1481         dbus_error_free(&error);
1482 }
1483
1484 static void socket_run_next(Socket *s, bool success) {
1485         int r;
1486
1487         assert(s);
1488         assert(s->control_command);
1489         assert(s->control_command->command_next);
1490
1491         if (!success)
1492                 s->failure = true;
1493
1494         socket_unwatch_control_pid(s);
1495
1496         s->control_command = s->control_command->command_next;
1497
1498         if ((r = socket_spawn(s, s->control_command, &s->control_pid)) < 0)
1499                 goto fail;
1500
1501         return;
1502
1503 fail:
1504         log_warning("%s failed to run next task: %s", UNIT(s)->id, strerror(-r));
1505
1506         if (s->state == SOCKET_START_POST)
1507                 socket_enter_stop_pre(s, false);
1508         else if (s->state == SOCKET_STOP_POST)
1509                 socket_enter_dead(s, false);
1510         else
1511                 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, false);
1512 }
1513
1514 static int socket_start(Unit *u) {
1515         Socket *s = SOCKET(u);
1516
1517         assert(s);
1518
1519         /* We cannot fulfill this request right now, try again later
1520          * please! */
1521         if (s->state == SOCKET_STOP_PRE ||
1522             s->state == SOCKET_STOP_PRE_SIGKILL ||
1523             s->state == SOCKET_STOP_PRE_SIGTERM ||
1524             s->state == SOCKET_STOP_POST ||
1525             s->state == SOCKET_FINAL_SIGTERM ||
1526             s->state == SOCKET_FINAL_SIGKILL)
1527                 return -EAGAIN;
1528
1529         if (s->state == SOCKET_START_PRE ||
1530             s->state == SOCKET_START_POST)
1531                 return 0;
1532
1533         /* Cannot run this without the service being around */
1534         if (UNIT_DEREF(s->service)) {
1535                 Service *service;
1536
1537                 service = SERVICE(UNIT_DEREF(s->service));
1538
1539                 if (UNIT(service)->load_state != UNIT_LOADED) {
1540                         log_error("Socket service %s not loaded, refusing.", UNIT(service)->id);
1541                         return -ENOENT;
1542                 }
1543
1544                 /* If the service is already active we cannot start the
1545                  * socket */
1546                 if (service->state != SERVICE_DEAD &&
1547                     service->state != SERVICE_FAILED &&
1548                     service->state != SERVICE_AUTO_RESTART) {
1549                         log_error("Socket service %s already active, refusing.", UNIT(service)->id);
1550                         return -EBUSY;
1551                 }
1552
1553 #ifdef HAVE_SYSV_COMPAT
1554                 if (service->sysv_path) {
1555                         log_error("Using SysV services for socket activation is not supported. Refusing.");
1556                         return -ENOENT;
1557                 }
1558 #endif
1559         }
1560
1561         assert(s->state == SOCKET_DEAD || s->state == SOCKET_FAILED);
1562
1563         s->failure = false;
1564         socket_enter_start_pre(s);
1565         return 0;
1566 }
1567
1568 static int socket_stop(Unit *u) {
1569         Socket *s = SOCKET(u);
1570
1571         assert(s);
1572
1573         /* Already on it */
1574         if (s->state == SOCKET_STOP_PRE ||
1575             s->state == SOCKET_STOP_PRE_SIGTERM ||
1576             s->state == SOCKET_STOP_PRE_SIGKILL ||
1577             s->state == SOCKET_STOP_POST ||
1578             s->state == SOCKET_FINAL_SIGTERM ||
1579             s->state == SOCKET_FINAL_SIGKILL)
1580                 return 0;
1581
1582         /* If there's already something running we go directly into
1583          * kill mode. */
1584         if (s->state == SOCKET_START_PRE ||
1585             s->state == SOCKET_START_POST) {
1586                 socket_enter_signal(s, SOCKET_STOP_PRE_SIGTERM, true);
1587                 return -EAGAIN;
1588         }
1589
1590         assert(s->state == SOCKET_LISTENING || s->state == SOCKET_RUNNING);
1591
1592         socket_enter_stop_pre(s, true);
1593         return 0;
1594 }
1595
1596 static int socket_serialize(Unit *u, FILE *f, FDSet *fds) {
1597         Socket *s = SOCKET(u);
1598         SocketPort *p;
1599         int r;
1600
1601         assert(u);
1602         assert(f);
1603         assert(fds);
1604
1605         unit_serialize_item(u, f, "state", socket_state_to_string(s->state));
1606         unit_serialize_item(u, f, "failure", yes_no(s->failure));
1607         unit_serialize_item_format(u, f, "n-accepted", "%u", s->n_accepted);
1608
1609         if (s->control_pid > 0)
1610                 unit_serialize_item_format(u, f, "control-pid", "%lu", (unsigned long) s->control_pid);
1611
1612         if (s->control_command_id >= 0)
1613                 unit_serialize_item(u, f, "control-command", socket_exec_command_to_string(s->control_command_id));
1614
1615         LIST_FOREACH(port, p, s->ports) {
1616                 int copy;
1617
1618                 if (p->fd < 0)
1619                         continue;
1620
1621                 if ((copy = fdset_put_dup(fds, p->fd)) < 0)
1622                         return copy;
1623
1624                 if (p->type == SOCKET_SOCKET) {
1625                         char *t;
1626
1627                         if ((r = socket_address_print(&p->address, &t)) < 0)
1628                                 return r;
1629
1630                         if (socket_address_family(&p->address) == AF_NETLINK)
1631                                 unit_serialize_item_format(u, f, "netlink", "%i %s", copy, t);
1632                         else
1633                                 unit_serialize_item_format(u, f, "socket", "%i %i %s", copy, p->address.type, t);
1634                         free(t);
1635                 } else if (p->type == SOCKET_SPECIAL)
1636                         unit_serialize_item_format(u, f, "special", "%i %s", copy, p->path);
1637                 else {
1638                         assert(p->type == SOCKET_FIFO);
1639                         unit_serialize_item_format(u, f, "fifo", "%i %s", copy, p->path);
1640                 }
1641         }
1642
1643         return 0;
1644 }
1645
1646 static int socket_deserialize_item(Unit *u, const char *key, const char *value, FDSet *fds) {
1647         Socket *s = SOCKET(u);
1648
1649         assert(u);
1650         assert(key);
1651         assert(value);
1652         assert(fds);
1653
1654         if (streq(key, "state")) {
1655                 SocketState state;
1656
1657                 if ((state = socket_state_from_string(value)) < 0)
1658                         log_debug("Failed to parse state value %s", value);
1659                 else
1660                         s->deserialized_state = state;
1661         } else if (streq(key, "failure")) {
1662                 int b;
1663
1664                 if ((b = parse_boolean(value)) < 0)
1665                         log_debug("Failed to parse failure value %s", value);
1666                 else
1667                         s->failure = b || s->failure;
1668
1669         } else if (streq(key, "n-accepted")) {
1670                 unsigned k;
1671
1672                 if (safe_atou(value, &k) < 0)
1673                         log_debug("Failed to parse n-accepted value %s", value);
1674                 else
1675                         s->n_accepted += k;
1676         } else if (streq(key, "control-pid")) {
1677                 pid_t pid;
1678
1679                 if (parse_pid(value, &pid) < 0)
1680                         log_debug("Failed to parse control-pid value %s", value);
1681                 else
1682                         s->control_pid = pid;
1683         } else if (streq(key, "control-command")) {
1684                 SocketExecCommand id;
1685
1686                 if ((id = socket_exec_command_from_string(value)) < 0)
1687                         log_debug("Failed to parse exec-command value %s", value);
1688                 else {
1689                         s->control_command_id = id;
1690                         s->control_command = s->exec_command[id];
1691                 }
1692         } else if (streq(key, "fifo")) {
1693                 int fd, skip = 0;
1694                 SocketPort *p;
1695
1696                 if (sscanf(value, "%i %n", &fd, &skip) < 1 || fd < 0 || !fdset_contains(fds, fd))
1697                         log_debug("Failed to parse fifo value %s", value);
1698                 else {
1699
1700                         LIST_FOREACH(port, p, s->ports)
1701                                 if (p->type == SOCKET_FIFO &&
1702                                     streq_ptr(p->path, value+skip))
1703                                         break;
1704
1705                         if (p) {
1706                                 if (p->fd >= 0)
1707                                         close_nointr_nofail(p->fd);
1708                                 p->fd = fdset_remove(fds, fd);
1709                         }
1710                 }
1711
1712         } else if (streq(key, "special")) {
1713                 int fd, skip = 0;
1714                 SocketPort *p;
1715
1716                 if (sscanf(value, "%i %n", &fd, &skip) < 1 || fd < 0 || !fdset_contains(fds, fd))
1717                         log_debug("Failed to parse special value %s", value);
1718                 else {
1719
1720                         LIST_FOREACH(port, p, s->ports)
1721                                 if (p->type == SOCKET_SPECIAL &&
1722                                     streq_ptr(p->path, value+skip))
1723                                         break;
1724
1725                         if (p) {
1726                                 if (p->fd >= 0)
1727                                         close_nointr_nofail(p->fd);
1728                                 p->fd = fdset_remove(fds, fd);
1729                         }
1730                 }
1731
1732         } else if (streq(key, "socket")) {
1733                 int fd, type, skip = 0;
1734                 SocketPort *p;
1735
1736                 if (sscanf(value, "%i %i %n", &fd, &type, &skip) < 2 || fd < 0 || type < 0 || !fdset_contains(fds, fd))
1737                         log_debug("Failed to parse socket value %s", value);
1738                 else {
1739
1740                         LIST_FOREACH(port, p, s->ports)
1741                                 if (socket_address_is(&p->address, value+skip, type))
1742                                         break;
1743
1744                         if (p) {
1745                                 if (p->fd >= 0)
1746                                         close_nointr_nofail(p->fd);
1747                                 p->fd = fdset_remove(fds, fd);
1748                         }
1749                 }
1750
1751         } else if (streq(key, "netlink")) {
1752                 int fd, skip = 0;
1753                 SocketPort *p;
1754
1755                 if (sscanf(value, "%i %n", &fd, &skip) < 1 || fd < 0 || !fdset_contains(fds, fd))
1756                         log_debug("Failed to parse socket value %s", value);
1757                 else {
1758
1759                         LIST_FOREACH(port, p, s->ports)
1760                                 if (socket_address_is_netlink(&p->address, value+skip))
1761                                         break;
1762
1763                         if (p) {
1764                                 if (p->fd >= 0)
1765                                         close_nointr_nofail(p->fd);
1766                                 p->fd = fdset_remove(fds, fd);
1767                         }
1768                 }
1769
1770         } else
1771                 log_debug("Unknown serialization key '%s'", key);
1772
1773         return 0;
1774 }
1775
1776 static UnitActiveState socket_active_state(Unit *u) {
1777         assert(u);
1778
1779         return state_translation_table[SOCKET(u)->state];
1780 }
1781
1782 static const char *socket_sub_state_to_string(Unit *u) {
1783         assert(u);
1784
1785         return socket_state_to_string(SOCKET(u)->state);
1786 }
1787
1788 static bool socket_check_gc(Unit *u) {
1789         Socket *s = SOCKET(u);
1790
1791         assert(u);
1792
1793         return s->n_connections > 0;
1794 }
1795
1796 static void socket_fd_event(Unit *u, int fd, uint32_t events, Watch *w) {
1797         Socket *s = SOCKET(u);
1798         int cfd = -1;
1799
1800         assert(s);
1801         assert(fd >= 0);
1802
1803         if (s->state != SOCKET_LISTENING)
1804                 return;
1805
1806         log_debug("Incoming traffic on %s", u->id);
1807
1808         if (events != EPOLLIN) {
1809
1810                 if (events & EPOLLHUP)
1811                         log_error("%s: Got POLLHUP on a listening socket. The service probably invoked shutdown() on it, and should better not do that.", u->id);
1812                 else
1813                         log_error("%s: Got unexpected poll event (0x%x) on socket.", u->id, events);
1814
1815                 goto fail;
1816         }
1817
1818         if (w->socket_accept) {
1819                 for (;;) {
1820
1821                         if ((cfd = accept4(fd, NULL, NULL, SOCK_NONBLOCK)) < 0) {
1822
1823                                 if (errno == EINTR)
1824                                         continue;
1825
1826                                 log_error("Failed to accept socket: %m");
1827                                 goto fail;
1828                         }
1829
1830                         break;
1831                 }
1832
1833                 socket_apply_socket_options(s, cfd);
1834         }
1835
1836         socket_enter_running(s, cfd);
1837         return;
1838
1839 fail:
1840         socket_enter_stop_pre(s, false);
1841 }
1842
1843 static void socket_sigchld_event(Unit *u, pid_t pid, int code, int status) {
1844         Socket *s = SOCKET(u);
1845         bool success;
1846
1847         assert(s);
1848         assert(pid >= 0);
1849
1850         if (pid != s->control_pid)
1851                 return;
1852
1853         s->control_pid = 0;
1854
1855         success = is_clean_exit(code, status);
1856
1857         if (s->control_command) {
1858                 exec_status_exit(&s->control_command->exec_status, &s->exec_context, pid, code, status);
1859
1860                 if (s->control_command->ignore)
1861                         success = true;
1862         }
1863
1864         log_full(success ? LOG_DEBUG : LOG_NOTICE,
1865                  "%s control process exited, code=%s status=%i", u->id, sigchld_code_to_string(code), status);
1866         s->failure = s->failure || !success;
1867
1868         if (s->control_command && s->control_command->command_next && success) {
1869                 log_debug("%s running next command for state %s", u->id, socket_state_to_string(s->state));
1870                 socket_run_next(s, success);
1871         } else {
1872                 s->control_command = NULL;
1873                 s->control_command_id = _SOCKET_EXEC_COMMAND_INVALID;
1874
1875                 /* No further commands for this step, so let's figure
1876                  * out what to do next */
1877
1878                 log_debug("%s got final SIGCHLD for state %s", u->id, socket_state_to_string(s->state));
1879
1880                 switch (s->state) {
1881
1882                 case SOCKET_START_PRE:
1883                         if (success)
1884                                 socket_enter_start_post(s);
1885                         else
1886                                 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, false);
1887                         break;
1888
1889                 case SOCKET_START_POST:
1890                         if (success)
1891                                 socket_enter_listening(s);
1892                         else
1893                                 socket_enter_stop_pre(s, false);
1894                         break;
1895
1896                 case SOCKET_STOP_PRE:
1897                 case SOCKET_STOP_PRE_SIGTERM:
1898                 case SOCKET_STOP_PRE_SIGKILL:
1899                         socket_enter_stop_post(s, success);
1900                         break;
1901
1902                 case SOCKET_STOP_POST:
1903                 case SOCKET_FINAL_SIGTERM:
1904                 case SOCKET_FINAL_SIGKILL:
1905                         socket_enter_dead(s, success);
1906                         break;
1907
1908                 default:
1909                         assert_not_reached("Uh, control process died at wrong time.");
1910                 }
1911         }
1912
1913         /* Notify clients about changed exit status */
1914         unit_add_to_dbus_queue(u);
1915 }
1916
1917 static void socket_timer_event(Unit *u, uint64_t elapsed, Watch *w) {
1918         Socket *s = SOCKET(u);
1919
1920         assert(s);
1921         assert(elapsed == 1);
1922         assert(w == &s->timer_watch);
1923
1924         switch (s->state) {
1925
1926         case SOCKET_START_PRE:
1927                 log_warning("%s starting timed out. Terminating.", u->id);
1928                 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, false);
1929                 break;
1930
1931         case SOCKET_START_POST:
1932                 log_warning("%s starting timed out. Stopping.", u->id);
1933                 socket_enter_stop_pre(s, false);
1934                 break;
1935
1936         case SOCKET_STOP_PRE:
1937                 log_warning("%s stopping timed out. Terminating.", u->id);
1938                 socket_enter_signal(s, SOCKET_STOP_PRE_SIGTERM, false);
1939                 break;
1940
1941         case SOCKET_STOP_PRE_SIGTERM:
1942                 if (s->exec_context.send_sigkill) {
1943                         log_warning("%s stopping timed out. Killing.", u->id);
1944                         socket_enter_signal(s, SOCKET_STOP_PRE_SIGKILL, false);
1945                 } else {
1946                         log_warning("%s stopping timed out. Skipping SIGKILL. Ignoring.", u->id);
1947                         socket_enter_stop_post(s, false);
1948                 }
1949                 break;
1950
1951         case SOCKET_STOP_PRE_SIGKILL:
1952                 log_warning("%s still around after SIGKILL. Ignoring.", u->id);
1953                 socket_enter_stop_post(s, false);
1954                 break;
1955
1956         case SOCKET_STOP_POST:
1957                 log_warning("%s stopping timed out (2). Terminating.", u->id);
1958                 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, false);
1959                 break;
1960
1961         case SOCKET_FINAL_SIGTERM:
1962                 if (s->exec_context.send_sigkill) {
1963                         log_warning("%s stopping timed out (2). Killing.", u->id);
1964                         socket_enter_signal(s, SOCKET_FINAL_SIGKILL, false);
1965                 } else {
1966                         log_warning("%s stopping timed out (2). Skipping SIGKILL. Ignoring.", u->id);
1967                         socket_enter_dead(s, false);
1968                 }
1969                 break;
1970
1971         case SOCKET_FINAL_SIGKILL:
1972                 log_warning("%s still around after SIGKILL (2). Entering failed mode.", u->id);
1973                 socket_enter_dead(s, false);
1974                 break;
1975
1976         default:
1977                 assert_not_reached("Timeout at wrong time.");
1978         }
1979 }
1980
1981 int socket_collect_fds(Socket *s, int **fds, unsigned *n_fds) {
1982         int *rfds;
1983         unsigned rn_fds, k;
1984         SocketPort *p;
1985
1986         assert(s);
1987         assert(fds);
1988         assert(n_fds);
1989
1990         /* Called from the service code for requesting our fds */
1991
1992         rn_fds = 0;
1993         LIST_FOREACH(port, p, s->ports)
1994                 if (p->fd >= 0)
1995                         rn_fds++;
1996
1997         if (rn_fds <= 0) {
1998                 *fds = NULL;
1999                 *n_fds = 0;
2000                 return 0;
2001         }
2002
2003         if (!(rfds = new(int, rn_fds)))
2004                 return -ENOMEM;
2005
2006         k = 0;
2007         LIST_FOREACH(port, p, s->ports)
2008                 if (p->fd >= 0)
2009                         rfds[k++] = p->fd;
2010
2011         assert(k == rn_fds);
2012
2013         *fds = rfds;
2014         *n_fds = rn_fds;
2015
2016         return 0;
2017 }
2018
2019 void socket_notify_service_dead(Socket *s) {
2020         assert(s);
2021
2022         /* The service is dead. Dang!
2023          *
2024          * This is strictly for one-instance-for-all-connections
2025          * services. */
2026
2027         if (s->state == SOCKET_RUNNING) {
2028                 log_debug("%s got notified about service death.", UNIT(s)->id);
2029                 socket_enter_listening(s);
2030         }
2031 }
2032
2033 void socket_connection_unref(Socket *s) {
2034         assert(s);
2035
2036         /* The service is dead. Yay!
2037          *
2038          * This is strictly for one-instance-per-connection
2039          * services. */
2040
2041         assert(s->n_connections > 0);
2042         s->n_connections--;
2043
2044         log_debug("%s: One connection closed, %u left.", UNIT(s)->id, s->n_connections);
2045 }
2046
2047 static void socket_reset_failed(Unit *u) {
2048         Socket *s = SOCKET(u);
2049
2050         assert(s);
2051
2052         if (s->state == SOCKET_FAILED)
2053                 socket_set_state(s, SOCKET_DEAD);
2054
2055         s->failure = false;
2056 }
2057
2058 static int socket_kill(Unit *u, KillWho who, KillMode mode, int signo, DBusError *error) {
2059         Socket *s = SOCKET(u);
2060         int r = 0;
2061         Set *pid_set = NULL;
2062
2063         assert(s);
2064
2065         if (who == KILL_MAIN) {
2066                 dbus_set_error(error, BUS_ERROR_NO_SUCH_PROCESS, "Socket units have no main processes");
2067                 return -ESRCH;
2068         }
2069
2070         if (s->control_pid <= 0 && who == KILL_CONTROL) {
2071                 dbus_set_error(error, BUS_ERROR_NO_SUCH_PROCESS, "No control process to kill");
2072                 return -ESRCH;
2073         }
2074
2075         if (who == KILL_CONTROL || who == KILL_ALL)
2076                 if (s->control_pid > 0)
2077                         if (kill(s->control_pid, signo) < 0)
2078                                 r = -errno;
2079
2080         if (who == KILL_ALL && mode == KILL_CONTROL_GROUP) {
2081                 int q;
2082
2083                 if (!(pid_set = set_new(trivial_hash_func, trivial_compare_func)))
2084                         return -ENOMEM;
2085
2086                 /* Exclude the control pid from being killed via the cgroup */
2087                 if (s->control_pid > 0)
2088                         if ((q = set_put(pid_set, LONG_TO_PTR(s->control_pid))) < 0) {
2089                                 r = q;
2090                                 goto finish;
2091                         }
2092
2093                 if ((q = cgroup_bonding_kill_list(UNIT(s)->cgroup_bondings, signo, false, pid_set)) < 0)
2094                         if (q != -EAGAIN && q != -ESRCH && q != -ENOENT)
2095                                 r = q;
2096         }
2097
2098 finish:
2099         if (pid_set)
2100                 set_free(pid_set);
2101
2102         return r;
2103 }
2104
2105 static const char* const socket_state_table[_SOCKET_STATE_MAX] = {
2106         [SOCKET_DEAD] = "dead",
2107         [SOCKET_START_PRE] = "start-pre",
2108         [SOCKET_START_POST] = "start-post",
2109         [SOCKET_LISTENING] = "listening",
2110         [SOCKET_RUNNING] = "running",
2111         [SOCKET_STOP_PRE] = "stop-pre",
2112         [SOCKET_STOP_PRE_SIGTERM] = "stop-pre-sigterm",
2113         [SOCKET_STOP_PRE_SIGKILL] = "stop-pre-sigkill",
2114         [SOCKET_STOP_POST] = "stop-post",
2115         [SOCKET_FINAL_SIGTERM] = "final-sigterm",
2116         [SOCKET_FINAL_SIGKILL] = "final-sigkill",
2117         [SOCKET_FAILED] = "failed"
2118 };
2119
2120 DEFINE_STRING_TABLE_LOOKUP(socket_state, SocketState);
2121
2122 static const char* const socket_exec_command_table[_SOCKET_EXEC_COMMAND_MAX] = {
2123         [SOCKET_EXEC_START_PRE] = "StartPre",
2124         [SOCKET_EXEC_START_POST] = "StartPost",
2125         [SOCKET_EXEC_STOP_PRE] = "StopPre",
2126         [SOCKET_EXEC_STOP_POST] = "StopPost"
2127 };
2128
2129 DEFINE_STRING_TABLE_LOOKUP(socket_exec_command, SocketExecCommand);
2130
2131 const UnitVTable socket_vtable = {
2132         .suffix = ".socket",
2133         .object_size = sizeof(Socket),
2134         .sections =
2135                 "Unit\0"
2136                 "Socket\0"
2137                 "Install\0",
2138
2139         .init = socket_init,
2140         .done = socket_done,
2141         .load = socket_load,
2142
2143         .kill = socket_kill,
2144
2145         .coldplug = socket_coldplug,
2146
2147         .dump = socket_dump,
2148
2149         .start = socket_start,
2150         .stop = socket_stop,
2151
2152         .serialize = socket_serialize,
2153         .deserialize_item = socket_deserialize_item,
2154
2155         .active_state = socket_active_state,
2156         .sub_state_to_string = socket_sub_state_to_string,
2157
2158         .check_gc = socket_check_gc,
2159
2160         .fd_event = socket_fd_event,
2161         .sigchld_event = socket_sigchld_event,
2162         .timer_event = socket_timer_event,
2163
2164         .reset_failed = socket_reset_failed,
2165
2166         .bus_interface = "org.freedesktop.systemd1.Socket",
2167         .bus_message_handler = bus_socket_message_handler,
2168         .bus_invalidating_properties =  bus_socket_invalidating_properties
2169 };