/* ISC license. */ #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include "defaults.h" #include "initctl.h" #define STAGE4_FILE "stage 4" #define SCANPREFIX SCANDIRFULL "/" #define SCANPREFIXLEN (sizeof(SCANPREFIX) - 1) #define DOTPREFIX ".s6-linux-init-shutdownd:" #define DOTPREFIXLEN (sizeof(DOTPREFIX) - 1) #define DOTSUFFIX ":XXXXXX" #define DOTSUFFIXLEN (sizeof(DOTSUFFIX) - 1) #define CONTAINERDIR S6_LINUX_INIT_TMPFS "/" CONTAINER_RESULTS #define USAGE "s6-linux-init-shutdownd [ -d notif ] [ -c basedir ] [ -g gracetime ] [ -C ] [ -B ]" #define dieusage() strerr_dieusage(100, USAGE) static char const *basedir = BASEDIR ; static int inns = 0 ; static int nologger = 0 ; struct at_s { int fd ; char const *name ; } ; static int renametemp (char const *s, mode_t mode, void *data) { struct at_s *at = data ; (void)mode ; return renameat(at->fd, at->name, at->fd, s) ; } static int mkrenametemp (int fd, char const *src, char *dst) { struct at_s at = { .fd = fd, .name = src } ; return mkfiletemp(dst, &renametemp, 0700, &at) ; } static inline void run_stage3 (char const *basedir) { pid_t pid ; size_t basedirlen = strlen(basedir) ; char stage3[basedirlen + sizeof("/scripts/" STAGE3)] ; char const *stage3_argv[2] = { stage3, 0 } ; memcpy(stage3, basedir, basedirlen) ; memcpy(stage3 + basedirlen, "/scripts/" STAGE3, sizeof("/scripts/" STAGE3)) ; pid = child_spawn0(stage3_argv[0], stage3_argv, (char const *const *)environ) ; if (pid) { int wstat ; if (wait_pid(pid, &wstat) == -1) strerr_diefu1sys(111, "waitpid") ; if (WIFSIGNALED(wstat)) { char fmt[UINT_FMT] ; fmt[uint_fmt(fmt, WTERMSIG(wstat))] = 0 ; strerr_warnw3x(stage3, " was killed by signal ", fmt) ; } else if (WEXITSTATUS(wstat)) { char fmt[UINT_FMT] ; fmt[uint_fmt(fmt, WEXITSTATUS(wstat))] = 0 ; strerr_warnw3x(stage3, " exited ", fmt) ; } } else strerr_warnwu2sys("spawn ", stage3) ; } static inline void prepare_shutdown (buffer *b, tain *deadline, unsigned int *grace_time) { uint32_t u ; char pack[TAIN_PACK + 4] ; ssize_t r = sanitize_read(buffer_get(b, pack, TAIN_PACK + 4)) ; if (r == -1) strerr_diefu1sys(111, "read from pipe") ; if (r < TAIN_PACK + 4) strerr_dief1x(101, "bad shutdown protocol") ; tain_unpack(pack, deadline) ; tain_add_g(deadline, deadline) ; uint32_unpack_big(pack + TAIN_PACK, &u) ; if (u && u <= 300000) *grace_time = u ; } static inline void handle_fifo (buffer *b, char *what, tain *deadline, unsigned int *grace_time) { for (;;) { char c ; ssize_t r = sanitize_read(buffer_get(b, &c, 1)) ; if (r == -1) strerr_diefu1sys(111, "read from pipe") ; else if (!r) break ; switch (c) { case 'S' : case 'h' : case 'p' : case 'r' : *what = c ; prepare_shutdown(b, deadline, grace_time) ; break ; case 'c' : *what = 'S' ; tain_add_g(deadline, &tain_infinite_relative) ; break ; default : { char s[2] = { c, 0 } ; strerr_warnw2x("unknown command: ", s) ; } break ; } } } static void restore_console (void) { fd_close(1) ; if (open2("/dev/console", O_WRONLY) != 1 && open2("/dev/null", O_WRONLY) != 1) strerr_warnwu1sys("open /dev/console for writing") ; else if (fd_copy(2, 1) < 0) strerr_warnwu1sys("fd_copy") ; } static inline void prepare_stage4 (char const *basedir, char what) { buffer b ; int fd ; char buf[512] ; size_t sabase = satmp.len ; if (inns) { char s[2] = { what, '\n' } ; if (mkdir(CONTAINERDIR, 0755) < 0 && errno != EEXIST) strerr_diefu1sys(111, "mkdir " CONTAINERDIR) ; if (!openwritenclose_unsafe(CONTAINERDIR "/haltcode", s, 2)) strerr_diefu1sys(111, "write to " CONTAINERDIR "/haltcode") ; } unlink_void(STAGE4_FILE ".new") ; fd = open_excl(STAGE4_FILE ".new") ; if (fd == -1) strerr_diefu3sys(111, "open ", STAGE4_FILE ".new", " for writing") ; buffer_init(&b, &buffer_write, fd, buf, 512) ; if (inns) { if (buffer_puts(&b, "#!" EXECLINE_SHEBANGPREFIX "execlineb -P\n\n" EXECLINE_EXTBINPREFIX "foreground { " S6_EXTBINPREFIX "s6-svc -Ox -- . }\n" EXECLINE_EXTBINPREFIX "background\n{\n ") < 0 || (!nologger && buffer_puts(&b, EXECLINE_EXTBINPREFIX "foreground { " S6_EXTBINPREFIX "s6-svc -Oxc -- " SCANPREFIX LOGGER_SERVICEDIR " }\n ") < 0) || buffer_putsflush(&b, S6_EXTBINPREFIX "s6-svscanctl -b -- " SCANDIRFULL "\n}\n") < 0) strerr_diefu2sys(111, "write to ", STAGE4_FILE ".new") ; } else { if (buffer_puts(&b, "#!" EXECLINE_SHEBANGPREFIX "execlineb -P\n\n" EXECLINE_EXTBINPREFIX "foreground { " S6_LINUX_INIT_BINPREFIX "s6-linux-init-umountall }\n" EXECLINE_EXTBINPREFIX "foreground { ") < 0 || !string_quote(&satmp, basedir, strlen(basedir)) || buffer_put(&b, satmp.s + sabase, satmp.len - sabase) < 0 || buffer_puts(&b, "/scripts/" STAGE4 " }\n" S6_LINUX_INIT_BINPREFIX "s6-linux-init-hpr -f -") < 0 || buffer_put(&b, &what, 1) < 0 || buffer_putsflush(&b, "\n") < 0) strerr_diefu2sys(111, "write to ", STAGE4_FILE ".new") ; satmp.len = sabase ; } if (fchmod(fd, S_IRWXU) == -1) strerr_diefu2sys(111, "fchmod ", STAGE4_FILE ".new") ; fd_close(fd) ; if (rename(STAGE4_FILE ".new", STAGE4_FILE) == -1) strerr_diefu4sys(111, "rename ", STAGE4_FILE ".new", " to ", STAGE4_FILE) ; } static inline void unsupervise_tree (void) { char const *except[3] = { SHUTDOWND_SERVICEDIR, nologger ? 0 : LOGGER_SERVICEDIR, 0 } ; DIR *dir = opendir(SCANDIRFULL) ; int fdd ; if (!dir) strerr_diefu1sys(111, "opendir " SCANDIRFULL) ; fdd = dirfd(dir) ; if (fdd == -1) strerr_diefu1sys(111, "dir_fd " SCANDIRFULL) ; for (;;) { char const *const *p = except ; direntry *d ; errno = 0 ; d = readdir(dir) ; if (!d) break ; if (d->d_name[0] == '.') continue ; for (; *p ; p++) if (!strcmp(*p, d->d_name)) break ; if (!*p) { size_t dlen = strlen(d->d_name) ; char fn[SCANPREFIXLEN + DOTPREFIXLEN + dlen + DOTSUFFIXLEN + 1] ; memcpy(fn, SCANPREFIX DOTPREFIX, SCANPREFIXLEN + DOTPREFIXLEN) ; memcpy(fn + SCANPREFIXLEN + DOTPREFIXLEN, d->d_name, dlen) ; memcpy(fn + SCANPREFIXLEN + DOTPREFIXLEN + dlen, DOTSUFFIX, DOTSUFFIXLEN + 1) ; if (mkrenametemp(fdd, d->d_name, fn + SCANPREFIXLEN) == -1) { strerr_warnwu4sys("rename " SCANPREFIX, d->d_name, " to something based on ", fn) ; unlinkat(fdd, d->d_name, 0) ; /* if it still fails, too bad, it will restart in stage 4 and race */ } LOLDEBUG("unsupervise_tree: renamed %s to %s", d->d_name, fn) ; s6_svc_writectl(fn, S6_SUPERVISE_CTLDIR, "d", 1) ; } #if DEBUG else LOLDEBUG("unsupervise_tree: found %s, not touching", *p) ; #endif } if (errno) strerr_diefu1sys(111, "readdir " SCANDIRFULL) ; dir_close(dir) ; s6_svc_write(SCANDIRFULL "/" S6_SVSCAN_CTLDIR "/control", "an", 2) ; } int main (int argc, char const *const *argv) { unsigned int grace_time = 3000 ; tain deadline ; int fdr, fdw ; unsigned int notif = 0 ; buffer b ; char what = 'S' ; char buf[64] ; PROG = "s6-linux-init-shutdownd" ; { subgetopt l = SUBGETOPT_ZERO ; for (;;) { int opt = subgetopt_r(argc, argv, "d:c:g:CB", &l) ; if (opt == -1) break ; switch (opt) { case 'd' : if (!uint0_scan(l.arg, ¬if)) dieusage() ; break ; case 'c' : basedir = l.arg ; break ; case 'g' : if (!uint0_scan(l.arg, &grace_time)) dieusage() ; break ; case 'C' : inns = 1 ; break ; case 'B' : nologger = 1 ; break ; default : dieusage() ; } } argc -= l.ind ; argv += l.ind ; } if (basedir[0] != '/') strerr_dief2x(100, "basedir", " must be an absolute path") ; if (notif) { if (notif < 3) strerr_dief1x(100, "notification fd must be 3 or more") ; if (fcntl(notif, F_GETFD) < 0) strerr_dief1sys(100, "invalid notification fd") ; } if (grace_time > 300000) grace_time = 300000 ; /* if we're in stage 4, exec it immediately */ { char const *stage4_argv[2] = { "./" STAGE4_FILE, 0 } ; if (!inns && !nologger) { int fd[2] ; int e ; fd[0] = fcntl(1, F_DUPFD_CLOEXEC, 0) ; if (fd[0] < 0) strerr_diefu2sys(111, "dup std", "out") ; fd[1] = fcntl(2, F_DUPFD_CLOEXEC, 0) ; if (fd[1] < 0) strerr_diefu2sys(111, "dup std", "err") ; restore_console() ; execv(stage4_argv[0], (char **)stage4_argv) ; e = errno ; if (fd_move2(1, fd[0], 2, fd[1]) < 0) strerr_warnwu1sys("restore fds") ; errno = e ; } else execv(stage4_argv[0], (char **)stage4_argv) ; if (errno != ENOENT) strerr_warnwu2sys("exec ", stage4_argv[0]) ; } fdr = openc_read(SHUTDOWND_FIFO) ; if (fdr == -1) strerr_diefu3sys(111, "open ", SHUTDOWND_FIFO, " for reading") ; fdw = openc_write(SHUTDOWND_FIFO) ; if (fdw == -1) strerr_diefu3sys(111, "open ", SHUTDOWND_FIFO, " for writing") ; if (!sig_altignore(SIGPIPE)) strerr_diefu1sys(111, "ignore SIGPIPE") ; buffer_init(&b, &buffer_read, fdr, buf, 64) ; tain_now_set_stopwatch_g() ; tain_add_g(&deadline, &tain_infinite_relative) ; if (notif) { write(notif, "\n", 1) ; close(notif) ; notif = 0 ; } for (;;) { iopause_fd x = { .fd = fdr, .events = IOPAUSE_READ } ; int r = iopause_g(&x, 1, &deadline) ; if (r == -1) strerr_diefu1sys(111, "iopause") ; if (!r) { LOLDEBUG("run_stage3: starting") ; run_stage3(basedir) ; LOLDEBUG("run_stage3: done") ; tain_now_g() ; if (what != 'S') break ; tain_add_g(&deadline, &tain_infinite_relative) ; continue ; } if (x.revents & IOPAUSE_READ) handle_fifo(&b, &what, &deadline, &grace_time) ; } fd_close(fdw) ; fd_close(fdr) ; if (!inns && !nologger) restore_console() ; /* The end is coming! */ prepare_stage4(basedir, what) ; LOLDEBUG("unsupervise_tree: starting") ; unsupervise_tree() ; LOLDEBUG("unsupervise_tree: done") ; if (!sig_ignore(SIGTERM)) strerr_warnwu1sys("ignore SIGTERM") ; if (!inns) { sync() ; strerr_warni1x("sending all processes the TERM signal...") ; } LOLDEBUG("sending SIGTERM and SIGCONT") ; kill(-1, SIGTERM) ; kill(-1, SIGCONT) ; tain_from_millisecs(&deadline, grace_time) ; tain_now_g() ; tain_add_g(&deadline, &deadline) ; deepsleepuntil_g(&deadline) ; if (!inns) { sync() ; strerr_warni1x("sending all processes the KILL signal...") ; } LOLDEBUG("sending SIGKILL") ; kill(-1, SIGKILL) ; return 0 ; }