-
Notifications
You must be signed in to change notification settings - Fork 127
/
ctr_exit.c
223 lines (190 loc) · 5.37 KB
/
ctr_exit.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
#define _GNU_SOURCE
#include "ctr_exit.h"
#include "cli.h" // opt_exit_command, opt_exit_delay
#include "utils.h"
#include "parent_pipe_fd.h"
#include "globals.h"
#include "ctr_logging.h"
#include "close_fds.h"
#include <errno.h>
#include <glib.h>
#include <glib-unix.h>
#include <signal.h>
#include <stdlib.h>
#include <sys/prctl.h>
#include <unistd.h>
volatile pid_t container_pid = -1;
volatile pid_t create_pid = -1;
void on_sigchld(G_GNUC_UNUSED int signal)
{
raise(SIGUSR1);
}
void on_sig_exit(int signal)
{
if (container_pid > 0) {
if (kill(container_pid, signal) == 0)
return;
} else if (create_pid > 0) {
if (kill(create_pid, signal) == 0)
return;
if (errno == ESRCH) {
/* The create_pid process might have exited, so try container_pid again. */
if (container_pid > 0 && kill(container_pid, signal) == 0)
return;
}
}
/* Just force a check if we get here. */
raise(SIGUSR1);
}
static void check_child_processes(GHashTable *pid_to_handler, GHashTable *cache)
{
for (;;) {
int status;
pid_t pid = waitpid(-1, &status, WNOHANG);
if (pid < 0 && errno == EINTR)
continue;
if (pid < 0 && errno == ECHILD) {
g_main_loop_quit(main_loop);
return;
}
if (pid < 0)
pexit("Failed to read child process status");
if (pid == 0)
return;
/* If we got here, pid > 0, so we have a valid pid to check. */
void (*cb)(GPid, int, gpointer) = g_hash_table_lookup(pid_to_handler, &pid);
if (cb) {
cb(pid, status, 0);
} else if (cache) {
pid_t *k = g_malloc(sizeof(pid_t));
int *v = g_malloc(sizeof(int));
if (k == NULL || v == NULL)
pexit("Failed to allocate memory");
*k = pid;
*v = status;
g_hash_table_insert(cache, k, v);
}
}
}
gboolean check_child_processes_cb(gpointer user_data)
{
struct pid_check_data *data = (struct pid_check_data *)user_data;
check_child_processes(data->pid_to_handler, data->exit_status_cache);
return G_SOURCE_REMOVE;
}
gboolean on_sigusr1_cb(gpointer user_data)
{
struct pid_check_data *data = (struct pid_check_data *)user_data;
check_child_processes(data->pid_to_handler, data->exit_status_cache);
return G_SOURCE_CONTINUE;
}
gboolean timeout_cb(G_GNUC_UNUSED gpointer user_data)
{
timed_out = TRUE;
ninfo("Timed out, killing main loop");
g_main_loop_quit(main_loop);
return G_SOURCE_REMOVE;
}
int get_exit_status(int status)
{
if (WIFEXITED(status))
return WEXITSTATUS(status);
if (WIFSIGNALED(status))
return 128 + WTERMSIG(status);
return -1;
}
void runtime_exit_cb(G_GNUC_UNUSED GPid pid, int status, G_GNUC_UNUSED gpointer user_data)
{
runtime_status = status;
create_pid = -1;
g_main_loop_quit(main_loop);
}
void container_exit_cb(G_GNUC_UNUSED GPid pid, int status, G_GNUC_UNUSED gpointer user_data)
{
if (get_exit_status(status) != 0) {
ninfof("container %d exited with status %d", pid, get_exit_status(status));
}
container_status = status;
container_pid = -1;
/* In the case of a quickly exiting exec command, the container exit callback
sometimes gets called earlier than the pid exit callback. If we quit the loop at that point
we risk falsely telling the caller of conmon the runtime call failed (because runtime status
wouldn't be set). Instead, don't quit the loop until runtime exit is also called, which should
shortly after. */
if (opt_api_version >= 1 && create_pid > 0 && opt_exec && opt_terminal) {
ndebugf("container pid return handled before runtime pid return. Not quitting yet.");
return;
}
g_main_loop_quit(main_loop);
}
void do_exit_command()
{
if (signal(SIGCHLD, SIG_DFL) == SIG_ERR) {
_pexit("Failed to reset signal for SIGCHLD");
}
/*
* Close everything except stdin, stdout and stderr.
*/
close_all_fds_ge_than(3);
/*
* We don't want the exit command to be reaped by the parent conmon
* as that would prevent double-fork from doing its job.
* Unfortunately, that also means that any new subchildren from
* still running processes could also get lost
*/
if (prctl(PR_SET_CHILD_SUBREAPER, 0) != 0) {
nwarn("Failed to disable self subreaper attribute - might wait for indirect children a long time");
}
pid_t exit_pid = fork();
if (exit_pid < 0) {
_pexit("Failed to fork");
}
if (exit_pid) {
int ret, exit_status = 0;
/*
* Make sure to cleanup any zombie process that the container runtime
* could have left around.
*/
do {
int tmp;
exit_status = 0;
ret = waitpid(-1, &tmp, 0);
if (ret == exit_pid)
exit_status = get_exit_status(tmp);
} while ((ret < 0 && errno == EINTR) || ret > 0);
if (exit_status)
_exit(exit_status);
return;
}
/* Count the additional args, if any. */
size_t n_args = 0;
if (opt_exit_args)
for (; opt_exit_args[n_args]; n_args++)
;
gchar **args = malloc(sizeof(gchar *) * (n_args + 2));
if (args == NULL)
_exit(EXIT_FAILURE);
args[0] = opt_exit_command;
if (opt_exit_args)
for (n_args = 0; opt_exit_args[n_args]; n_args++)
args[n_args + 1] = opt_exit_args[n_args];
args[n_args + 1] = NULL;
if (opt_exit_delay) {
ndebugf("Sleeping for %d seconds before executing exit command", opt_exit_delay);
sleep(opt_exit_delay);
}
execv(opt_exit_command, args);
/* Should not happen, but better be safe. */
_exit(EXIT_FAILURE);
}
void reap_children()
{
/* We need to reap any zombies (from an OCI runtime that errored) before
exiting */
while (waitpid(-1, NULL, WNOHANG) > 0)
;
}
void handle_signal(G_GNUC_UNUSED const int signum)
{
exit(EXIT_FAILURE);
}