-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathc_aot_compile.h
523 lines (442 loc) · 16.5 KB
/
c_aot_compile.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
#pragma once
/**
* ahead of time compilation using c compiler. c source is compiled, then loaded
*/
#include <dlfcn.h>
#include <fcntl.h>
#include <string.h>
#include <stdbool.h>
#include <stdio.h>
#include <stdlib.h>
#include <sys/mman.h>
#include <sys/wait.h>
#include <unistd.h>
#include <errno.h>
#include <string.h>
#include <stdarg.h>
// ================================= error handling =====================================
// this is a super basic and dead simple string manipulation lib, for use by the aot lib's error messages
// malloc formatted string
static char* c_aot_err_printf_owned(const char* format, ...) {
va_list args;
va_start(args, format);
int size = vsnprintf(NULL, 0, format, args);
va_end(args);
if (size < 0) {
return NULL;
}
size += 1; // for null char
char* ret = malloc(size * sizeof(char));
if (!ret) {
return NULL;
}
va_start(args, format);
vsnprintf(ret, size, format, args);
va_end(args);
return ret;
}
// concatenate two strings.
// args:
// - are owned (malloc)
// - can be NULL (treated as empty)
// - will be freed by this function
//
// return value:
// - can be NULL
// - is owned (malloc)
static char* c_aot_err_strcat(char* first, char* second) {
const char* first_used = first ? first : "";
const char* second_used = second ? second : "";
size_t next_size = strlen(first_used) + strlen(second_used) + 1; // +1 for terminator
char* ret = malloc(next_size * sizeof(char));
if (ret) {
char* ret_walk = ret;
while (*first_used != '\0') {
*ret_walk++ = *first_used++;
}
while (*second_used != '\0') {
*ret_walk++ = *second_used++;
}
*ret_walk++ = '\0';
}
free(first);
free(second);
return ret;
}
// perror_arg is a string literal, just like the arg to perror
//
// error_msg_so_far arg:
// - is owned (malloc)
// - can be NULL (treated as empty)
// - will be freed by this function
static char* c_aot_err_strcat_perror(char* error_msg_so_far, const char* perror_arg) {
char* formatted = c_aot_err_printf_owned("%s: %s\n", perror_arg, strerror(errno));
char* ret = c_aot_err_strcat(error_msg_so_far, formatted);
return ret;
}
// appends data with length to the error message. if null bytes are
// contained in the data, then it will appear to terminate early
//
// error_msg_so_far arg:
// - is owned (malloc)
// - can be NULL (treated as empty)
// - will be freed by this function
//
// data is NOT owned and will point to num_elements bytes
static char* c_aot_err_strcat_len(char* error_msg_so_far, const char* data, size_t num_elements) {
char* msg_used = error_msg_so_far ? error_msg_so_far : "";
char* ret = malloc((strlen(msg_used) + num_elements + 1) * sizeof(char));
if (ret) {
char* ret_walk = ret;
while (*msg_used != '\0') {
*ret_walk++ = *msg_used++;
}
for (size_t i = 0; i < num_elements; ++i) {
*ret_walk++ = data[i];
}
*ret_walk++ = '\0';
}
free(error_msg_so_far);
return ret;
}
// ================================== c aot result type ==========================
enum c_aot_compile_result_type {
C_AOT_COMPILE_OK,
C_AOT_COMPILE_ERR,
};
union c_aot_compile_result_value {
// only if C_AOT_COMPILE_OK.
// OWNED, must be freed with dlclose
// never NULL
void* dl_handle;
// only if C_AOT_COMPILE_ERR.
// OWNED, must be freed with free.
// never NULL
char* error_msg;
};
// variant type. either err with error message, or ok with handle
struct c_aot_compile_result {
enum c_aot_compile_result_type type;
union c_aot_compile_result_value value;
};
// ================================== c aot result type wrapper of string manipulation functions ==========================
// checks if OK value is contained. destroys it.
//
// returns OWNED error message (NULL on no error)
static char* c_aot_compile_result_convert_to_err(struct c_aot_compile_result* ret) {
if (ret->type != C_AOT_COMPILE_OK) {
// already contains error. nothing to do
return NULL;
}
void* dl_handle_to_destroy = ret->value.dl_handle;
ret->value.dl_handle = NULL;
ret->type = C_AOT_COMPILE_ERR;
ret->value.error_msg = NULL; // intentionally redundant (ptr union already set)
if (dl_handle_to_destroy == NULL) {
// ok value was contained, but it wasn't set yet. nothing more to do
return NULL;
}
// do destruction of previously contained ok value
if (dlclose(dl_handle_to_destroy) == 0) {
return NULL; // no err
}
char* reason = dlerror();
char* reason_msg;
if (reason) {
reason_msg = c_aot_err_printf_owned("dlclose: %s\n", reason);
} else {
// make owned on either branch
reason_msg = strdup("dlclose failed for an unknown reason\n");
}
return reason_msg;
}
static void c_aot_compile_result_append_error(struct c_aot_compile_result* ret, char* msg) {
char* destroy_error = c_aot_compile_result_convert_to_err(ret);
ret->value.error_msg = c_aot_err_strcat(ret->value.error_msg, msg);
ret->value.error_msg = c_aot_err_strcat(ret->value.error_msg, destroy_error);
}
static void c_aot_compile_result_append_error_perror(struct c_aot_compile_result* ret, const char* perror_arg) {
char* destroy_error = c_aot_compile_result_convert_to_err(ret);
ret->value.error_msg = c_aot_err_strcat_perror(ret->value.error_msg, perror_arg);
ret->value.error_msg = c_aot_err_strcat(ret->value.error_msg, destroy_error);
}
static void c_aot_compile_result_append_error_len(struct c_aot_compile_result* ret, const char* data, size_t num_elements) {
char* destroy_error = c_aot_compile_result_convert_to_err(ret);
ret->value.error_msg = c_aot_err_strcat_len(ret->value.error_msg, data, num_elements);
ret->value.error_msg = c_aot_err_strcat(ret->value.error_msg, destroy_error);
}
// ==========================================================================================================
// compiler_args is a null terminating list of cstr args which are passed to the
// compiler. some args are already specified; compiler_args is appended to
// existing args.
struct c_aot_compile_result c_aot_compile(const char* c_compiler, const char* program_begin, const char* program_end, const char* const* compiler_args) {
int stdin_pipe[2] = {-1, -1};
int stderr_pipe[2] = {-1, -1};
// a memory file must be used here instead of a pipe, as otherwise this causes
// gcc output to fail (/usr/bin/ld: final link failed: Illegal seek)
int code_fd = -1;
struct c_aot_compile_result ret;
ret.type = C_AOT_COMPILE_OK;
ret.value.dl_handle = NULL;
pid_t pid;
if (pipe(stdin_pipe) == -1) {
c_aot_compile_result_append_error_perror(&ret, "pipe");
goto end;
}
if (pipe(stderr_pipe) == -1) {
c_aot_compile_result_append_error_perror(&ret, "pipe");
goto end;
}
code_fd = memfd_create("dynamic_compiled_shared_library", 0);
if (code_fd == -1) {
c_aot_compile_result_append_error_perror(&ret, "memfd_create");
goto end;
}
char compile_output_file[32];
{
int printf_result = snprintf(compile_output_file, //
sizeof(compile_output_file), "/dev/fd/%d", code_fd);
if (printf_result < 0 || (unsigned long)printf_result >= sizeof(compile_output_file)) {
c_aot_compile_result_append_error(&ret, strdup("format error\n"));
goto end;
}
}
pid = fork();
if (pid < 0) {
c_aot_compile_result_append_error_perror(&ret, "fork");
goto end;
}
if (pid == 0) {
// child process
if (dup2(stdin_pipe[0], STDIN_FILENO) == -1 || //
dup2(stderr_pipe[1], STDERR_FILENO) == -1) {
perror("dup2 failed before compiler started");
exit(EXIT_FAILURE); // in child process - exit now
}
int dev_null = open("/dev/null", O_WRONLY);
if (dev_null == -1) {
perror("open failed before compiler started");
exit(EXIT_FAILURE); // in child process - exit now
}
if (dup2(dev_null, STDOUT_FILENO) == -1) {
perror("dup2 failed before compiler started");
exit(EXIT_FAILURE); // in child process - exit now
}
if (close(stdin_pipe[1]) == -1) {
// must close stdin writer or else it will keep child process alive
// as it waits for input
perror("close failed before compiler started");
exit(EXIT_FAILURE); // in child process - exit now
}
char compile_output_file_arg[34];
{
int printf_result = snprintf(compile_output_file_arg, //
sizeof(compile_output_file_arg), "-o%s", compile_output_file);
if (printf_result < 0 || (unsigned long)printf_result >= sizeof(compile_output_file_arg)) {
fputs("format error before compiler started", stderr);
exit(EXIT_FAILURE); // in child process - exit now
}
}
size_t num_extra_args = 0;
while (compiler_args[num_extra_args] != 0) {
++num_extra_args;
}
// copy required since args are non const
char* args[9 + num_extra_args];
// first arg always is self
const char* arg0_const = c_compiler;
size_t arg0_size = strlen(arg0_const) + 1;
char arg0[arg0_size];
memcpy(arg0, arg0_const, arg0_size);
args[0] = arg0;
// don't use temp files during compilation; pipes instead
const char* arg1_const = "-pipe";
size_t arg1_size = strlen(arg1_const) + 1;
char arg1[arg1_size];
memcpy(arg1, arg1_const, arg1_size);
args[1] = arg1;
// shouldn't be needed, but just to be safe. the code shouldn't be
// moved from the memory file after it is written.
const char* arg2_const = "-fPIC";
size_t arg2_size = strlen(arg2_const) + 1;
char arg2[arg2_size];
memcpy(arg2, arg2_const, arg2_size);
args[2] = arg2;
const char* arg3_const = "-shared"; // shared object (resolve symbols)
size_t arg3_size = strlen(arg3_const) + 1;
char arg3[arg3_size];
memcpy(arg3, arg3_const, arg3_size);
args[3] = arg3;
const char* arg4_const = "-O2"; // optimize a good amount (priority is for fast runtime)
size_t arg4_size = strlen(arg4_const) + 1;
char arg4[arg4_size];
memcpy(arg4, arg4_const, arg4_size);
args[4] = arg4;
const char* arg5_const = "-xc"; // stdin contains c language
size_t arg5_size = strlen(arg5_const) + 1;
char arg5[arg5_size];
memcpy(arg5, arg5_const, arg5_size);
args[5] = arg5;
args[6] = compile_output_file_arg; // write compiled shared object to memory file
const char* arg7_const = "-"; // no further files to compile will be specified. only stdin
size_t arg7_size = strlen(arg7_const) + 1;
char arg7[arg7_size];
memcpy(arg7, arg7_const, arg7_size);
args[7] = arg7;
size_t extra_args_arena_size = 0;
for (size_t i = 0; i < num_extra_args; ++i) {
extra_args_arena_size += strlen(compiler_args[i]) + 1;
}
char extra_args_arena[extra_args_arena_size];
{
char* extra_args_arena_walk = extra_args_arena;
for (size_t i = 0; i < num_extra_args; ++i) {
const char* the_arg = compiler_args[i];
args[8 + i] = extra_args_arena_walk;
while (1) {
char ch = *the_arg++;
bool complete = ch == '\0';
*extra_args_arena_walk++ = ch; // includes null
if (complete) break;
}
}
}
args[sizeof(args) / sizeof(*args) - 1] = (char*)NULL; // execl args are null terminating
// pass ENV vars. append TMPDIR so gcc, clang won't use disk for temp files
size_t env_count = 0;
extern char **environ;
while (environ[env_count] != 0) {
++env_count;
}
env_count += 2; // +1 for new var, +1 for NULL
char* env[env_count];
for (size_t i = 0; i < env_count - 2; ++i) {
env[i] = environ[i];
}
// copy required since env non const
const char* env_to_add_const = "TMPDIR=/dev/shm";
size_t env_to_add_size = strlen(env_to_add_const) + 1;
char env_to_add[env_to_add_size];
memcpy(env_to_add, env_to_add_const, env_to_add_size);
env[env_count - 2] = env_to_add; // place it last (highest precedence)
env[env_count - 1] = (char*)NULL; // env null terminating
execvpe(c_compiler, args, env);
perror("execl failed before compiler started"); // only reached on error
exit(EXIT_FAILURE); // in child process - exit now
// all other fds will be closed by OS on child process exit.
// this is required by the code_pipe (can't be closed before execl)
}
// parent process
// write then close the input
if (write(stdin_pipe[1], program_begin, program_end - program_begin) == -1) {
c_aot_compile_result_append_error_perror(&ret, "write");
goto end;
}
// must close stdin writer or else it will keep child process alive as it
// waits for input
{
int close_result = close(stdin_pipe[1]);
stdin_pipe[1] = -1;
if (close_result == -1) {
c_aot_compile_result_append_error_perror(&ret, "close");
goto end;
}
}
// must close output streams here, or else it will keep the parent
// blocking on read as it waits for the input from child to end
{
int close_result = close(stderr_pipe[1]);
stderr_pipe[1] = -1;
if (close_result == -1) {
c_aot_compile_result_append_error_perror(&ret, "close");
goto end;
}
}
{
// the compiler might be producing stderr.
// something must be reading it, or else the stderr write will block if the compiler's error is very large.
// reading will always occur, but only if there is a failure exit status then it will be displayed.
// only n bytes will be read, and the reset is discarded (constant space)
const size_t COMPILER_STDERR_BUF_CAPACITY = 500;
size_t compiler_stderr_size = 0;
char compiler_stderr_buf[COMPILER_STDERR_BUF_CAPACITY];
bool compiler_stderr_was_truncated = false;
while (compiler_stderr_size != COMPILER_STDERR_BUF_CAPACITY) {
size_t read_ret = read(stderr_pipe[0], compiler_stderr_buf + compiler_stderr_size, COMPILER_STDERR_BUF_CAPACITY - compiler_stderr_size);
if (read_ret < 0) {
c_aot_compile_result_append_error_perror(&ret, "reading compiler's stderr");
goto end;
}
if (read_ret == 0) {
goto after_discard_compiler_stderr;
}
compiler_stderr_size += read_ret;
}
// the stderr buffer is full, discard any remaining
while (1) {
char discard[1024];
size_t read_ret = read(stderr_pipe[0], discard, sizeof(discard) / sizeof(char));
if (read_ret < 0) {
c_aot_compile_result_append_error_perror(&ret, "reading compiler's stderr");
goto end;
}
if (read_ret == 0) {
break;
}
// if this point is reached, then some amount of bytes has been discarded
compiler_stderr_was_truncated = true;
}
after_discard_compiler_stderr:
int child_return_status;
if (waitpid(pid, &child_return_status, 0) == -1) {
c_aot_compile_result_append_error_perror(&ret, "waitpid");
goto end;
}
if (WIFEXITED(child_return_status)) {
child_return_status = WEXITSTATUS(child_return_status);
}
if (child_return_status != 0) {
char* formatted_str = c_aot_err_printf_owned("child process for compiler \"%s\" exited with code %d. stderr:\n", c_compiler, child_return_status);
c_aot_compile_result_append_error(&ret, formatted_str);
c_aot_compile_result_append_error_len(&ret, compiler_stderr_buf, compiler_stderr_size);
if (compiler_stderr_was_truncated) {
char* truncate_msg_formatted = c_aot_err_printf_owned("\n... stderr from \"%s\" was truncated\n", c_compiler);
c_aot_compile_result_append_error(&ret, truncate_msg_formatted);
}
goto end;
}
}
{
void* handle = dlopen(compile_output_file, RTLD_NOW);
if (handle == NULL) {
char* reason = dlerror();
char* fmt_err;
if (reason) {
fmt_err = c_aot_err_printf_owned("dlopen: %s\n", reason);
} else {
fmt_err = strdup("dlopen failed for an unknown reason");
}
c_aot_compile_result_append_error(&ret, fmt_err);
goto end;
}
if (ret.type == C_AOT_COMPILE_OK) {
ret.value.dl_handle = handle;
}
}
end:
int close_errored = 0;
if (stdin_pipe[0] != -1) close_errored |= close(stdin_pipe[0]);
if (stdin_pipe[1] != -1) close_errored |= close(stdin_pipe[1]);
if (stderr_pipe[0] != -1) close_errored |= close(stderr_pipe[0]);
if (stderr_pipe[1] != -1) close_errored |= close(stderr_pipe[1]);
if (code_fd != -1) close_errored |= close(code_fd);
if (close_errored) {
c_aot_compile_result_append_error_perror(&ret, "close");
}
return ret;
}
// overload for compile
struct c_aot_compile_result c_aot_compile_no_args(const char* c_compiler, const char* program_begin, const char* program_end) {
const char* compiler_args = NULL;
return c_aot_compile(c_compiler, program_begin, program_end, &compiler_args);
}