diff options
Diffstat (limited to 'src/kmk/kmkbuiltin.c')
-rw-r--r-- | src/kmk/kmkbuiltin.c | 507 |
1 files changed, 507 insertions, 0 deletions
diff --git a/src/kmk/kmkbuiltin.c b/src/kmk/kmkbuiltin.c new file mode 100644 index 0000000..8f00e98 --- /dev/null +++ b/src/kmk/kmkbuiltin.c @@ -0,0 +1,507 @@ +/* $Id: kmkbuiltin.c 3389 2020-06-26 17:16:26Z bird $ */ +/** @file + * kMk Builtin command execution. + */ + +/* + * Copyright (c) 2005-2018 knut st. osmundsen <bird-kBuild-spamx@anduin.net> + * + * This file is part of kBuild. + * + * kBuild is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation; either version 3 of the License, or + * (at your option) any later version. + * + * kBuild is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with kBuild. If not, see <http://www.gnu.org/licenses/> + * + */ + + +/********************************************************************************************************************************* +* Header Files * +*********************************************************************************************************************************/ +#include <string.h> +#include <stdlib.h> +#include <stdio.h> +#include <ctype.h> +#include <assert.h> +#include <sys/stat.h> +#ifdef _MSC_VER +# include <io.h> +#endif + +#include "makeint.h" +#include "job.h" +#include "variable.h" +#if defined(KBUILD_OS_WINDOWS) && defined(CONFIG_NEW_WIN_CHILDREN) +# include "w32/winchildren.h" +#endif +#include "kmkbuiltin/err.h" +#include "kmkbuiltin.h" + +#ifndef _MSC_VER +extern char **environ; +#endif + + +/********************************************************************************************************************************* +* Global Variables * +*********************************************************************************************************************************/ +#ifdef CONFIG_WITH_KMK_BUILTIN_STATS +extern int print_stats_flag; +#endif + + + +int kmk_builtin_command(const char *pszCmd, struct child *pChild, char ***ppapszArgvToSpawn, pid_t *pPidSpawned) +{ + int argc; + char **argv; + int rc; + char *pszzCmd; + char *pszDst; + int fOldStyle = 0; + + /* + * Check and skip the prefix. + */ + if (strncmp(pszCmd, "kmk_builtin_", sizeof("kmk_builtin_") - 1)) + { + fprintf(stderr, "kmk_builtin: Invalid command prefix '%s'!\n", pszCmd); + return 1; + } + + /* + * Parse arguments. + */ + rc = 0; + argc = 0; + argv = NULL; + pszzCmd = pszDst = (char *)strdup(pszCmd); + if (!pszDst) + { + fprintf(stderr, "kmk_builtin: out of memory. argc=%d\n", argc); + return 1; + } + do + { + const char * const pszSrcStart = pszCmd; + char ch; + char chQuote; + + /* + * Start new argument. + */ + if (!(argc % 16)) + { + void *pv = realloc(argv, sizeof(char *) * (argc + 17)); + if (!pv) + { + fprintf(stderr, "kmk_builtin: out of memory. argc=%d\n", argc); + rc = 1; + break; + } + argv = (char **)pv; + } + argv[argc++] = pszDst; + argv[argc] = NULL; + + if (!fOldStyle) + { + /* + * Process the next argument, bourne style. + */ + chQuote = 0; + ch = *pszCmd++; + do + { + /* Unquoted mode? */ + if (chQuote == 0) + { + if (ch != '\'' && ch != '"') + { + if (!isspace(ch)) + { + if (ch != '\\') + *pszDst++ = ch; + else + { + ch = *pszCmd++; + if (ch == '\n') /* escaped end-of-line */ + break; + if (ch == '\r' && *pszCmd == '\n') /* escaped end-of-line */ + { + pszCmd++; + break; + } + if (ch) + *pszDst++ = ch; + else + { + fprintf(stderr, "kmk_builtin: Incomplete escape sequence in argument %d: %s\n", + argc, pszSrcStart); + rc = 1; + break; + } + } + } + else + break; + } + else + chQuote = ch; + } + /* Quoted mode */ + else if (ch != chQuote) + { + if ( ch != '\\' + || chQuote == '\'') + *pszDst++ = ch; + else + { + ch = *pszCmd++; + if (ch) + { + if ( ch != '\\' + && ch != '"' + && ch != '`' + && ch != '$' + && ch != '\n') + *pszDst++ = '\\'; + *pszDst++ = ch; + } + else + { + fprintf(stderr, "kmk_builtin: Unbalanced quote in argument %d: %s\n", argc, pszSrcStart); + rc = 1; + break; + } + } + } + else + chQuote = 0; + } while ((ch = *pszCmd++) != '\0'); + } + else + { + /* + * Old style in case we ever need it. + */ + ch = *pszCmd++; + if (ch != '"' && ch != '\'') + { + do + *pszDst++ = ch; + while ((ch = *pszCmd++) != '\0' && !isspace(ch)); + } + else + { + chQuote = ch; + for (;;) + { + char *pszEnd = strchr(pszCmd, chQuote); + if (pszEnd) + { + fprintf(stderr, "kmk_builtin: Unbalanced quote in argument %d: %s\n", argc, pszSrcStart); + rc = 1; + break; + } + memcpy(pszDst, pszCmd, pszEnd - pszCmd); + pszDst += pszEnd - pszCmd; + if (pszEnd[1] != chQuote) + break; + *pszDst++ = chQuote; + } + } + } + *pszDst++ = '\0'; + + /* + * Skip argument separators (IFS=space() for now). Check for EOS. + */ + if (ch != 0) + while ( (ch = *pszCmd) + && ( isspace(ch) + || (ch == '\\' && (pszCmd[1] == '\n' || (pszCmd[1] == '\r' && pszCmd[2] == '\n'))))) + pszCmd++; + if (ch == 0) + break; + } while (rc == 0); + + /* + * Execute the command if parsing was successful. + */ + if (rc == 0) + rc = kmk_builtin_command_parsed(argc, argv, pChild, ppapszArgvToSpawn, pPidSpawned); + + /* clean up and return. */ + free(argv); + free(pszzCmd); + return rc; +} + + +/** + * kmk built command. + */ +static const KMKBUILTINENTRY g_aBuiltIns[] = +{ +#define BUILTIN_ENTRY(a_fn, a_sz, a_uFnSignature, fMtSafe, fNeedEnv) \ + { { { sizeof(a_sz) - 1, a_sz, } }, { (uintptr_t)a_fn }, a_uFnSignature, fMtSafe, fNeedEnv } + + /* More frequently used commands: */ + BUILTIN_ENTRY(kmk_builtin_append, "append", FN_SIG_MAIN_SPAWNS, 0, 0), + BUILTIN_ENTRY(kmk_builtin_printf, "printf", FN_SIG_MAIN, 0, 0), + BUILTIN_ENTRY(kmk_builtin_echo, "echo", FN_SIG_MAIN, 0, 0), + BUILTIN_ENTRY(kmk_builtin_install, "install", FN_SIG_MAIN, 1, 0), + BUILTIN_ENTRY(kmk_builtin_kDepObj, "kDepObj", FN_SIG_MAIN, 1, 0), +#ifdef KBUILD_OS_WINDOWS + BUILTIN_ENTRY(kmk_builtin_kSubmit, "kSubmit", FN_SIG_MAIN_SPAWNS, 0, 1), + BUILTIN_ENTRY(kmk_builtin_kill, "kill", FN_SIG_MAIN, 0, 0), +#endif + BUILTIN_ENTRY(kmk_builtin_mkdir, "mkdir", FN_SIG_MAIN, 0, 0), + BUILTIN_ENTRY(kmk_builtin_mv, "mv", FN_SIG_MAIN, 0, 0), + BUILTIN_ENTRY(kmk_builtin_redirect, "redirect", FN_SIG_MAIN_SPAWNS, 1, 1), + BUILTIN_ENTRY(kmk_builtin_rm, "rm", FN_SIG_MAIN, 1, 1), + BUILTIN_ENTRY(kmk_builtin_rmdir, "rmdir", FN_SIG_MAIN, 0, 0), + BUILTIN_ENTRY(kmk_builtin_test, "test", FN_SIG_MAIN_TO_SPAWN, 0, 0), + /* Less frequently used commands: */ + BUILTIN_ENTRY(kmk_builtin_kDepIDB, "kDepIDB", FN_SIG_MAIN, 0, 0), + BUILTIN_ENTRY(kmk_builtin_chmod, "chmod", FN_SIG_MAIN, 0, 0), + BUILTIN_ENTRY(kmk_builtin_cp, "cp", FN_SIG_MAIN, 1, 1), + BUILTIN_ENTRY(kmk_builtin_expr, "expr", FN_SIG_MAIN, 0, 0), + BUILTIN_ENTRY(kmk_builtin_ln, "ln", FN_SIG_MAIN, 0, 0), + BUILTIN_ENTRY(kmk_builtin_md5sum, "md5sum", FN_SIG_MAIN, 1, 0), + BUILTIN_ENTRY(kmk_builtin_cmp, "cmp", FN_SIG_MAIN, 0, 0), + BUILTIN_ENTRY(kmk_builtin_cat, "cat", FN_SIG_MAIN, 0, 0), + BUILTIN_ENTRY(kmk_builtin_touch, "touch", FN_SIG_MAIN, 0, 0), + BUILTIN_ENTRY(kmk_builtin_sleep, "sleep", FN_SIG_MAIN, 1, 0), + BUILTIN_ENTRY(kmk_builtin_dircache, "dircache", FN_SIG_MAIN, 0, 0), +}; + +#ifdef CONFIG_WITH_KMK_BUILTIN_STATS +/** Statistics running in parallel to g_aBuiltIns. */ +struct +{ + big_int cNs; + unsigned cTimes; + unsigned cAsyncTimes; +} g_aBuiltInStats[sizeof(g_aBuiltIns) / sizeof(g_aBuiltIns[0])]; +#endif + + +int kmk_builtin_command_parsed(int argc, char **argv, struct child *pChild, char ***ppapszArgvToSpawn, pid_t *pPidSpawned) +{ + /* + * Check and skip the prefix. + */ + static const char s_szPrefix[] = "kmk_builtin_"; + const char *pszCmd = argv[0]; + if (strncmp(pszCmd, s_szPrefix, sizeof(s_szPrefix) - 1) == 0) + { + struct KMKBUILTINENTRY const *pEntry; + size_t cchAndStart; +#if K_ENDIAN == K_ENDIAN_BIG + size_t cch; +#endif + int cLeft; + + pszCmd += sizeof(s_szPrefix) - 1; + + /* + * Calc the length and start word to avoid calling memcmp/strcmp on each entry. + */ +#if K_ARCH_BITS != 64 && K_ARCH_BITS != 32 +# error "PORT ME!" +#endif + cchAndStart = strlen(pszCmd); +#if K_ENDIAN == K_ENDIAN_BIG + cch = cchAndStart; + cchAndStart <<= K_ARCH_BITS - 8; + switch (cch) + { + default: /* fall thru */ +# if K_ARCH_BITS >= 64 + case 7: cchAndStart |= (size_t)pszCmd[6]; /* fall thru */ + case 6: cchAndStart |= (size_t)pszCmd[5] << (K_ARCH_BITS - 56); /* fall thru */ + case 5: cchAndStart |= (size_t)pszCmd[4] << (K_ARCH_BITS - 48); /* fall thru */ + case 4: cchAndStart |= (size_t)pszCmd[3] << (K_ARCH_BITS - 40); /* fall thru */ +# endif + /* fall thru - gcc 8.2.0 is confused by # endif */ + case 3: cchAndStart |= (size_t)pszCmd[2] << (K_ARCH_BITS - 32); /* fall thru */ + case 2: cchAndStart |= (size_t)pszCmd[1] << (K_ARCH_BITS - 24); /* fall thru */ + case 1: cchAndStart |= (size_t)pszCmd[0] << (K_ARCH_BITS - 16); /* fall thru */ + case 0: break; + } +#else + switch (cchAndStart) + { + default: /* fall thru */ +# if K_ARCH_BITS >= 64 + case 7: cchAndStart |= (size_t)pszCmd[6] << 56; /* fall thru */ + case 6: cchAndStart |= (size_t)pszCmd[5] << 48; /* fall thru */ + case 5: cchAndStart |= (size_t)pszCmd[4] << 40; /* fall thru */ + case 4: cchAndStart |= (size_t)pszCmd[3] << 32; /* fall thru */ +# endif + /* fall thru - gcc 8.2.0 is confused by # endif */ + case 3: cchAndStart |= (size_t)pszCmd[2] << 24; /* fall thru */ + case 2: cchAndStart |= (size_t)pszCmd[1] << 16; /* fall thru */ + case 1: cchAndStart |= (size_t)pszCmd[0] << 8; /* fall thru */ + case 0: break; + } +#endif + + /* + * Look up the builtin command in the table. + */ + pEntry = &g_aBuiltIns[0]; + cLeft = sizeof(g_aBuiltIns) / sizeof(g_aBuiltIns[0]); + while (cLeft-- > 0) + if ( pEntry->uName.cchAndStart != cchAndStart + || ( pEntry->uName.s.cch >= sizeof(cchAndStart) + && memcmp(pEntry->uName.s.sz, pszCmd, pEntry->uName.s.cch) != 0) ) + pEntry++; + else + { + /* + * That's a match! + * + * First get the environment if it is actually needed. This is + * especially important when we run on a worker thread as it must + * not under any circumstances do stuff like target_environment. + */ + int rc; + char **papszEnvVars = NULL; + if (pEntry->fNeedEnv) + { + papszEnvVars = pChild->environment; + if (!papszEnvVars) + pChild->environment = papszEnvVars = target_environment(pChild->file); + } + +#if defined(KBUILD_OS_WINDOWS) && defined(CONFIG_NEW_WIN_CHILDREN) + /* + * If the built-in is multi thread safe, we will run it on a job slot thread. + */ + if (pEntry->fMtSafe) + { + rc = MkWinChildCreateBuiltIn(pEntry, argc, argv, papszEnvVars, pChild, pPidSpawned); +# ifdef CONFIG_WITH_KMK_BUILTIN_STATS + g_aBuiltInStats[pEntry - &g_aBuiltIns[0]].cAsyncTimes++; +# endif + } + else +#endif + { + /* + * Call the worker function. + */ +#ifdef CONFIG_WITH_KMK_BUILTIN_STATS + big_int nsStart = print_stats_flag ? nano_timestamp() : 0; +#endif + KMKBUILTINCTX Ctx; + assert(g_fUMask == umask(g_fUMask)); + + Ctx.pszProgName = pEntry->uName.s.sz; + Ctx.pOut = pChild ? &pChild->output : NULL; + + if (pEntry->uFnSignature == FN_SIG_MAIN) + rc = pEntry->u.pfnMain(argc, argv, papszEnvVars, &Ctx); + else if (pEntry->uFnSignature == FN_SIG_MAIN_SPAWNS) + rc = pEntry->u.pfnMainSpawns(argc, argv, papszEnvVars, &Ctx, pChild, pPidSpawned); + else if (pEntry->uFnSignature == FN_SIG_MAIN_TO_SPAWN) + { + /* + * When we got something to execute, check if the child is a kmk_builtin thing. + * We recurse here, both because I'm lazy and because it's easier to debug a + * problem then (the call stack shows what's been going on). + */ + rc = pEntry->u.pfnMainToSpawn(argc, argv, papszEnvVars, &Ctx, ppapszArgvToSpawn); + if ( !rc + && *ppapszArgvToSpawn + && !strncmp(**ppapszArgvToSpawn, s_szPrefix, sizeof(s_szPrefix) - 1)) + { + char **argv_new = *ppapszArgvToSpawn; + int argc_new = 1; + while (argv_new[argc_new]) + argc_new++; + + assert(argv_new[0] != argv[0]); + assert(!*pPidSpawned); + + *ppapszArgvToSpawn = NULL; + rc = kmk_builtin_command_parsed(argc_new, argv_new, pChild, ppapszArgvToSpawn, pPidSpawned); + + free(argv_new[0]); + free(argv_new); + } + } + else + rc = 99; + + assert(g_fUMask == umask(g_fUMask)); /* builtin command must preserve umask! */ + +#ifdef CONFIG_WITH_KMK_BUILTIN_STATS + if (print_stats_flag) + { + uintptr_t iEntry = pEntry - &g_aBuiltIns[0]; + g_aBuiltInStats[iEntry].cTimes++; + g_aBuiltInStats[iEntry].cNs += nano_timestamp() - nsStart; + } +#endif + } + return rc; + } + + /* + * No match! :-( + */ + fprintf(stderr, "kmk_builtin: Unknown command '%s%s'!\n", s_szPrefix, pszCmd); + } + else + fprintf(stderr, "kmk_builtin: Invalid command prefix '%s'!\n", pszCmd); + return 1; +} + +#ifndef KBUILD_OS_WINDOWS +/** Dummy. */ +int kmk_builtin_dircache(int argc, char **argv, char **envp, PKMKBUILTINCTX pCtx) +{ + (void)argc; (void)argv; (void)envp; (void)pCtx; + return 0; +} +#endif + +#ifdef CONFIG_WITH_KMK_BUILTIN_STATS +/** + * Prints the statistiscs to the given output stream. + */ +extern void kmk_builtin_print_stats(FILE *pOutput, const char *pszPrefix) +{ + const unsigned cEntries = sizeof(g_aBuiltInStats) / sizeof(g_aBuiltInStats[0]); + unsigned i; + assert(print_stats_flag); + fprintf(pOutput, "\n%skmk built-in command statistics:\n", pszPrefix); + for (i = 0; i < cEntries; i++) + if (g_aBuiltInStats[i].cTimes > 0) + { + char szTotal[64]; + char szAvg[64]; + format_elapsed_nano(szTotal, sizeof(szTotal), g_aBuiltInStats[i].cNs); + format_elapsed_nano(szAvg, sizeof(szAvg), g_aBuiltInStats[i].cNs / g_aBuiltInStats[i].cTimes); + fprintf(pOutput, "%s kmk_builtin_%-9s: %4u times, %9s total, %9s/call\n", + pszPrefix, g_aBuiltIns[i].uName.s.sz, g_aBuiltInStats[i].cTimes, szTotal, szAvg); + } + else if (g_aBuiltInStats[i].cAsyncTimes > 0) + fprintf(pOutput, "%s kmk_builtin_%-9s: %4u times in worker thread\n", + pszPrefix, g_aBuiltIns[i].uName.s.sz, g_aBuiltInStats[i].cAsyncTimes); +} +#endif + |