/* * * honggfuzz - file operations * ----------------------------------------- * * Author: Robert Swiecki * * Copyright 2010-2015 by Google Inc. All Rights Reserved. * * Licensed under the Apache License, Version 2.0 (the "License"); you may * not use this file except in compliance with the License. You may obtain * a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or * implied. See the License for the specific language governing * permissions and limitations under the License. * */ #include "input.h" #include #include #include #include #include #include #include #include #include #include #include #include #include #include "libhfcommon/common.h" #include "libhfcommon/files.h" #include "mangle.h" #include "subproc.h" #if defined(_HF_ARCH_LINUX) #include #if defined(__NR_memfd_create) #include #endif /* defined(__NR_memfd_create) */ #endif /* defined(_HF_ARCH_LINUX) */ #include "libhfcommon/log.h" #include "libhfcommon/util.h" void input_setSize(run_t* run, size_t sz) { if (sz > run->global->maxFileSz) { PLOG_F("Too large size requested: %zu > maxSize: %zu", sz, run->global->maxFileSz); } run->dynamicFileSz = sz; } static bool input_getDirStatsAndRewind(honggfuzz_t* hfuzz) { rewinddir(hfuzz->io.inputDirPtr); size_t maxSize = 0U; size_t fileCnt = 0U; for (;;) { errno = 0; struct dirent* entry = readdir(hfuzz->io.inputDirPtr); if (entry == NULL && errno == EINTR) { continue; } if (entry == NULL && errno != 0) { PLOG_W("readdir('%s')", hfuzz->io.inputDir); return false; } if (entry == NULL) { break; } char fname[PATH_MAX]; snprintf(fname, sizeof(fname), "%s/%s", hfuzz->io.inputDir, entry->d_name); LOG_D("Analyzing file '%s'", fname); struct stat st; if (stat(fname, &st) == -1) { LOG_W("Couldn't stat() the '%s' file", fname); continue; } if (!S_ISREG(st.st_mode)) { LOG_D("'%s' is not a regular file, skipping", fname); continue; } if (hfuzz->maxFileSz != 0UL && st.st_size > (off_t)hfuzz->maxFileSz) { LOG_W("File '%s' is bigger than maximal defined file size (-F): %" PRId64 " > %" PRId64, fname, (int64_t)st.st_size, (int64_t)hfuzz->maxFileSz); } if ((size_t)st.st_size > maxSize) { maxSize = st.st_size; } fileCnt++; } ATOMIC_SET(hfuzz->io.fileCnt, fileCnt); if (hfuzz->maxFileSz == 0U) { if (maxSize < 8192) { hfuzz->maxFileSz = 8192; } else if (maxSize > _HF_INPUT_MAX_SIZE) { hfuzz->maxFileSz = _HF_INPUT_MAX_SIZE; } else { hfuzz->maxFileSz = maxSize; } } if (hfuzz->io.fileCnt == 0U) { LOG_W("No usable files in the input directory '%s'", hfuzz->io.inputDir); } LOG_D("Re-read the '%s', maxFileSz:%zu, number of usable files:%zu", hfuzz->io.inputDir, hfuzz->maxFileSz, hfuzz->io.fileCnt); rewinddir(hfuzz->io.inputDirPtr); return true; } bool input_getNext(run_t* run, char* fname, bool rewind) { static pthread_mutex_t input_mutex = PTHREAD_MUTEX_INITIALIZER; MX_SCOPED_LOCK(&input_mutex); if (run->global->io.fileCnt == 0U) { LOG_W("No useful files in the input directory"); return false; } for (;;) { errno = 0; struct dirent* entry = readdir(run->global->io.inputDirPtr); if (entry == NULL && errno == EINTR) { continue; } if (entry == NULL && errno != 0) { PLOG_W("readdir_r('%s')", run->global->io.inputDir); return false; } if (entry == NULL && rewind == false) { return false; } if (entry == NULL && rewind == true) { if (input_getDirStatsAndRewind(run->global) == false) { LOG_E("input_getDirStatsAndRewind('%s')", run->global->io.inputDir); return false; } continue; } snprintf(fname, PATH_MAX, "%s/%s", run->global->io.inputDir, entry->d_name); struct stat st; if (stat(fname, &st) == -1) { LOG_W("Couldn't stat() the '%s' file", fname); continue; } if (!S_ISREG(st.st_mode)) { LOG_D("'%s' is not a regular file, skipping", fname); continue; } return true; } } bool input_init(honggfuzz_t* hfuzz) { hfuzz->io.fileCnt = 0U; if (!hfuzz->io.inputDir) { LOG_W("No input file/dir specified"); return false; } int dir_fd = open(hfuzz->io.inputDir, O_DIRECTORY | O_RDONLY | O_CLOEXEC); if (dir_fd == -1) { PLOG_W("open('%s', O_DIRECTORY|O_RDONLY|O_CLOEXEC)", hfuzz->io.inputDir); return false; } if ((hfuzz->io.inputDirPtr = fdopendir(dir_fd)) == NULL) { close(dir_fd); PLOG_W("opendir('%s')", hfuzz->io.inputDir); return false; } if (input_getDirStatsAndRewind(hfuzz) == false) { hfuzz->io.fileCnt = 0U; LOG_W("input_getDirStatsAndRewind('%s')", hfuzz->io.inputDir); return false; } return true; } bool input_parseDictionary(honggfuzz_t* hfuzz) { FILE* fDict = fopen(hfuzz->dictionaryFile, "rb"); if (fDict == NULL) { PLOG_W("Couldn't open '%s' - R/O mode", hfuzz->dictionaryFile); return false; } defer { fclose(fDict); }; char* lineptr = NULL; size_t n = 0; defer { free(lineptr); }; for (;;) { ssize_t len = getdelim(&lineptr, &n, '\n', fDict); if (len == -1) { break; } if (len > 1 && lineptr[len - 1] == '\n') { lineptr[len - 1] = '\0'; len--; } if (lineptr[0] == '#') { continue; } if (lineptr[0] == '\n') { continue; } if (lineptr[0] == '\0') { continue; } char bufn[1025] = {}; char bufv[1025] = {}; if (sscanf(lineptr, "\"%1024s", bufv) != 1 && sscanf(lineptr, "%1024[^=]=\"%1024s", bufn, bufv) != 2) { LOG_W("Incorrect dictionary entry: '%s'. Skipping", lineptr); continue; } LOG_D("Parsing word: '%s'", bufv); char* s = util_StrDup(bufv); struct strings_t* str = (struct strings_t*)util_Malloc(sizeof(struct strings_t)); str->len = util_decodeCString(s); str->s = s; hfuzz->dictionaryCnt += 1; TAILQ_INSERT_TAIL(&hfuzz->dictq, str, pointers); LOG_D("Dictionary: loaded word: '%s' (len=%zu)", str->s, str->len); } LOG_I("Loaded %zu words from the dictionary", hfuzz->dictionaryCnt); return true; } bool input_parseBlacklist(honggfuzz_t* hfuzz) { FILE* fBl = fopen(hfuzz->blacklistFile, "rb"); if (fBl == NULL) { PLOG_W("Couldn't open '%s' - R/O mode", hfuzz->blacklistFile); return false; } defer { fclose(fBl); }; char* lineptr = NULL; /* lineptr can be NULL, but it's fine for free() */ defer { free(lineptr); }; size_t n = 0; for (;;) { if (getline(&lineptr, &n, fBl) == -1) { break; } if ((hfuzz->blacklist = util_Realloc(hfuzz->blacklist, (hfuzz->blacklistCnt + 1) * sizeof(hfuzz->blacklist[0]))) == NULL) { PLOG_W( "realloc failed (sz=%zu)", (hfuzz->blacklistCnt + 1) * sizeof(hfuzz->blacklist[0])); return false; } hfuzz->blacklist[hfuzz->blacklistCnt] = strtoull(lineptr, 0, 16); LOG_D("Blacklist: loaded %'" PRIu64 "'", hfuzz->blacklist[hfuzz->blacklistCnt]); // Verify entries are sorted so we can use interpolation search if (hfuzz->blacklistCnt > 1) { if (hfuzz->blacklist[hfuzz->blacklistCnt - 1] > hfuzz->blacklist[hfuzz->blacklistCnt]) { LOG_F( "Blacklist file not sorted. Use 'tools/createStackBlacklist.sh' to sort " "records"); return false; } } hfuzz->blacklistCnt += 1; } if (hfuzz->blacklistCnt > 0) { LOG_I("Loaded %zu stack hash(es) from the blacklist file", hfuzz->blacklistCnt); } else { LOG_F("Empty stack hashes blacklist file '%s'", hfuzz->blacklistFile); } return true; } bool input_prepareDynamicInput(run_t* run) { run->origFileName = "[DYNAMIC]"; { MX_SCOPED_RWLOCK_READ(&run->global->dynfileq_mutex); if (run->global->dynfileqCnt == 0) { LOG_F("The dynamic file corpus is empty. This shouldn't happen"); } if (run->dynfileqCurrent == NULL) { run->dynfileqCurrent = TAILQ_FIRST(&run->global->dynfileq); } else { if (run->dynfileqCurrent == TAILQ_LAST(&run->global->dynfileq, dyns_t)) { run->dynfileqCurrent = TAILQ_FIRST(&run->global->dynfileq); } else { run->dynfileqCurrent = TAILQ_NEXT(run->dynfileqCurrent, pointers); } } } input_setSize(run, run->dynfileqCurrent->size); memcpy(run->dynamicFile, run->dynfileqCurrent->data, run->dynfileqCurrent->size); mangle_mangleContent(run); return true; } bool input_prepareStaticFile(run_t* run, bool rewind) { static __thread char fname[PATH_MAX]; if (!input_getNext(run, fname, /* rewind= */ rewind)) { return false; } run->origFileName = files_basename(fname); ssize_t fileSz = files_readFileToBufMax(fname, run->dynamicFile, run->global->maxFileSz); if (fileSz < 0) { LOG_E("Couldn't read contents of '%s'", fname); return false; } input_setSize(run, fileSz); mangle_mangleContent(run); return true; } bool input_prepareExternalFile(run_t* run) { run->origFileName = "[EXTERNAL]"; int fd = files_writeBufToTmpFile(run->global->io.workDir, (const uint8_t*)"", 0, 0); if (fd == -1) { LOG_E("Couldn't write input file to a temporary buffer"); return false; } defer { close(fd); }; char fname[PATH_MAX]; snprintf(fname, sizeof(fname), "/dev/fd/%d", fd); const char* const argv[] = {run->global->exe.externalCommand, fname, NULL}; if (subproc_System(run, argv) != 0) { LOG_E("Subprocess '%s' returned abnormally", run->global->exe.externalCommand); return false; } LOG_D("Subporcess '%s' finished with success", run->global->exe.externalCommand); ssize_t sz = files_readFromFdSeek(fd, run->dynamicFile, run->global->maxFileSz, 0); if (sz == -1) { LOG_E("Couldn't read file from fd=%d", fd); return false; } input_setSize(run, (size_t)sz); return true; } bool input_postProcessFile(run_t* run) { int fd = files_writeBufToTmpFile(run->global->io.workDir, run->dynamicFile, run->dynamicFileSz, 0); if (fd == -1) { LOG_E("Couldn't write input file to a temporary buffer"); return false; } defer { close(fd); }; char fname[PATH_MAX]; snprintf(fname, sizeof(fname), "/dev/fd/%d", fd); const char* const argv[] = {run->global->exe.postExternalCommand, fname, NULL}; if (subproc_System(run, argv) != 0) { LOG_E("Subprocess '%s' returned abnormally", run->global->exe.postExternalCommand); return false; } LOG_D("Subporcess '%s' finished with success", run->global->exe.externalCommand); ssize_t sz = files_readFromFdSeek(fd, run->dynamicFile, run->global->maxFileSz, 0); if (sz == -1) { LOG_E("Couldn't read file from fd=%d", fd); return false; } input_setSize(run, (size_t)sz); return true; }