| /* |
| * Copyright (c) 2016-2020, Facebook, Inc. |
| * All rights reserved. |
| * |
| * This source code is licensed under both the BSD-style license (found in the |
| * LICENSE file in the root directory of this source tree) and the GPLv2 (found |
| * in the COPYING file in the root directory of this source tree). |
| * You may select, at your option, one of the above-listed licenses. |
| */ |
| |
| #define ZSTD_STATIC_LINKING_ONLY |
| #define ZDICT_STATIC_LINKING_ONLY |
| |
| #include <string.h> |
| |
| #include "zstd_helpers.h" |
| #include "fuzz_helpers.h" |
| #include "zstd.h" |
| #include "zdict.h" |
| |
| const int kMinClevel = -3; |
| const int kMaxClevel = 19; |
| |
| static void set(ZSTD_CCtx *cctx, ZSTD_cParameter param, int value) |
| { |
| FUZZ_ZASSERT(ZSTD_CCtx_setParameter(cctx, param, value)); |
| } |
| |
| static void setRand(ZSTD_CCtx *cctx, ZSTD_cParameter param, unsigned min, |
| unsigned max, FUZZ_dataProducer_t *producer) { |
| unsigned const value = FUZZ_dataProducer_uint32Range(producer, min, max); |
| set(cctx, param, value); |
| } |
| |
| ZSTD_compressionParameters FUZZ_randomCParams(size_t srcSize, FUZZ_dataProducer_t *producer) |
| { |
| /* Select compression parameters */ |
| ZSTD_compressionParameters cParams; |
| cParams.windowLog = FUZZ_dataProducer_uint32Range(producer, ZSTD_WINDOWLOG_MIN, 15); |
| cParams.hashLog = FUZZ_dataProducer_uint32Range(producer, ZSTD_HASHLOG_MIN, 15); |
| cParams.chainLog = FUZZ_dataProducer_uint32Range(producer, ZSTD_CHAINLOG_MIN, 16); |
| cParams.searchLog = FUZZ_dataProducer_uint32Range(producer, ZSTD_SEARCHLOG_MIN, 9); |
| cParams.minMatch = FUZZ_dataProducer_uint32Range(producer, ZSTD_MINMATCH_MIN, |
| ZSTD_MINMATCH_MAX); |
| cParams.targetLength = FUZZ_dataProducer_uint32Range(producer, 0, 512); |
| cParams.strategy = FUZZ_dataProducer_uint32Range(producer, ZSTD_STRATEGY_MIN, ZSTD_STRATEGY_MAX); |
| return ZSTD_adjustCParams(cParams, srcSize, 0); |
| } |
| |
| ZSTD_frameParameters FUZZ_randomFParams(FUZZ_dataProducer_t *producer) |
| { |
| /* Select frame parameters */ |
| ZSTD_frameParameters fParams; |
| fParams.contentSizeFlag = FUZZ_dataProducer_uint32Range(producer, 0, 1); |
| fParams.checksumFlag = FUZZ_dataProducer_uint32Range(producer, 0, 1); |
| fParams.noDictIDFlag = FUZZ_dataProducer_uint32Range(producer, 0, 1); |
| return fParams; |
| } |
| |
| ZSTD_parameters FUZZ_randomParams(size_t srcSize, FUZZ_dataProducer_t *producer) |
| { |
| ZSTD_parameters params; |
| params.cParams = FUZZ_randomCParams(srcSize, producer); |
| params.fParams = FUZZ_randomFParams(producer); |
| return params; |
| } |
| |
| void FUZZ_setRandomParameters(ZSTD_CCtx *cctx, size_t srcSize, FUZZ_dataProducer_t *producer) |
| { |
| ZSTD_compressionParameters cParams = FUZZ_randomCParams(srcSize, producer); |
| set(cctx, ZSTD_c_windowLog, cParams.windowLog); |
| set(cctx, ZSTD_c_hashLog, cParams.hashLog); |
| set(cctx, ZSTD_c_chainLog, cParams.chainLog); |
| set(cctx, ZSTD_c_searchLog, cParams.searchLog); |
| set(cctx, ZSTD_c_minMatch, cParams.minMatch); |
| set(cctx, ZSTD_c_targetLength, cParams.targetLength); |
| set(cctx, ZSTD_c_strategy, cParams.strategy); |
| /* Select frame parameters */ |
| setRand(cctx, ZSTD_c_contentSizeFlag, 0, 1, producer); |
| setRand(cctx, ZSTD_c_checksumFlag, 0, 1, producer); |
| setRand(cctx, ZSTD_c_dictIDFlag, 0, 1, producer); |
| /* Select long distance matching parameters */ |
| setRand(cctx, ZSTD_c_enableLongDistanceMatching, 0, 1, producer); |
| setRand(cctx, ZSTD_c_ldmHashLog, ZSTD_HASHLOG_MIN, 16, producer); |
| setRand(cctx, ZSTD_c_ldmMinMatch, ZSTD_LDM_MINMATCH_MIN, |
| ZSTD_LDM_MINMATCH_MAX, producer); |
| setRand(cctx, ZSTD_c_ldmBucketSizeLog, 0, ZSTD_LDM_BUCKETSIZELOG_MAX, |
| producer); |
| setRand(cctx, ZSTD_c_ldmHashRateLog, ZSTD_LDM_HASHRATELOG_MIN, |
| ZSTD_LDM_HASHRATELOG_MAX, producer); |
| /* Set misc parameters */ |
| setRand(cctx, ZSTD_c_nbWorkers, 0, 2, producer); |
| setRand(cctx, ZSTD_c_rsyncable, 0, 1, producer); |
| setRand(cctx, ZSTD_c_forceMaxWindow, 0, 1, producer); |
| setRand(cctx, ZSTD_c_literalCompressionMode, 0, 2, producer); |
| setRand(cctx, ZSTD_c_forceAttachDict, 0, 2, producer); |
| if (FUZZ_dataProducer_uint32Range(producer, 0, 1) == 0) { |
| setRand(cctx, ZSTD_c_srcSizeHint, ZSTD_SRCSIZEHINT_MIN, 2 * srcSize, producer); |
| } |
| if (FUZZ_dataProducer_uint32Range(producer, 0, 1) == 0) { |
| setRand(cctx, ZSTD_c_targetCBlockSize, ZSTD_TARGETCBLOCKSIZE_MIN, ZSTD_TARGETCBLOCKSIZE_MAX, producer); |
| } |
| } |
| |
| FUZZ_dict_t FUZZ_train(void const* src, size_t srcSize, FUZZ_dataProducer_t *producer) |
| { |
| size_t const dictSize = MAX(srcSize / 8, 1024); |
| size_t const totalSampleSize = dictSize * 11; |
| FUZZ_dict_t dict = { FUZZ_malloc(dictSize), dictSize }; |
| char* const samples = (char*)FUZZ_malloc(totalSampleSize); |
| unsigned nbSamples = 100; |
| size_t* const samplesSizes = (size_t*)FUZZ_malloc(sizeof(size_t) * nbSamples); |
| size_t pos = 0; |
| size_t sample = 0; |
| ZDICT_fastCover_params_t params; |
| |
| for (sample = 0; sample < nbSamples; ++sample) { |
| size_t const remaining = totalSampleSize - pos; |
| size_t const offset = FUZZ_dataProducer_uint32Range(producer, 0, MAX(srcSize, 1) - 1); |
| size_t const limit = MIN(srcSize - offset, remaining); |
| size_t const toCopy = MIN(limit, remaining / (nbSamples - sample)); |
| memcpy(samples + pos, src + offset, toCopy); |
| pos += toCopy; |
| samplesSizes[sample] = toCopy; |
| } |
| memset(samples + pos, 0, totalSampleSize - pos); |
| |
| memset(¶ms, 0, sizeof(params)); |
| params.accel = 5; |
| params.k = 40; |
| params.d = 8; |
| params.f = 14; |
| params.zParams.compressionLevel = 1; |
| dict.size = ZDICT_trainFromBuffer_fastCover(dict.buff, dictSize, |
| samples, samplesSizes, nbSamples, params); |
| if (ZSTD_isError(dict.size)) { |
| free(dict.buff); |
| memset(&dict, 0, sizeof(dict)); |
| } |
| |
| free(samplesSizes); |
| free(samples); |
| |
| return dict; |
| } |