| /** |
| * JPEG XL parser |
| * Copyright (c) 2023 Leo Izen <leo.izen@gmail.com> |
| * |
| * This file is part of FFmpeg. |
| * |
| * FFmpeg is free software; you can redistribute it and/or |
| * modify it under the terms of the GNU Lesser General Public |
| * License as published by the Free Software Foundation; either |
| * version 2.1 of the License, or (at your option) any later version. |
| * |
| * FFmpeg is distributed in the hope that it will be useful, |
| * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| * Lesser General Public License for more details. |
| * |
| * You should have received a copy of the GNU Lesser General Public |
| * License along with FFmpeg; if not, write to the Free Software |
| * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
| */ |
| |
| #include <errno.h> |
| #include <stdint.h> |
| #include <string.h> |
| |
| #include "libavutil/attributes.h" |
| #include "libavutil/error.h" |
| #include "libavutil/intmath.h" |
| #include "libavutil/macros.h" |
| #include "libavutil/mem.h" |
| #include "libavutil/pixfmt.h" |
| |
| #include "bytestream.h" |
| #include "codec_id.h" |
| #define UNCHECKED_BITSTREAM_READER 0 |
| #define BITSTREAM_READER_LE |
| #include "get_bits.h" |
| #include "jpegxl.h" |
| #include "jpegxl_parse.h" |
| #include "parser.h" |
| #include "vlc.h" |
| |
| #define JXL_FLAG_NOISE 1 |
| #define JXL_FLAG_PATCHES 2 |
| #define JXL_FLAG_SPLINES 16 |
| #define JXL_FLAG_USE_LF_FRAME 32 |
| #define JXL_FLAG_SKIP_ADAPTIVE_LF_SMOOTH 128 |
| |
| #define MAX_PREFIX_ALPHABET_SIZE (1u << 15) |
| |
| #define clog1p(x) (ff_log2(x) + !!(x)) |
| #define unpack_signed(x) (((x) & 1 ? -(x)-1 : (x))/2) |
| #define div_ceil(x, y) (((x) - 1) / (y) + 1) |
| #define vlm(a,b) {.sym = (a), .len = (b)} |
| |
| typedef struct JXLHybridUintConf { |
| int split_exponent; |
| uint32_t msb_in_token; |
| uint32_t lsb_in_token; |
| } JXLHybridUintConf; |
| |
| typedef struct JXLSymbolDistribution { |
| JXLHybridUintConf config; |
| int log_bucket_size; |
| /* this is the actual size of the alphabet */ |
| int alphabet_size; |
| /* ceil(log(alphabet_size)) */ |
| int log_alphabet_size; |
| |
| /* for prefix code distributions */ |
| VLC vlc; |
| /* in case bits == 0 */ |
| uint32_t default_symbol; |
| |
| /* |
| * each (1 << log_alphabet_size) length |
| * with log_alphabet_size <= 8 |
| */ |
| /* frequencies associated with this Distribution */ |
| uint32_t freq[258]; |
| /* cutoffs for using the symbol table */ |
| uint16_t cutoffs[258]; |
| /* the symbol table for this distribution */ |
| uint16_t symbols[258]; |
| /* the offset for symbols */ |
| uint16_t offsets[258]; |
| |
| /* if this distribution contains only one symbol this is its index */ |
| int uniq_pos; |
| } JXLSymbolDistribution; |
| |
| typedef struct JXLDistributionBundle { |
| /* lz77 flags */ |
| int lz77_enabled; |
| uint32_t lz77_min_symbol; |
| uint32_t lz77_min_length; |
| JXLHybridUintConf lz_len_conf; |
| |
| /* one entry for each distribution */ |
| uint8_t *cluster_map; |
| /* length of cluster_map */ |
| int num_dist; |
| |
| /* one for each cluster */ |
| JXLSymbolDistribution *dists; |
| int num_clusters; |
| |
| /* whether to use brotli prefixes or ans */ |
| int use_prefix_code; |
| /* bundle log alphabet size, dist ones may be smaller */ |
| int log_alphabet_size; |
| } JXLDistributionBundle; |
| |
| typedef struct JXLEntropyDecoder { |
| |
| /* state is a positive 32-bit integer, or -1 if unset */ |
| int64_t state; |
| |
| /* lz77 values */ |
| uint32_t num_to_copy; |
| uint32_t copy_pos; |
| uint32_t num_decoded; |
| |
| /* length is (1 << 20) */ |
| /* if lz77 is enabled for this bundle */ |
| /* if lz77 is disabled it's NULL */ |
| uint32_t *window; |
| |
| /* primary bundle associated with this distribution */ |
| JXLDistributionBundle bundle; |
| |
| /* for av_log */ |
| void *logctx; |
| } JXLEntropyDecoder; |
| |
| typedef struct JXLFrame { |
| FFJXLFrameType type; |
| FFJXLFrameEncoding encoding; |
| |
| int is_last; |
| int full_frame; |
| |
| uint32_t total_length; |
| uint32_t body_length; |
| } JXLFrame; |
| |
| typedef struct JXLCodestream { |
| FFJXLMetadata meta; |
| JXLFrame frame; |
| } JXLCodestream; |
| |
| typedef struct JXLParseContext { |
| ParseContext pc; |
| JXLCodestream codestream; |
| |
| /* using ISOBMFF-based container */ |
| int container; |
| int skip; |
| int copied; |
| int collected_size; |
| int codestream_length; |
| int skipped_icc; |
| int next; |
| |
| uint8_t cs_buffer[4096 + AV_INPUT_BUFFER_PADDING_SIZE]; |
| } JXLParseContext; |
| |
| /* used for reading brotli prefixes */ |
| static const VLCElem level0_table[16] = { |
| vlm(0, 2), vlm(4, 2), vlm(3, 2), vlm(2, 3), vlm(0, 2), vlm(4, 2), vlm(3, 2), vlm(1, 4), |
| vlm(0, 2), vlm(4, 2), vlm(3, 2), vlm(2, 3), vlm(0, 2), vlm(4, 2), vlm(3, 2), vlm(5, 4), |
| }; |
| |
| /* prefix table for populating ANS distribution */ |
| static const VLCElem dist_prefix_table[128] = { |
| vlm(10, 3), vlm(12, 7), vlm(7, 3), vlm(3, 4), vlm(6, 3), vlm(8, 3), vlm(9, 3), vlm(5, 4), |
| vlm(10, 3), vlm(4, 4), vlm(7, 3), vlm(1, 4), vlm(6, 3), vlm(8, 3), vlm(9, 3), vlm(2, 4), |
| vlm(10, 3), vlm(0, 5), vlm(7, 3), vlm(3, 4), vlm(6, 3), vlm(8, 3), vlm(9, 3), vlm(5, 4), |
| vlm(10, 3), vlm(4, 4), vlm(7, 3), vlm(1, 4), vlm(6, 3), vlm(8, 3), vlm(9, 3), vlm(2, 4), |
| vlm(10, 3), vlm(11, 6), vlm(7, 3), vlm(3, 4), vlm(6, 3), vlm(8, 3), vlm(9, 3), vlm(5, 4), |
| vlm(10, 3), vlm(4, 4), vlm(7, 3), vlm(1, 4), vlm(6, 3), vlm(8, 3), vlm(9, 3), vlm(2, 4), |
| vlm(10, 3), vlm(0, 5), vlm(7, 3), vlm(3, 4), vlm(6, 3), vlm(8, 3), vlm(9, 3), vlm(5, 4), |
| vlm(10, 3), vlm(4, 4), vlm(7, 3), vlm(1, 4), vlm(6, 3), vlm(8, 3), vlm(9, 3), vlm(2, 4), |
| vlm(10, 3), vlm(13, 7), vlm(7, 3), vlm(3, 4), vlm(6, 3), vlm(8, 3), vlm(9, 3), vlm(5, 4), |
| vlm(10, 3), vlm(4, 4), vlm(7, 3), vlm(1, 4), vlm(6, 3), vlm(8, 3), vlm(9, 3), vlm(2, 4), |
| vlm(10, 3), vlm(0, 5), vlm(7, 3), vlm(3, 4), vlm(6, 3), vlm(8, 3), vlm(9, 3), vlm(5, 4), |
| vlm(10, 3), vlm(4, 4), vlm(7, 3), vlm(1, 4), vlm(6, 3), vlm(8, 3), vlm(9, 3), vlm(2, 4), |
| vlm(10, 3), vlm(11, 6), vlm(7, 3), vlm(3, 4), vlm(6, 3), vlm(8, 3), vlm(9, 3), vlm(5, 4), |
| vlm(10, 3), vlm(4, 4), vlm(7, 3), vlm(1, 4), vlm(6, 3), vlm(8, 3), vlm(9, 3), vlm(2, 4), |
| vlm(10, 3), vlm(0, 5), vlm(7, 3), vlm(3, 4), vlm(6, 3), vlm(8, 3), vlm(9, 3), vlm(5, 4), |
| vlm(10, 3), vlm(4, 4), vlm(7, 3), vlm(1, 4), vlm(6, 3), vlm(8, 3), vlm(9, 3), vlm(2, 4), |
| }; |
| |
| static const uint8_t prefix_codelen_map[18] = { |
| 1, 2, 3, 4, 0, 5, 17, 6, 16, 7, 8, 9, 10, 11, 12, 13, 14, 15, |
| }; |
| |
| /** |
| * Read a variable-length 8-bit integer. |
| * Used when populating the ANS frequency tables. |
| */ |
| static av_always_inline uint8_t jxl_u8(GetBitContext *gb) |
| { |
| int n; |
| if (!get_bits1(gb)) |
| return 0; |
| n = get_bits(gb, 3); |
| |
| return get_bitsz(gb, n) | (1 << n); |
| } |
| |
| /* read a U32(c_i + u(u_i)) */ |
| static av_always_inline uint32_t jxl_u32(GetBitContext *gb, |
| uint32_t c0, uint32_t c1, uint32_t c2, uint32_t c3, |
| uint32_t u0, uint32_t u1, uint32_t u2, uint32_t u3) |
| { |
| const uint32_t constants[4] = {c0, c1, c2, c3}; |
| const uint32_t ubits [4] = {u0, u1, u2, u3}; |
| uint32_t ret, choice = get_bits(gb, 2); |
| |
| ret = constants[choice]; |
| if (ubits[choice]) |
| ret += get_bits_long(gb, ubits[choice]); |
| |
| return ret; |
| } |
| |
| /* read a U64() */ |
| static uint64_t jxl_u64(GetBitContext *gb) |
| { |
| uint64_t shift = 12, ret; |
| |
| switch (get_bits(gb, 2)) { |
| case 1: |
| ret = 1 + get_bits(gb, 4); |
| break; |
| case 2: |
| ret = 17 + get_bits(gb, 8); |
| break; |
| case 3: |
| ret = get_bits(gb, 12); |
| while (get_bits1(gb)) { |
| if (shift < 60) { |
| ret |= (uint64_t)get_bits(gb, 8) << shift; |
| shift += 8; |
| } else { |
| ret |= (uint64_t)get_bits(gb, 4) << shift; |
| break; |
| } |
| } |
| break; |
| default: |
| ret = 0; |
| } |
| |
| return ret; |
| } |
| |
| static int read_hybrid_uint_conf(GetBitContext *gb, JXLHybridUintConf *conf, int log_alphabet_size) |
| { |
| conf->split_exponent = get_bitsz(gb, clog1p(log_alphabet_size)); |
| if (conf->split_exponent == log_alphabet_size) { |
| conf->msb_in_token = conf->lsb_in_token = 0; |
| return 0; |
| } |
| |
| conf->msb_in_token = get_bitsz(gb, clog1p(conf->split_exponent)); |
| if (conf->msb_in_token > conf->split_exponent) |
| return AVERROR_INVALIDDATA; |
| conf->lsb_in_token = get_bitsz(gb, clog1p(conf->split_exponent - conf->msb_in_token)); |
| if (conf->msb_in_token + conf->lsb_in_token > conf->split_exponent) |
| return AVERROR_INVALIDDATA; |
| |
| return 0; |
| } |
| |
| static int read_hybrid_uint(GetBitContext *gb, const JXLHybridUintConf *conf, uint32_t token, uint32_t *hybrid_uint) |
| { |
| uint32_t n, low, split = 1 << conf->split_exponent; |
| |
| if (token < split) { |
| *hybrid_uint = token; |
| return 0; |
| } |
| |
| n = conf->split_exponent - conf->lsb_in_token - conf->msb_in_token + |
| ((token - split) >> (conf->msb_in_token + conf->lsb_in_token)); |
| if (n >= 32) |
| return AVERROR_INVALIDDATA; |
| low = token & ((1 << conf->lsb_in_token) - 1); |
| token >>= conf->lsb_in_token; |
| token &= (1 << conf->msb_in_token) - 1; |
| token |= 1 << conf->msb_in_token; |
| *hybrid_uint = (((token << n) | get_bits_long(gb, n)) << conf->lsb_in_token ) | low; |
| |
| return 0; |
| } |
| |
| static inline uint32_t read_prefix_symbol(GetBitContext *gb, const JXLSymbolDistribution *dist) |
| { |
| if (!dist->vlc.bits) |
| return dist->default_symbol; |
| |
| return get_vlc2(gb, dist->vlc.table, dist->vlc.bits, 1); |
| } |
| |
| static uint32_t read_ans_symbol(GetBitContext *gb, JXLEntropyDecoder *dec, const JXLSymbolDistribution *dist) |
| { |
| uint32_t index, i, pos, symbol, offset; |
| |
| if (dec->state < 0) |
| dec->state = get_bits_long(gb, 32); |
| |
| index = dec->state & 0xFFF; |
| i = index >> dist->log_bucket_size; |
| pos = index & ((1 << dist->log_bucket_size) - 1); |
| symbol = pos >= dist->cutoffs[i] ? dist->symbols[i] : i; |
| offset = pos >= dist->cutoffs[i] ? dist->offsets[i] + pos : pos; |
| dec->state = dist->freq[symbol] * (dec->state >> 12) + offset; |
| if (dec->state < (1 << 16)) |
| dec->state = (dec->state << 16) | get_bits(gb, 16); |
| dec->state &= 0xFFFFFFFF; |
| |
| return symbol; |
| } |
| |
| static int decode_hybrid_varlen_uint(GetBitContext *gb, JXLEntropyDecoder *dec, |
| const JXLDistributionBundle *bundle, |
| uint32_t context, uint32_t *hybrid_uint) |
| { |
| int ret; |
| uint32_t token, distance; |
| const JXLSymbolDistribution *dist; |
| |
| if (dec->num_to_copy > 0) { |
| *hybrid_uint = dec->window[dec->copy_pos++ & 0xFFFFF]; |
| dec->num_to_copy--; |
| dec->window[dec->num_decoded++ & 0xFFFFF] = *hybrid_uint; |
| return 0; |
| } |
| |
| if (context >= bundle->num_dist) |
| return AVERROR(EINVAL); |
| if (bundle->cluster_map[context] >= bundle->num_clusters) |
| return AVERROR_INVALIDDATA; |
| |
| dist = &bundle->dists[bundle->cluster_map[context]]; |
| if (bundle->use_prefix_code) |
| token = read_prefix_symbol(gb, dist); |
| else |
| token = read_ans_symbol(gb, dec, dist); |
| |
| if (bundle->lz77_enabled && token >= bundle->lz77_min_symbol) { |
| const JXLSymbolDistribution *lz77dist = &bundle->dists[bundle->cluster_map[bundle->num_dist - 1]]; |
| ret = read_hybrid_uint(gb, &bundle->lz_len_conf, token - bundle->lz77_min_symbol, &dec->num_to_copy); |
| if (ret < 0) |
| return ret; |
| dec->num_to_copy += bundle->lz77_min_length; |
| if (bundle->use_prefix_code) |
| token = read_prefix_symbol(gb, lz77dist); |
| else |
| token = read_ans_symbol(gb, dec, lz77dist); |
| ret = read_hybrid_uint(gb, &lz77dist->config, token, &distance); |
| if (ret < 0) |
| return ret; |
| distance++; |
| distance = FFMIN3(distance, dec->num_decoded, 1 << 20); |
| dec->copy_pos = dec->num_decoded - distance; |
| return decode_hybrid_varlen_uint(gb, dec, bundle, context, hybrid_uint); |
| } |
| ret = read_hybrid_uint(gb, &dist->config, token, hybrid_uint); |
| if (ret < 0) |
| return ret; |
| if (bundle->lz77_enabled) |
| dec->window[dec->num_decoded++ & 0xFFFFF] = *hybrid_uint; |
| |
| return 0; |
| } |
| |
| static int populate_distribution(GetBitContext *gb, JXLSymbolDistribution *dist, int log_alphabet_size) |
| { |
| int len = 0, shift, omit_log = -1, omit_pos = -1; |
| int prev = 0, num_same = 0; |
| uint32_t total_count = 0; |
| uint8_t logcounts[258] = { 0 }; |
| uint8_t same[258] = { 0 }; |
| const int table_size = 1 << log_alphabet_size; |
| dist->uniq_pos = -1; |
| |
| if (get_bits1(gb)) { |
| /* simple code */ |
| if (get_bits1(gb)) { |
| uint8_t v1 = jxl_u8(gb); |
| uint8_t v2 = jxl_u8(gb); |
| if (v1 == v2) |
| return AVERROR_INVALIDDATA; |
| dist->freq[v1] = get_bits(gb, 12); |
| dist->freq[v2] = (1 << 12) - dist->freq[v1]; |
| if (!dist->freq[v1]) |
| dist->uniq_pos = v2; |
| dist->alphabet_size = 1 + FFMAX(v1, v2); |
| } else { |
| uint8_t x = jxl_u8(gb); |
| dist->freq[x] = 1 << 12; |
| dist->uniq_pos = x; |
| dist->alphabet_size = 1 + x; |
| } |
| if (dist->alphabet_size > table_size) |
| return AVERROR_INVALIDDATA; |
| |
| return 0; |
| } |
| |
| if (get_bits1(gb)) { |
| /* flat code */ |
| dist->alphabet_size = jxl_u8(gb) + 1; |
| if (dist->alphabet_size > table_size) |
| return AVERROR_INVALIDDATA; |
| for (int i = 0; i < dist->alphabet_size; i++) |
| dist->freq[i] = (1 << 12) / dist->alphabet_size; |
| for (int i = 0; i < (1 << 12) % dist->alphabet_size; i++) |
| dist->freq[i]++; |
| return 0; |
| } |
| |
| do { |
| if (!get_bits1(gb)) |
| break; |
| } while (++len < 3); |
| |
| shift = (get_bitsz(gb, len) | (1 << len)) - 1; |
| if (shift > 13) |
| return AVERROR_INVALIDDATA; |
| |
| dist->alphabet_size = jxl_u8(gb) + 3; |
| if (dist->alphabet_size > table_size) |
| return AVERROR_INVALIDDATA; |
| |
| for (int i = 0; i < dist->alphabet_size; i++) { |
| logcounts[i] = get_vlc2(gb, dist_prefix_table, 7, 1); |
| if (logcounts[i] == 13) { |
| int rle = jxl_u8(gb); |
| same[i] = rle + 5; |
| i += rle + 3; |
| continue; |
| } |
| if (logcounts[i] > omit_log) { |
| omit_log = logcounts[i]; |
| omit_pos = i; |
| } |
| } |
| if (omit_pos < 0 || omit_pos + 1 < dist->alphabet_size && logcounts[omit_pos + 1] == 13) |
| return AVERROR_INVALIDDATA; |
| |
| for (int i = 0; i < dist->alphabet_size; i++) { |
| if (same[i]) { |
| num_same = same[i] - 1; |
| prev = i > 0 ? dist->freq[i - 1] : 0; |
| } |
| if (num_same) { |
| dist->freq[i] = prev; |
| num_same--; |
| } else { |
| if (i == omit_pos || !logcounts[i]) |
| continue; |
| if (logcounts[i] == 1) { |
| dist->freq[i] = 1; |
| } else { |
| int bitcount = FFMIN(FFMAX(0, shift - ((12 - logcounts[i] + 1) >> 1)), logcounts[i] - 1); |
| dist->freq[i] = (1 << (logcounts[i] - 1)) + (get_bitsz(gb, bitcount) << (logcounts[i] - 1 - bitcount)); |
| } |
| } |
| total_count += dist->freq[i]; |
| } |
| dist->freq[omit_pos] = (1 << 12) - total_count; |
| |
| return 0; |
| } |
| |
| static void dist_bundle_close(JXLDistributionBundle *bundle) |
| { |
| if (bundle->use_prefix_code && bundle->dists) |
| for (int i = 0; i < bundle->num_clusters; i++) |
| ff_vlc_free(&bundle->dists[i].vlc); |
| av_freep(&bundle->dists); |
| av_freep(&bundle->cluster_map); |
| } |
| |
| |
| static int read_distribution_bundle(GetBitContext *gb, JXLEntropyDecoder *dec, |
| JXLDistributionBundle *bundle, int num_dist, int disallow_lz77); |
| |
| static int read_dist_clustering(GetBitContext *gb, JXLEntropyDecoder *dec, JXLDistributionBundle *bundle) |
| { |
| int ret; |
| |
| bundle->cluster_map = av_malloc(bundle->num_dist); |
| if (!bundle->cluster_map) |
| return AVERROR(ENOMEM); |
| |
| if (bundle->num_dist == 1) { |
| bundle->cluster_map[0] = 0; |
| bundle->num_clusters = 1; |
| return 0; |
| } |
| |
| if (get_bits1(gb)) { |
| /* simple clustering */ |
| uint32_t nbits = get_bits(gb, 2); |
| for (int i = 0; i < bundle->num_dist; i++) |
| bundle->cluster_map[i] = get_bitsz(gb, nbits); |
| } else { |
| /* complex clustering */ |
| int use_mtf = get_bits1(gb); |
| JXLDistributionBundle nested = { 0 }; |
| /* num_dist == 1 prevents this from recursing again */ |
| ret = read_distribution_bundle(gb, dec, &nested, 1, bundle->num_dist <= 2); |
| if (ret < 0) { |
| dist_bundle_close(&nested); |
| return ret; |
| } |
| for (int i = 0; i < bundle->num_dist; i++) { |
| uint32_t clust; |
| ret = decode_hybrid_varlen_uint(gb, dec, &nested, 0, &clust); |
| if (ret < 0) { |
| dist_bundle_close(&nested); |
| return ret; |
| } |
| bundle->cluster_map[i] = clust; |
| } |
| dec->state = -1; |
| /* it's not going to necessarily be zero after reading */ |
| dec->num_to_copy = 0; |
| dist_bundle_close(&nested); |
| if (use_mtf) { |
| uint8_t mtf[256]; |
| for (int i = 0; i < 256; i++) |
| mtf[i] = i; |
| for (int i = 0; i < bundle->num_dist; i++) { |
| int index = bundle->cluster_map[i]; |
| bundle->cluster_map[i] = mtf[index]; |
| if (index) { |
| int value = mtf[index]; |
| for (int j = index; j > 0; j--) |
| mtf[j] = mtf[j - 1]; |
| mtf[0] = value; |
| } |
| } |
| } |
| } |
| for (int i = 0; i < bundle->num_dist; i++) { |
| if (bundle->cluster_map[i] >= bundle->num_clusters) |
| bundle->num_clusters = bundle->cluster_map[i] + 1; |
| } |
| |
| if (bundle->num_clusters > bundle->num_dist) |
| return AVERROR_INVALIDDATA; |
| |
| return 0; |
| } |
| |
| static int gen_alias_map(JXLEntropyDecoder *dec, JXLSymbolDistribution *dist, int log_alphabet_size) |
| { |
| uint32_t bucket_size, table_size; |
| uint8_t overfull[256], underfull[256]; |
| int overfull_pos = 0, underfull_pos = 0; |
| dist->log_bucket_size = 12 - log_alphabet_size; |
| bucket_size = 1 << dist->log_bucket_size; |
| table_size = 1 << log_alphabet_size; |
| |
| if (dist->uniq_pos >= 0) { |
| for (int i = 0; i < table_size; i++) { |
| dist->symbols[i] = dist->uniq_pos; |
| dist->offsets[i] = bucket_size * i; |
| dist->cutoffs[i] = 0; |
| } |
| return 0; |
| } |
| |
| for (int i = 0; i < dist->alphabet_size; i++) { |
| dist->cutoffs[i] = dist->freq[i]; |
| dist->symbols[i] = i; |
| if (dist->cutoffs[i] > bucket_size) |
| overfull[overfull_pos++] = i; |
| else if (dist->cutoffs[i] < bucket_size) |
| underfull[underfull_pos++] = i; |
| } |
| |
| for (int i = dist->alphabet_size; i < table_size; i++) { |
| dist->cutoffs[i] = 0; |
| underfull[underfull_pos++] = i; |
| } |
| |
| while (overfull_pos) { |
| int o, u, by; |
| /* this should be impossible */ |
| if (!underfull_pos) |
| return AVERROR_INVALIDDATA; |
| u = underfull[--underfull_pos]; |
| o = overfull[--overfull_pos]; |
| by = bucket_size - dist->cutoffs[u]; |
| dist->cutoffs[o] -= by; |
| dist->symbols[u] = o; |
| dist->offsets[u] = dist->cutoffs[o]; |
| if (dist->cutoffs[o] < bucket_size) |
| underfull[underfull_pos++] = o; |
| else if (dist->cutoffs[o] > bucket_size) |
| overfull[overfull_pos++] = o; |
| } |
| |
| for (int i = 0; i < table_size; i++) { |
| if (dist->cutoffs[i] == bucket_size) { |
| dist->symbols[i] = i; |
| dist->offsets[i] = 0; |
| dist->cutoffs[i] = 0; |
| } else { |
| dist->offsets[i] -= dist->cutoffs[i]; |
| } |
| } |
| |
| return 0; |
| } |
| |
| static int read_simple_vlc_prefix(GetBitContext *gb, JXLEntropyDecoder *dec, JXLSymbolDistribution *dist) |
| { |
| int nsym, tree_select, bits; |
| |
| int8_t lens[4]; |
| int16_t symbols[4]; |
| |
| nsym = 1 + get_bits(gb, 2); |
| for (int i = 0; i < nsym; i++) |
| symbols[i] = get_bitsz(gb, dist->log_alphabet_size); |
| if (nsym == 4) |
| tree_select = get_bits1(gb); |
| switch (nsym) { |
| case 1: |
| dist->vlc.bits = 0; |
| dist->default_symbol = symbols[0]; |
| return 0; |
| case 2: |
| bits = 1; |
| lens[0] = 1, lens[1] = 1, lens[2] = 0, lens[3] = 0; |
| if (symbols[1] < symbols[0]) |
| FFSWAP(int16_t, symbols[0], symbols[1]); |
| break; |
| case 3: |
| bits = 2; |
| lens[0] = 1, lens[1] = 2, lens[2] = 2, lens[3] = 0; |
| if (symbols[2] < symbols[1]) |
| FFSWAP(int16_t, symbols[1], symbols[2]); |
| break; |
| case 4: |
| if (tree_select) { |
| bits = 3; |
| lens[0] = 1, lens[1] = 2, lens[2] = 3, lens[3] = 3; |
| if (symbols[3] < symbols[2]) |
| FFSWAP(int16_t, symbols[2], symbols[3]); |
| } else { |
| bits = 2; |
| lens[0] = 2, lens[1] = 2, lens[2] = 2, lens[3] = 2; |
| while (1) { |
| if (symbols[1] < symbols[0]) |
| FFSWAP(int16_t, symbols[0], symbols[1]); |
| if (symbols[3] < symbols[2]) |
| FFSWAP(int16_t, symbols[2], symbols[3]); |
| if (symbols[1] <= symbols[2]) |
| break; |
| FFSWAP(int16_t, symbols[1], symbols[2]); |
| } |
| } |
| break; |
| default: |
| // Challenge Complete! How did we get here? |
| return AVERROR_BUG; |
| } |
| |
| return ff_vlc_init_from_lengths(&dist->vlc, bits, nsym, lens, 1, symbols, |
| 2, 2, 0, VLC_INIT_LE, dec->logctx); |
| } |
| |
| static int read_vlc_prefix(GetBitContext *gb, JXLEntropyDecoder *dec, JXLSymbolDistribution *dist) |
| { |
| int8_t level1_lens[18] = { 0 }; |
| int8_t level1_lens_s[18] = { 0 }; |
| int16_t level1_syms[18] = { 0 }; |
| uint32_t level1_codecounts[19] = { 0 }; |
| uint8_t *buf = NULL; |
| int8_t *level2_lens, *level2_lens_s; |
| int16_t *level2_syms; |
| uint32_t *level2_codecounts; |
| |
| int repeat_count_prev = 0, repeat_count_zero = 0, prev = 8; |
| int total_code = 0, len, hskip, num_codes = 0, ret; |
| |
| VLC level1_vlc = { 0 }; |
| |
| if (dist->alphabet_size == 1) { |
| dist->vlc.bits = 0; |
| dist->default_symbol = 0; |
| return 0; |
| } |
| |
| hskip = get_bits(gb, 2); |
| if (hskip == 1) |
| return read_simple_vlc_prefix(gb, dec, dist); |
| |
| level1_codecounts[0] = hskip; |
| for (int i = hskip; i < 18; i++) { |
| len = level1_lens[prefix_codelen_map[i]] = get_vlc2(gb, level0_table, 4, 1); |
| if (len < 0) { |
| ret = AVERROR_INVALIDDATA; |
| goto end; |
| } |
| level1_codecounts[len]++; |
| if (len) { |
| total_code += (32 >> len); |
| num_codes++; |
| } |
| if (total_code >= 32) { |
| level1_codecounts[0] += 18 - i - 1; |
| break; |
| } |
| } |
| |
| if (total_code != 32 && num_codes >= 2 || num_codes < 1) { |
| ret = AVERROR_INVALIDDATA; |
| goto end; |
| } |
| |
| for (int i = 1; i < 19; i++) |
| level1_codecounts[i] += level1_codecounts[i - 1]; |
| |
| for (int i = 17; i >= 0; i--) { |
| int idx = --level1_codecounts[level1_lens[i]]; |
| level1_lens_s[idx] = level1_lens[i]; |
| level1_syms[idx] = i; |
| } |
| |
| ret = ff_vlc_init_from_lengths(&level1_vlc, 5, 18, level1_lens_s, 1, level1_syms, 2, 2, |
| 0, VLC_INIT_LE, dec->logctx); |
| if (ret < 0) |
| goto end; |
| |
| buf = av_mallocz(MAX_PREFIX_ALPHABET_SIZE * (2 * sizeof(int8_t) + sizeof(int16_t) + sizeof(uint32_t)) |
| + sizeof(uint32_t)); |
| if (!buf) { |
| ret = AVERROR(ENOMEM); |
| goto end; |
| } |
| |
| level2_lens = (int8_t *)buf; |
| level2_lens_s = (int8_t *)(buf + MAX_PREFIX_ALPHABET_SIZE * sizeof(int8_t)); |
| level2_syms = (int16_t *)(buf + MAX_PREFIX_ALPHABET_SIZE * (2 * sizeof(int8_t))); |
| level2_codecounts = (uint32_t *)(buf + MAX_PREFIX_ALPHABET_SIZE * (2 * sizeof(int8_t) + sizeof(int16_t))); |
| |
| total_code = 0; |
| for (int i = 0; i < dist->alphabet_size; i++) { |
| len = get_vlc2(gb, level1_vlc.table, 5, 1); |
| if (len < 0) { |
| ret = AVERROR_INVALIDDATA; |
| goto end; |
| } |
| if (get_bits_left(gb) < 0) { |
| ret = AVERROR_BUFFER_TOO_SMALL; |
| goto end; |
| } |
| if (len == 16) { |
| int extra = 3 + get_bits(gb, 2); |
| if (repeat_count_prev) |
| extra += 4 * (repeat_count_prev - 2) - repeat_count_prev; |
| extra = FFMIN(extra, dist->alphabet_size - i); |
| for (int j = 0; j < extra; j++) |
| level2_lens[i + j] = prev; |
| total_code += (32768 >> prev) * extra; |
| i += extra - 1; |
| repeat_count_prev += extra; |
| repeat_count_zero = 0; |
| level2_codecounts[prev] += extra; |
| } else if (len == 17) { |
| int extra = 3 + get_bits(gb, 3); |
| if (repeat_count_zero > 0) |
| extra += 8 * (repeat_count_zero - 2) - repeat_count_zero; |
| extra = FFMIN(extra, dist->alphabet_size - i); |
| i += extra - 1; |
| repeat_count_prev = 0; |
| repeat_count_zero += extra; |
| level2_codecounts[0] += extra; |
| } else { |
| level2_lens[i] = len; |
| repeat_count_prev = repeat_count_zero = 0; |
| if (len) { |
| total_code += (32768 >> len); |
| prev = len; |
| } |
| level2_codecounts[len]++; |
| } |
| if (total_code >= 32768) { |
| level2_codecounts[0] += dist->alphabet_size - i - 1; |
| break; |
| } |
| } |
| |
| if (total_code != 32768 && level2_codecounts[0] < dist->alphabet_size - 1) { |
| ret = AVERROR_INVALIDDATA; |
| goto end; |
| } |
| |
| for (int i = 1; i < dist->alphabet_size + 1; i++) |
| level2_codecounts[i] += level2_codecounts[i - 1]; |
| |
| for (int i = dist->alphabet_size - 1; i >= 0; i--) { |
| int idx = --level2_codecounts[level2_lens[i]]; |
| level2_lens_s[idx] = level2_lens[i]; |
| level2_syms[idx] = i; |
| } |
| |
| ret = ff_vlc_init_from_lengths(&dist->vlc, 15, dist->alphabet_size, level2_lens_s, |
| 1, level2_syms, 2, 2, 0, VLC_INIT_LE, dec->logctx); |
| |
| end: |
| av_freep(&buf); |
| ff_vlc_free(&level1_vlc); |
| |
| return ret; |
| } |
| |
| static int read_distribution_bundle(GetBitContext *gb, JXLEntropyDecoder *dec, |
| JXLDistributionBundle *bundle, int num_dist, int disallow_lz77) |
| { |
| int ret; |
| |
| if (num_dist <= 0) |
| return AVERROR(EINVAL); |
| |
| bundle->num_dist = num_dist; |
| bundle->lz77_enabled = get_bits1(gb); |
| if (bundle->lz77_enabled) { |
| if (disallow_lz77) |
| return AVERROR_INVALIDDATA; |
| bundle->lz77_min_symbol = jxl_u32(gb, 224, 512, 4096, 8, 0, 0, 0, 15); |
| bundle->lz77_min_length = jxl_u32(gb, 3, 4, 5, 9, 0, 0, 2, 8); |
| bundle->num_dist++; |
| ret = read_hybrid_uint_conf(gb, &bundle->lz_len_conf, 8); |
| if (ret < 0) |
| return ret; |
| } |
| |
| if (bundle->lz77_enabled && !dec->window) { |
| dec->window = av_malloc_array(1 << 20, sizeof(uint32_t)); |
| if (!dec->window) |
| return AVERROR(ENOMEM); |
| } |
| |
| ret = read_dist_clustering(gb, dec, bundle); |
| if (ret < 0) |
| return ret; |
| if (get_bits_left(gb) < 0) |
| return AVERROR_BUFFER_TOO_SMALL; |
| |
| bundle->dists = av_calloc(bundle->num_clusters, sizeof(JXLSymbolDistribution)); |
| if (!bundle->dists) |
| return AVERROR(ENOMEM); |
| |
| bundle->use_prefix_code = get_bits1(gb); |
| bundle->log_alphabet_size = bundle->use_prefix_code ? 15 : 5 + get_bits(gb, 2); |
| |
| for (int i = 0; i < bundle->num_clusters; i++) { |
| ret = read_hybrid_uint_conf(gb, &bundle->dists[i].config, bundle->log_alphabet_size); |
| if (ret < 0) |
| return ret; |
| if (get_bits_left(gb) < 0) |
| return AVERROR_BUFFER_TOO_SMALL; |
| } |
| |
| if (bundle->use_prefix_code) { |
| for (int i = 0; i < bundle->num_clusters; i++) { |
| JXLSymbolDistribution *dist = &bundle->dists[i]; |
| if (get_bits1(gb)) { |
| int n = get_bits(gb, 4); |
| dist->alphabet_size = 1 + (1 << n) + get_bitsz(gb, n); |
| if (dist->alphabet_size > MAX_PREFIX_ALPHABET_SIZE) |
| return AVERROR_INVALIDDATA; |
| } else { |
| dist->alphabet_size = 1; |
| } |
| dist->log_alphabet_size = clog1p(dist->alphabet_size - 1); |
| } |
| for (int i = 0; i < bundle->num_clusters; i++) { |
| ret = read_vlc_prefix(gb, dec, &bundle->dists[i]); |
| if (ret < 0) |
| return ret; |
| if (get_bits_left(gb) < 0) |
| return AVERROR_BUFFER_TOO_SMALL; |
| } |
| } else { |
| for (int i = 0; i < bundle->num_clusters; i++) { |
| ret = populate_distribution(gb, &bundle->dists[i], bundle->log_alphabet_size); |
| if (ret < 0) |
| return ret; |
| if (get_bits_left(gb) < 0) |
| return AVERROR_BUFFER_TOO_SMALL; |
| } |
| for (int i = 0; i < bundle->num_clusters; i++) { |
| ret = gen_alias_map(dec, &bundle->dists[i], bundle->log_alphabet_size); |
| if (ret < 0) |
| return ret; |
| } |
| } |
| |
| return 0; |
| } |
| |
| static void entropy_decoder_close(JXLEntropyDecoder *dec) |
| { |
| if (!dec) |
| return; |
| av_freep(&dec->window); |
| dist_bundle_close(&dec->bundle); |
| } |
| |
| static int entropy_decoder_init(void *avctx, GetBitContext *gb, JXLEntropyDecoder *dec, int num_dist) |
| { |
| int ret; |
| |
| memset(dec, 0, sizeof(*dec)); |
| dec->logctx = avctx; |
| dec->state = -1; |
| |
| ret = read_distribution_bundle(gb, dec, &dec->bundle, num_dist, 0); |
| if (ret < 0) { |
| entropy_decoder_close(dec); |
| return ret; |
| } |
| |
| return 0; |
| } |
| |
| static int64_t entropy_decoder_read_symbol(GetBitContext *gb, JXLEntropyDecoder *dec, uint32_t context) |
| { |
| int ret; |
| uint32_t hybrid_uint; |
| |
| ret = decode_hybrid_varlen_uint(gb, dec, &dec->bundle, context, &hybrid_uint); |
| if (ret < 0) |
| return ret; |
| |
| return hybrid_uint; |
| } |
| |
| static inline uint32_t icc_context(uint64_t i, uint32_t b1, uint32_t b2) |
| { |
| uint32_t p1, p2; |
| if (i <= 128) |
| return 0; |
| if (b1 >= 'a' && b1 <= 'z' || b1 >= 'A' && b1 <= 'Z') |
| p1 = 0; |
| else if (b1 >= '0' && b1 <= '9' || b1 == '.' || b1 == ',') |
| p1 = 1; |
| else if (b1 <= 1) |
| p1 = b1 + 2; |
| else if (b1 > 1 && b1 < 16) |
| p1 = 4; |
| else if (b1 > 240 && b1 < 255) |
| p1 = 5; |
| else if (b1 == 255) |
| p1 = 6; |
| else |
| p1 = 7; |
| |
| if (b2 >= 'a' && b2 <= 'z' || b2 >= 'A' && b2 <= 'Z') |
| p2 = 0; |
| else if (b2 >= '0' && b2 <= '9' || b2 == '.' || b2 == ',') |
| p2 = 1; |
| else if (b2 < 16) |
| p2 = 2; |
| else if (b2 > 240) |
| p2 = 3; |
| else |
| p2 = 4; |
| |
| return 1 + p1 + p2 * 8; |
| } |
| |
| static inline uint32_t toc_context(uint32_t x) |
| { |
| return FFMIN(7, clog1p(x)); |
| } |
| |
| static void populate_fields(AVCodecParserContext *s, AVCodecContext *avctx, const FFJXLMetadata *meta) |
| { |
| s->width = meta->width; |
| s->height = meta->height; |
| |
| switch (meta->csp) { |
| case JPEGXL_CS_RGB: |
| case JPEGXL_CS_XYB: |
| avctx->colorspace = AVCOL_SPC_RGB; |
| break; |
| default: |
| avctx->colorspace = AVCOL_SPC_UNSPECIFIED; |
| } |
| |
| if (meta->wp == JPEGXL_WP_D65) { |
| switch (meta->primaries) { |
| case JPEGXL_PR_SRGB: |
| avctx->color_primaries = AVCOL_PRI_BT709; |
| break; |
| case JPEGXL_PR_P3: |
| avctx->color_primaries = AVCOL_PRI_SMPTE432; |
| break; |
| case JPEGXL_PR_2100: |
| avctx->color_primaries = AVCOL_PRI_BT2020; |
| break; |
| default: |
| avctx->color_primaries = AVCOL_PRI_UNSPECIFIED; |
| } |
| } else if (meta->wp == JPEGXL_WP_DCI && meta->primaries == JPEGXL_PR_P3) { |
| avctx->color_primaries = AVCOL_PRI_SMPTE431; |
| } else { |
| avctx->color_primaries = AVCOL_PRI_UNSPECIFIED; |
| } |
| |
| if (meta->trc > JPEGXL_TR_GAMMA) { |
| FFJXLTransferCharacteristic trc = meta->trc - JPEGXL_TR_GAMMA; |
| switch (trc) { |
| case JPEGXL_TR_BT709: |
| avctx->color_trc = AVCOL_TRC_BT709; |
| break; |
| case JPEGXL_TR_LINEAR: |
| avctx->color_trc = AVCOL_TRC_LINEAR; |
| break; |
| case JPEGXL_TR_SRGB: |
| avctx->color_trc = AVCOL_TRC_IEC61966_2_1; |
| break; |
| case JPEGXL_TR_PQ: |
| avctx->color_trc = AVCOL_TRC_SMPTEST2084; |
| break; |
| case JPEGXL_TR_DCI: |
| avctx->color_trc = AVCOL_TRC_SMPTE428; |
| break; |
| case JPEGXL_TR_HLG: |
| avctx->color_trc = AVCOL_TRC_ARIB_STD_B67; |
| break; |
| default: |
| avctx->color_trc = AVCOL_TRC_UNSPECIFIED; |
| } |
| } else if (meta->trc > 0) { |
| if (meta->trc > 45355 && meta->trc < 45555) |
| avctx->color_trc = AVCOL_TRC_GAMMA22; |
| else if (meta->trc > 35614 && meta->trc < 35814) |
| avctx->color_trc = AVCOL_TRC_GAMMA28; |
| else |
| avctx->color_trc = AVCOL_TRC_UNSPECIFIED; |
| } else { |
| avctx->color_trc = AVCOL_TRC_UNSPECIFIED; |
| } |
| |
| if (meta->csp == JPEGXL_CS_GRAY) { |
| if (meta->bit_depth <= 8) |
| s->format = meta->have_alpha ? AV_PIX_FMT_YA8 : AV_PIX_FMT_GRAY8; |
| else if (meta->bit_depth <= 16) |
| s->format = meta->have_alpha ? AV_PIX_FMT_YA16 : AV_PIX_FMT_GRAY16; |
| else |
| s->format = meta->have_alpha ? AV_PIX_FMT_NONE : AV_PIX_FMT_GRAYF32; |
| } else { |
| if (meta->bit_depth <= 8) |
| s->format = meta->have_alpha ? AV_PIX_FMT_RGBA : AV_PIX_FMT_RGB24; |
| else if (meta->bit_depth <= 16) |
| s->format = meta->have_alpha ? AV_PIX_FMT_RGBA64 : AV_PIX_FMT_RGB48; |
| else |
| s->format = meta->have_alpha ? AV_PIX_FMT_RGBAF32 : AV_PIX_FMT_RGBF32; |
| } |
| } |
| |
| static int skip_icc_profile(void *avctx, JXLParseContext *ctx, GetBitContext *gb) |
| { |
| int64_t ret; |
| uint32_t last = 0, last2 = 0; |
| JXLEntropyDecoder dec = { 0 }; |
| uint64_t enc_size = jxl_u64(gb); |
| uint64_t output_size = 0; |
| int out_size_shift = 0; |
| |
| if (!enc_size || enc_size > (1 << 22)) |
| return AVERROR_INVALIDDATA; |
| |
| ret = entropy_decoder_init(avctx, gb, &dec, 41); |
| if (ret < 0) |
| goto end; |
| |
| if (get_bits_left(gb) < 0) { |
| ret = AVERROR_BUFFER_TOO_SMALL; |
| goto end; |
| } |
| |
| for (uint64_t read = 0; read < enc_size; read++) { |
| ret = entropy_decoder_read_symbol(gb, &dec, icc_context(read, last, last2)); |
| if (ret < 0) |
| goto end; |
| if (ret > 255) { |
| ret = AVERROR_INVALIDDATA; |
| goto end; |
| } |
| if (get_bits_left(gb) < 0) { |
| ret = AVERROR_BUFFER_TOO_SMALL; |
| goto end; |
| } |
| last2 = last; |
| last = ret; |
| if (out_size_shift < 63) { |
| output_size += (ret & UINT64_C(0x7F)) << out_size_shift; |
| if (!(ret & 0x80)) { |
| out_size_shift = 63; |
| } else { |
| out_size_shift += 7; |
| if (out_size_shift > 56) { |
| ret = AVERROR_INVALIDDATA; |
| goto end; |
| } |
| } |
| } else if (output_size < 132) { |
| ret = AVERROR_INVALIDDATA; |
| goto end; |
| } |
| } |
| |
| ret = 0; |
| |
| end: |
| entropy_decoder_close(&dec); |
| |
| return ret; |
| } |
| |
| static int skip_extensions(GetBitContext *gb) |
| { |
| uint64_t extensions = jxl_u64(gb), extensions_len = 0; |
| |
| if (get_bits_left(gb) < 0) |
| return AVERROR_BUFFER_TOO_SMALL; |
| |
| if (!extensions) |
| return 0; |
| |
| for (int i = 0; i < 64; i++) { |
| if (extensions & (UINT64_C(1) << i)) |
| extensions_len += jxl_u64(gb); |
| if (get_bits_left(gb) < 0) |
| return AVERROR_BUFFER_TOO_SMALL; |
| } |
| |
| if (extensions_len > INT_MAX || get_bits_left(gb) < extensions_len) |
| return AVERROR_BUFFER_TOO_SMALL; |
| |
| skip_bits_long(gb, extensions_len); |
| |
| return 0; |
| } |
| |
| static int parse_frame_header(void *avctx, JXLParseContext *ctx, GetBitContext *gb) |
| { |
| int all_default, do_yCbCr = 0, num_passes = 1, ret; |
| int group_size_shift = 1, lf_level = 0, save_as_ref = 0; |
| int have_crop = 0, full_frame = 1, resets_canvas = 1, upsampling = 1; |
| JXLFrame *frame = &ctx->codestream.frame; |
| const FFJXLMetadata *meta = &ctx->codestream.meta; |
| int32_t x0 = 0, y0 = 0; |
| uint32_t duration = 0, width = meta->coded_width, height = meta->coded_height; |
| uint32_t name_len, num_groups, num_lf_groups, group_dim, lf_group_dim, toc_count; |
| uint64_t flags = 0; |
| int start_len = get_bits_count(gb); |
| |
| memset(frame, 0, sizeof(*frame)); |
| frame->is_last = 1; |
| |
| all_default = get_bits1(gb); |
| if (!all_default) { |
| frame->type = get_bits(gb, 2); |
| frame->encoding = get_bits1(gb); |
| flags = jxl_u64(gb); |
| if (!meta->xyb_encoded) |
| do_yCbCr = get_bits1(gb); |
| if (!(flags & JXL_FLAG_USE_LF_FRAME)) { |
| if (do_yCbCr) |
| skip_bits(gb, 6); // jpeg upsampling |
| upsampling = jxl_u32(gb, 1, 2, 4, 8, 0, 0, 0, 0); |
| skip_bits_long(gb, 2 * meta->num_extra_channels); |
| if (get_bits_left(gb) < 0) |
| return AVERROR_BUFFER_TOO_SMALL; |
| } |
| if (frame->encoding == JPEGXL_ENC_MODULAR) |
| group_size_shift = get_bits(gb, 2); |
| else if (meta->xyb_encoded) |
| skip_bits(gb, 6); // xqm and bqm scales |
| if (frame->type != JPEGXL_FRAME_REFERENCE_ONLY) { |
| num_passes = jxl_u32(gb, 1, 2, 3, 4, 0, 0, 0, 3); |
| if (num_passes != 1) { |
| int num_ds = jxl_u32(gb, 0, 1, 2, 3, 0, 0, 0, 1); |
| skip_bits(gb, 2 * (num_passes - 1)); // shift |
| skip_bits(gb, 2 * num_ds); // downsample |
| for (int i = 0; i < num_ds; i++) |
| jxl_u32(gb, 0, 1, 2, 0, 0, 0, 0, 3); |
| } |
| } |
| if (frame->type == JPEGXL_FRAME_LF) |
| lf_level = 1 + get_bits(gb, 2); |
| else |
| have_crop = get_bits1(gb); |
| if (have_crop) { |
| if (frame->type != JPEGXL_FRAME_REFERENCE_ONLY) { |
| uint32_t ux0 = jxl_u32(gb, 0, 256, 2304, 18688, 8, 11, 14, 30); |
| uint32_t uy0 = jxl_u32(gb, 0, 256, 2304, 18688, 8, 11, 14, 30); |
| x0 = unpack_signed(ux0); |
| y0 = unpack_signed(uy0); |
| } |
| width = jxl_u32(gb, 0, 256, 2304, 18688, 8, 11, 14, 30); |
| height = jxl_u32(gb, 0, 256, 2304, 18688, 8, 11, 14, 30); |
| full_frame = x0 <= 0 && y0 <= 0 && width + x0 >= meta->coded_width |
| && height + y0 >= meta->coded_height; |
| } |
| if (get_bits_left(gb) < 0) |
| return AVERROR_BUFFER_TOO_SMALL; |
| if (frame->type == JPEGXL_FRAME_REGULAR || frame->type == JPEGXL_FRAME_SKIP_PROGRESSIVE) { |
| for (int i = 0; i <= meta->num_extra_channels; i++) { |
| int mode = jxl_u32(gb, 0, 1, 2, 3, 0, 0, 0, 2); |
| if (meta->num_extra_channels && (mode == JPEGXL_BM_BLEND || mode == JPEGXL_BM_MULADD)) |
| jxl_u32(gb, 0, 1, 2, 3, 0, 0, 0, 2); |
| if (meta->num_extra_channels && (mode == JPEGXL_BM_BLEND || mode == JPEGXL_BM_MULADD |
| || mode == JPEGXL_BM_MUL)) |
| skip_bits1(gb); |
| if (!i) |
| resets_canvas = mode == JPEGXL_BM_REPLACE && full_frame; |
| if (!resets_canvas) |
| skip_bits(gb, 2); |
| if (get_bits_left(gb) < 0) |
| return AVERROR_BUFFER_TOO_SMALL; |
| } |
| if (meta->animation_offset) |
| duration = jxl_u32(gb, 0, 1, 0, 0, 0, 0, 8, 32); |
| if (meta->have_timecodes) |
| skip_bits_long(gb, 32); |
| frame->is_last = get_bits1(gb); |
| } else { |
| frame->is_last = 0; |
| } |
| if (frame->type != JPEGXL_FRAME_LF && !frame->is_last) |
| save_as_ref = get_bits(gb, 2); |
| if (frame->type == JPEGXL_FRAME_REFERENCE_ONLY || |
| (resets_canvas && !frame->is_last && (!duration || save_as_ref) |
| && frame->type != JPEGXL_FRAME_LF)) |
| skip_bits1(gb); // save before color transform |
| name_len = 8 * jxl_u32(gb, 0, 0, 16, 48, 0, 4, 5, 10); |
| if (get_bits_left(gb) < name_len) |
| return AVERROR_BUFFER_TOO_SMALL; |
| skip_bits_long(gb, name_len); |
| } |
| |
| if (!all_default) { |
| int restd = get_bits1(gb), gab = 1; |
| if (!restd) |
| gab = get_bits1(gb); |
| if (gab && !restd && get_bits1(gb)) |
| // gab custom |
| skip_bits_long(gb, 16 * 6); |
| if (get_bits_left(gb) < 0) |
| return AVERROR_BUFFER_TOO_SMALL; |
| if (!restd) { |
| int epf = get_bits(gb, 2); |
| if (epf) { |
| if (frame->encoding == JPEGXL_ENC_VARDCT && get_bits1(gb)) { |
| skip_bits_long(gb, 16 * 8); // custom epf sharpness |
| if (get_bits_left(gb) < 0) |
| return AVERROR_BUFFER_TOO_SMALL; |
| } |
| if (get_bits1(gb)) { |
| skip_bits_long(gb, 3 * 16 + 32); // custom epf weight |
| if (get_bits_left(gb) < 0) |
| return AVERROR_BUFFER_TOO_SMALL; |
| } |
| if (get_bits1(gb)) { // custom epf sigma |
| if (frame->encoding == JPEGXL_ENC_VARDCT) |
| skip_bits(gb, 16); |
| skip_bits_long(gb, 16 * 3); |
| if (get_bits_left(gb) < 0) |
| return AVERROR_BUFFER_TOO_SMALL; |
| } |
| if (frame->encoding == JPEGXL_ENC_MODULAR) |
| skip_bits(gb, 16); |
| } |
| ret = skip_extensions(gb); |
| if (ret < 0) |
| return ret; |
| } |
| ret = skip_extensions(gb); |
| if (ret < 0) |
| return ret; |
| } |
| |
| width = div_ceil(div_ceil(width, upsampling), 1 << (3 * lf_level)); |
| height = div_ceil(div_ceil(height, upsampling), 1 << (3 * lf_level)); |
| group_dim = 128 << group_size_shift; |
| lf_group_dim = group_dim << 3; |
| num_groups = div_ceil(width, group_dim) * div_ceil(height, group_dim); |
| num_lf_groups = div_ceil(width, lf_group_dim) * div_ceil(height, lf_group_dim); |
| if (num_groups == 1 && num_passes == 1) |
| toc_count = 1; |
| else |
| toc_count = 2 + num_lf_groups + num_groups * num_passes; |
| |
| // permuted toc |
| if (get_bits1(gb)) { |
| JXLEntropyDecoder dec; |
| uint32_t end, lehmer = 0; |
| ret = entropy_decoder_init(avctx, gb, &dec, 8); |
| if (ret < 0) |
| return ret; |
| if (get_bits_left(gb) < 0) { |
| entropy_decoder_close(&dec); |
| return AVERROR_BUFFER_TOO_SMALL; |
| } |
| end = entropy_decoder_read_symbol(gb, &dec, toc_context(toc_count)); |
| if (end > toc_count) { |
| entropy_decoder_close(&dec); |
| return AVERROR_INVALIDDATA; |
| } |
| for (uint32_t i = 0; i < end; i++) { |
| lehmer = entropy_decoder_read_symbol(gb, &dec, toc_context(lehmer)); |
| if (get_bits_left(gb) < 0) { |
| entropy_decoder_close(&dec); |
| return AVERROR_BUFFER_TOO_SMALL; |
| } |
| } |
| entropy_decoder_close(&dec); |
| } |
| align_get_bits(gb); |
| |
| for (uint32_t i = 0; i < toc_count; i++) { |
| frame->body_length += 8 * jxl_u32(gb, 0, 1024, 17408, 4211712, 10, 14, 22, 30); |
| if (get_bits_left(gb) < 0) |
| return AVERROR_BUFFER_TOO_SMALL; |
| } |
| align_get_bits(gb); |
| |
| frame->total_length = frame->body_length + get_bits_count(gb) - start_len; |
| |
| return 0; |
| } |
| |
| static int skip_boxes(JXLParseContext *ctx, const uint8_t *buf, int buf_size) |
| { |
| GetByteContext gb; |
| |
| if (ctx->skip > buf_size) |
| return AVERROR_BUFFER_TOO_SMALL; |
| |
| buf += ctx->skip; |
| buf_size -= ctx->skip; |
| bytestream2_init(&gb, buf, buf_size); |
| |
| while (1) { |
| uint64_t size; |
| int head_size = 8; |
| |
| if (bytestream2_peek_le16(&gb) == FF_JPEGXL_CODESTREAM_SIGNATURE_LE) |
| break; |
| if (bytestream2_peek_le64(&gb) == FF_JPEGXL_CONTAINER_SIGNATURE_LE) |
| break; |
| |
| if (bytestream2_get_bytes_left(&gb) < 8) |
| return AVERROR_BUFFER_TOO_SMALL; |
| |
| size = bytestream2_get_be32(&gb); |
| bytestream2_skip(&gb, 4); // tag |
| if (size == 1) { |
| if (bytestream2_get_bytes_left(&gb) < 8) |
| return AVERROR_BUFFER_TOO_SMALL; |
| size = bytestream2_get_be64(&gb); |
| head_size = 16; |
| } |
| if (!size) |
| return AVERROR_INVALIDDATA; |
| /* invalid ISOBMFF size */ |
| if (size <= head_size || size > INT_MAX - ctx->skip) |
| return AVERROR_INVALIDDATA; |
| |
| ctx->skip += size; |
| bytestream2_skip(&gb, size - head_size); |
| if (bytestream2_get_bytes_left(&gb) <= 0) |
| return AVERROR_BUFFER_TOO_SMALL; |
| } |
| |
| return 0; |
| } |
| |
| static int try_parse(AVCodecParserContext *s, AVCodecContext *avctx, JXLParseContext *ctx, |
| const uint8_t *buf, int buf_size) |
| { |
| int ret, cs_buflen, header_skip; |
| const uint8_t *cs_buffer; |
| GetBitContext gb; |
| |
| if (ctx->skip > buf_size) |
| return AVERROR_BUFFER_TOO_SMALL; |
| |
| buf += ctx->skip; |
| buf_size -= ctx->skip; |
| |
| if (ctx->container || AV_RL64(buf) == FF_JPEGXL_CONTAINER_SIGNATURE_LE) { |
| ctx->container = 1; |
| ret = ff_jpegxl_collect_codestream_header(buf, buf_size, ctx->cs_buffer, |
| sizeof(ctx->cs_buffer) - AV_INPUT_BUFFER_PADDING_SIZE, &ctx->copied); |
| if (ret < 0) |
| return ret; |
| ctx->collected_size = ret; |
| if (!ctx->copied) { |
| ctx->skip += ret; |
| return AVERROR_BUFFER_TOO_SMALL; |
| } |
| cs_buffer = ctx->cs_buffer; |
| cs_buflen = FFMIN(sizeof(ctx->cs_buffer) - AV_INPUT_BUFFER_PADDING_SIZE, ctx->copied); |
| } else { |
| cs_buffer = buf; |
| cs_buflen = buf_size; |
| } |
| |
| if (!ctx->codestream_length) { |
| header_skip = ff_jpegxl_parse_codestream_header(cs_buffer, cs_buflen, &ctx->codestream.meta, 0); |
| if (header_skip < 0) |
| return header_skip; |
| ctx->codestream_length = header_skip; |
| populate_fields(s, avctx, &ctx->codestream.meta); |
| } |
| |
| if (ctx->container) |
| return ctx->collected_size; |
| |
| ret = init_get_bits8(&gb, cs_buffer, cs_buflen); |
| if (ret < 0) |
| return ret; |
| |
| skip_bits_long(&gb, ctx->codestream_length); |
| |
| if (!ctx->skipped_icc && ctx->codestream.meta.have_icc_profile) { |
| ret = skip_icc_profile(avctx, ctx, &gb); |
| if (ret < 0) |
| return ret; |
| ctx->skipped_icc = 1; |
| align_get_bits(&gb); |
| ctx->codestream_length = get_bits_count(&gb); |
| } |
| |
| if (get_bits_left(&gb) <= 0) |
| return AVERROR_BUFFER_TOO_SMALL; |
| |
| while (1) { |
| ret = parse_frame_header(avctx, ctx, &gb); |
| if (ret < 0) |
| return ret; |
| ctx->codestream_length += ctx->codestream.frame.total_length; |
| if (ctx->codestream.frame.is_last) |
| return ctx->codestream_length / 8; |
| if (get_bits_left(&gb) <= ctx->codestream.frame.body_length) |
| return AVERROR_BUFFER_TOO_SMALL; |
| skip_bits_long(&gb, ctx->codestream.frame.body_length); |
| } |
| } |
| |
| static int jpegxl_parse(AVCodecParserContext *s, AVCodecContext *avctx, |
| const uint8_t **poutbuf, int *poutbuf_size, |
| const uint8_t *buf, int buf_size) |
| { |
| JXLParseContext *ctx = s->priv_data; |
| int next = END_NOT_FOUND, ret; |
| const uint8_t *pbuf = ctx->pc.buffer; |
| int pindex = ctx->pc.index; |
| |
| *poutbuf_size = 0; |
| *poutbuf = NULL; |
| |
| if (!ctx->pc.index) { |
| if (ctx->pc.overread) |
| goto flush; |
| pbuf = buf; |
| pindex = buf_size; |
| } |
| |
| if ((!ctx->container || !ctx->codestream_length) && !ctx->next) { |
| ret = try_parse(s, avctx, ctx, pbuf, pindex); |
| if (ret < 0) |
| goto flush; |
| ctx->next = ret; |
| if (ctx->container) |
| ctx->skip += ctx->next; |
| } |
| |
| if (ctx->container && ctx->next >= 0) { |
| ret = skip_boxes(ctx, pbuf, pindex); |
| if (ret < 0) { |
| if (ret == AVERROR_INVALIDDATA) |
| ctx->next = -1; |
| goto flush; |
| } |
| ctx->next = ret + ctx->skip; |
| } |
| |
| if (ctx->next >= 0) |
| next = ctx->next - ctx->pc.index; |
| |
| flush: |
| if (next > buf_size) |
| next = END_NOT_FOUND; |
| |
| ret = ff_combine_frame(&ctx->pc, next, &buf, &buf_size); |
| if (ret < 0) |
| return buf_size; |
| |
| *poutbuf = buf; |
| *poutbuf_size = buf_size; |
| |
| ctx->codestream_length = 0; |
| ctx->collected_size = 0; |
| ctx->container = 0; |
| ctx->copied = 0; |
| ctx->skip = 0; |
| ctx->skipped_icc = 0; |
| ctx->next = 0; |
| memset(&ctx->codestream, 0, sizeof(ctx->codestream)); |
| |
| return next; |
| } |
| |
| const AVCodecParser ff_jpegxl_parser = { |
| .codec_ids = { AV_CODEC_ID_JPEGXL }, |
| .priv_data_size = sizeof(JXLParseContext), |
| .parser_parse = jpegxl_parse, |
| .parser_close = ff_parse_close, |
| }; |