FFmpeg  4.3.8
av1_parser.c
Go to the documentation of this file.
1 /*
2  * AV1 parser
3  *
4  * Copyright (C) 2018 James Almer <jamrial@gmail.com>
5  *
6  * This file is part of FFmpeg.
7  *
8  * FFmpeg is free software; you can redistribute it and/or
9  * modify it under the terms of the GNU Lesser General Public
10  * License as published by the Free Software Foundation; either
11  * version 2.1 of the License, or (at your option) any later version.
12  *
13  * FFmpeg is distributed in the hope that it will be useful,
14  * but WITHOUT ANY WARRANTY; without even the implied warranty of
15  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16  * Lesser General Public License for more details.
17  *
18  * You should have received a copy of the GNU Lesser General Public
19  * License along with FFmpeg; if not, write to the Free Software
20  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21  */
22 
23 #include "av1_parse.h"
24 #include "cbs.h"
25 #include "cbs_av1.h"
26 #include "internal.h"
27 #include "parser.h"
28 
/*
 * Private state of the AV1 parser; reached through ctx->priv_data in the
 * parser callbacks below.
 *
 * NOTE(review): the member lines and the closing line of this typedef are
 * missing from this listing. According to the cross-reference index at the
 * end of the page the members are:
 *   CodedBitstreamContext *cbc            (listing line 30)
 *   CodedBitstreamFragment temporal_unit  (listing line 31)
 *   int parsed_extradata                  (listing line 32)
 * Confirm against the real source file before relying on this.
 */
29 typedef struct AV1ParseContext {
34 
/*
 * Pixel-format lookup tables for 8-, 10- and 12-bit content.
 * av1_parser_parse() indexes each of them as
 * [color->subsampling_x][color->subsampling_y] when the stream is not
 * monochrome.
 *
 * NOTE(review): the initializer rows of all three tables are missing from
 * this listing, so the actual entries cannot be read off here.
 */
35 static const enum AVPixelFormat pix_fmts_8bit[2][2] = {
38 };
39 static const enum AVPixelFormat pix_fmts_10bit[2][2] = {
42 };
43 static const enum AVPixelFormat pix_fmts_12bit[2][2] = {
46 };
47 
/*
 * Pixel-format lookup table that av1_parser_parse() indexes with
 * color->high_bitdepth + color->twelve_bit (hence three entries).
 *
 * NOTE(review): the initializer row is missing from this listing; the
 * cross-reference index mentions planar GBR formats (8-bit, GBRP10,
 * GBRP12), which are presumably the entries -- confirm.
 */
48 static const enum AVPixelFormat pix_fmts_rgb[3] = {
50 };
51 
/*
 * av1_parser_parse(): the parser's .parser_parse callback.
 *
 * NOTE(review): the first line of the signature (listing line 52) is missing
 * from this listing; the cross-reference index gives the full prototype as
 *   static int av1_parser_parse(AVCodecParserContext *ctx,
 *                               AVCodecContext *avctx,
 *                               const uint8_t **out_data, int *out_size,
 *                               const uint8_t *data, int size)
 * Several local declarations (td, av1, seq, color, frame, ref) and a few
 * statements are likewise absent from the listing; they are flagged below.
 *
 * What the visible code does:
 *  - passes the input buffer through unchanged (*out_data/*out_size);
 *  - reads the buffer with ff_cbs_read() and walks its units;
 *  - fills ctx->width/height/key_frame/format from the frame headers;
 *  - copies pixel format, profile, level, colour properties, dimensions and
 *    time base into avctx.
 *
 * Returns: always `size`. Error paths jump to `end` and still return `size`;
 * `ret` is never propagated to the caller.
 */
53  AVCodecContext *avctx,
54  const uint8_t **out_data, int *out_size,
55  const uint8_t *data, int size)
56 {
57  AV1ParseContext *s = ctx->priv_data;
 /* NOTE(review): listing lines 58-61 (declarations of td, av1, seq, color,
  * presumably) are missing here. */
62  int ret;
63 
 /* The packet is handed back as-is; this parser does not split or merge. */
64  *out_data = data;
65  *out_size = size;
66 
 /* Start from -1; overwritten with 0 or 1 below once a shown frame is
  * found. NOTE(review): listing lines 68-69 are missing here. */
67  ctx->key_frame = -1;
70 
 /* Route log output of the bitstream reader to avctx for the duration of
  * this call; cleared again at `end`. */
71  s->cbc->log_ctx = avctx;
72 
 /* Extradata is read at most once: the flag is set before the attempt, so
  * a failure is only warned about and never retried. */
73  if (avctx->extradata_size && !s->parsed_extradata) {
74  s->parsed_extradata = 1;
75 
76  ret = ff_cbs_read(s->cbc, td, avctx->extradata, avctx->extradata_size);
77  if (ret < 0) {
78  av_log(avctx, AV_LOG_WARNING, "Failed to parse extradata.\n");
79  }
80 
81  ff_cbs_fragment_reset(s->cbc, td);
82  }
83 
84  ret = ff_cbs_read(s->cbc, td, data, size);
85  if (ret < 0) {
86  av_log(avctx, AV_LOG_ERROR, "Failed to parse temporal unit.\n");
87  goto end;
88  }
89 
 /* Everything below dereferences the sequence header, so bail out if none
  * is available. */
90  if (!av1->sequence_header) {
91  av_log(avctx, AV_LOG_ERROR, "No sequence header available\n");
92  goto end;
93  }
94 
95  seq = av1->sequence_header;
96  color = &seq->color_config;
97 
 /* Walk every unit; only frame and frame-header OBUs are inspected. Later
  * matching units overwrite the values set by earlier ones. */
98  for (int i = 0; i < td->nb_units; i++) {
99  CodedBitstreamUnit *unit = &td->units[i];
100  AV1RawOBU *obu = unit->content;
 /* NOTE(review): listing line 101 (declaration of `frame`) is missing. */
102  int frame_type;
103 
104  if (unit->type == AV1_OBU_FRAME)
105  frame = &obu->obu.frame.header;
106  else if (unit->type == AV1_OBU_FRAME_HEADER)
107  frame = &obu->obu.frame_header;
108  else
109  continue;
110 
 /* Units with a non-zero spatial_id are ignored. */
111  if (obu->header.spatial_id > 0)
112  continue;
113 
114  if (frame->show_existing_frame) {
 /* NOTE(review): listing line 115 (definition of `ref`) is missing; the
  * index lists frame_to_show_map_idx and an av1 `ref` array, so it is
  * presumably &av1->ref[frame->frame_to_show_map_idx] -- confirm. */
116 
117  if (!ref->valid) {
118  av_log(avctx, AV_LOG_ERROR, "Invalid reference frame\n");
119  goto end;
120  }
121 
 /* Dimensions and frame type come from the stored reference state. */
122  ctx->width = ref->frame_width;
123  ctx->height = ref->frame_height;
124  frame_type = ref->frame_type;
125 
 /* A re-shown frame is never flagged as a key frame here, whatever the
  * reference's frame type is. */
126  ctx->key_frame = 0;
127  } else if (!frame->show_frame) {
 /* Frames that are not shown contribute nothing. */
128  continue;
129  } else {
130  ctx->width = av1->frame_width;
131  ctx->height = av1->frame_height;
132  frame_type = frame->frame_type;
133 
134  ctx->key_frame = frame_type == AV1_FRAME_KEY;
135  }
136 
 /* NOTE(review): the case bodies (listing lines 139-140, 143, 146) and
  * line 149 are missing from this listing; only the labels and breaks
  * survive. */
137  switch (frame_type) {
138  case AV1_FRAME_KEY:
141  break;
142  case AV1_FRAME_INTER:
144  break;
145  case AV1_FRAME_SWITCH:
147  break;
148  }
150  }
151 
 /* Choose the pixel format from the bit depth: gray for monochrome
  * streams, otherwise a table lookup keyed by chroma subsampling. Bit
  * depths other than 8/10/12 leave ctx->format untouched by this switch. */
152  switch (av1->bit_depth) {
153  case 8:
154  ctx->format = color->mono_chrome ? AV_PIX_FMT_GRAY8
155  : pix_fmts_8bit [color->subsampling_x][color->subsampling_y];
156  break;
157  case 10:
158  ctx->format = color->mono_chrome ? AV_PIX_FMT_GRAY10
159  : pix_fmts_10bit[color->subsampling_x][color->subsampling_y];
160  break;
161  case 12:
162  ctx->format = color->mono_chrome ? AV_PIX_FMT_GRAY12
163  : pix_fmts_12bit[color->subsampling_x][color->subsampling_y];
164  break;
165  }
 /* NOTE(review): listing line 166 is missing here. */
167 
 /* Override with an RGB format for non-subsampled BT.709-primaries content.
  * NOTE(review): two terms of this condition (listing lines 169 and 171)
  * are missing from the listing, so the full test cannot be read here. */
168  if (!color->subsampling_x && !color->subsampling_y &&
170  color->color_primaries == AVCOL_PRI_BT709 &&
172  ctx->format = pix_fmts_rgb[color->high_bitdepth + color->twelve_bit];
173 
 /* Publish the stream properties on the codec context. */
174  avctx->pix_fmt = ctx->format;
175 
176  avctx->profile = seq->seq_profile;
177  avctx->level = seq->seq_level_idx[0];
178 
179  avctx->colorspace = (enum AVColorSpace) color->matrix_coefficients;
180  avctx->color_primaries = (enum AVColorPrimaries) color->color_primaries;
 /* NOTE(review): listing lines 181-182 are missing here. */
183 
 /* Only touch the codec dimensions when they actually changed. */
184  if (ctx->width != avctx->width || ctx->height != avctx->height) {
185  ret = ff_set_dimensions(avctx, ctx->width, ctx->height);
186  if (ret < 0)
187  goto end;
188  }
189 
 /* time_base = 1 / (framerate * ticks_per_frame), only when a frame rate
  * is set (non-zero numerator). */
190  if (avctx->framerate.num)
191  avctx->time_base = av_inv_q(av_mul_q(avctx->framerate, (AVRational){avctx->ticks_per_frame, 1}));
192 
 /* Common exit: release the units read above and detach the log context. */
193 end:
194  ff_cbs_fragment_reset(s->cbc, td);
195 
196  s->cbc->log_ctx = NULL;
197 
 /* The whole input is always reported as consumed, even after an error. */
198  return size;
199 }
200 
207 };
208 
/*
 * av1_parser_init(): the parser's .parser_init callback. Creates the coded
 * bitstream context used by the parse callback.
 *
 * NOTE(review): the signature line (listing line 209) is missing from this
 * listing; the cross-reference index gives it as
 *   static av_cold int av1_parser_init(AVCodecParserContext *ctx)
 *
 * Returns 0 on success, or the negative value returned by ff_cbs_init().
 */
210 {
211  AV1ParseContext *s = ctx->priv_data;
212  int ret;
213 
 /* No log context is attached here (NULL); the parse callback sets one
  * per call. */
214  ret = ff_cbs_init(&s->cbc, AV_CODEC_ID_AV1, NULL);
215  if (ret < 0)
216  return ret;
217 
 /* NOTE(review): listing lines 218-219 are missing here. The index lists
  * decompose_unit_types / nb_decompose_unit_types / FF_ARRAY_ELEMS, so
  * they presumably restrict which unit types get decomposed -- confirm. */
220 
221  return 0;
222 }
223 
/*
 * av1_parser_close(): the parser's .parser_close callback. Tears down the
 * coded bitstream context created by av1_parser_init().
 *
 * NOTE(review): the signature line (listing line 224) is missing from this
 * listing; the cross-reference index gives it as
 *   static void av1_parser_close(AVCodecParserContext *ctx)
 */
225 {
226  AV1ParseContext *s = ctx->priv_data;
227 
 /* NOTE(review): listing line 228 is missing here; the index references
  * ff_cbs_fragment_free(), so it presumably frees s->temporal_unit
  * before the context is closed -- confirm. */
229  ff_cbs_close(&s->cbc);
230 }
231 
/*
 * av1_parser_split(): scans `buf` OBU by OBU and reports where the first
 * frame or frame-header OBU begins.
 *
 * NOTE(review): the first line of the signature (listing line 232) is
 * missing from this listing; the cross-reference index gives the prototype as
 *   static int av1_parser_split(AVCodecContext *avctx,
 *                               const uint8_t *buf, int buf_size)
 *
 * Returns the byte offset of the first AV1_OBU_FRAME_HEADER / AV1_OBU_FRAME
 * from the start of `buf`, or 0 when none is found or when
 * ff_av1_extract_obu() fails first. A return of 0 therefore also covers the
 * case where such an OBU is the very first one in the buffer.
 */
233  const uint8_t *buf, int buf_size)
234 {
235  AV1OBU obu;
236  const uint8_t *ptr = buf, *end = buf + buf_size;
237 
238  while (ptr < end) {
 /* buf_size is kept in step with ptr below, so it is always the number
  * of bytes remaining from ptr. */
239  int len = ff_av1_extract_obu(&obu, ptr, buf_size, avctx);
240  if (len < 0)
241  break;
242 
243  if (obu.type == AV1_OBU_FRAME_HEADER ||
244  obu.type == AV1_OBU_FRAME) {
245  return ptr - buf;
246  }
 /* Advance past this OBU and shrink the remaining length to match. */
247  ptr += len;
248  buf_size -= len;
249  }
250 
251  return 0;
252 }
253 
/*
 * Parser descriptor for AV1: binds the codec ID, the size of the private
 * context and the init/close/parse callbacks defined in this file.
 *
 * NOTE(review): the declarator line (listing line 254, given by the
 * cross-reference index as `AVCodecParser ff_av1_parser`) and listing line
 * 260 are missing from this listing. The latter presumably wires up
 * av1_parser_split -- confirm against the real source.
 */
255  .codec_ids = { AV_CODEC_ID_AV1 },
256  .priv_data_size = sizeof(AV1ParseContext),
257  .parser_init = av1_parser_init,
258  .parser_close = av1_parser_close,
259  .parser_parse = av1_parser_parse,
261 };
#define NULL
Definition: coverity.c:32
AVRational framerate
Definition: avcodec.h:2069
int nb_units
Number of units in this fragment.
Definition: cbs.h:147
int size
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
Definition: pixfmt.h:71
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:182
int ff_set_dimensions(AVCodecContext *s, int width, int height)
Check that the provided frame dimensions are valid and set them on the codec context.
Definition: utils.c:104
uint8_t mono_chrome
Definition: cbs_av1.h:44
int width
Dimensions of the decoded video intended for presentation.
Definition: avcodec.h:3500
int ff_cbs_init(CodedBitstreamContext **ctx_ptr, enum AVCodecID codec_id, void *log_ctx)
Create and initialise a new context for the given codec.
Definition: cbs.c:74
CodedBitstreamUnitType type
Codec-specific type of this unit.
Definition: cbs.h:68
enum AVColorRange color_range
MPEG vs JPEG YUV range.
Definition: avcodec.h:1161
planar GBR 4:4:4 24bpp
Definition: pixfmt.h:168
int num
Numerator.
Definition: rational.h:59
#define AV_PIX_FMT_GBRP10
Definition: pixfmt.h:413
int codec_ids[5]
Definition: avcodec.h:3521
enum AVPixelFormat pix_fmt
Pixel format, see AV_PIX_FMT_xxx.
Definition: avcodec.h:736
int out_size
Definition: movenc.c:55
static enum AVPixelFormat pix_fmts_10bit[2][2]
Definition: av1_parser.c:39
#define AV_PIX_FMT_YUV420P12
Definition: pixfmt.h:401
int ff_av1_extract_obu(AV1OBU *obu, const uint8_t *buf, int length, void *logctx)
Extract an OBU from a raw bitstream.
Definition: av1_parse.c:29
uint8_t color_range
Definition: cbs_av1.h:51
int profile
profile
Definition: avcodec.h:1859
order of coefficients is actually GBR, also IEC 61966-2-1 (sRGB)
Definition: pixfmt.h:510
uint8_t seq_profile
Definition: cbs_av1.h:74
AVColorTransferCharacteristic
Color Transfer Characteristic.
Definition: pixfmt.h:480
static const CodedBitstreamUnitType decompose_unit_types[]
Definition: av1_parser.c:201
static enum AVPixelFormat pix_fmts_12bit[2][2]
Definition: av1_parser.c:43
frame_type
AVRational time_base
This is the fundamental unit of time (in seconds) in terms of which frame timestamps are represented...
Definition: avcodec.h:649
Undefined.
Definition: avutil.h:273
#define AV_PIX_FMT_GRAY10
Definition: pixfmt.h:378
CodedBitstreamFragment temporal_unit
Definition: av1_parser.c:31
#define AV_PIX_FMT_GRAY12
Definition: pixfmt.h:379
uint8_t matrix_coefficients
Definition: cbs_av1.h:49
enum AVPictureStructure picture_structure
Indicate whether a picture is coded as a frame, top field or bottom field.
Definition: avcodec.h:3487
uint8_t
#define av_cold
Definition: attributes.h:88
#define av_assert2(cond)
assert() equivalent for checks that lie in speed-critical code.
Definition: avassert.h:64
static const uint32_t color[16+AV_CLASS_CATEGORY_NB]
Definition: log.c:92
AVColorSpace
YUV colorspace type.
Definition: pixfmt.h:509
uint32_t CodedBitstreamUnitType
The codec-specific type of a bitstream unit.
Definition: cbs.h:43
static av_cold int end(AVCodecContext *avctx)
Definition: avrndec.c:92
uint8_t * extradata
some codecs need / can use extradata like Huffman tables.
Definition: avcodec.h:627
static AVFrame * frame
const char data[16]
Definition: mxf.c:91
uint8_t high_bitdepth
Definition: cbs_av1.h:42
Coded bitstream unit structure.
Definition: cbs.h:64
void * content
Pointer to the decomposed form of this unit.
Definition: cbs.h:101
CodedBitstreamUnit * units
Pointer to an array of units of length nb_units_allocated.
Definition: cbs.h:162
#define AV_PIX_FMT_YUV422P12
Definition: pixfmt.h:402
AVColorPrimaries
Chromaticity coordinates of the source primaries.
Definition: pixfmt.h:455
static int av1_parser_split(AVCodecContext *avctx, const uint8_t *buf, int buf_size)
Definition: av1_parser.c:232
AVCodecParser ff_av1_parser
Definition: av1_parser.c:254
#define av_log(a,...)
static enum AVPixelFormat pix_fmts_8bit[2][2]
Definition: av1_parser.c:35
void ff_cbs_fragment_free(CodedBitstreamContext *ctx, CodedBitstreamFragment *frag)
Free the units array of a fragment in addition to what ff_cbs_fragment_reset does.
Definition: cbs.c:157
int parsed_extradata
Definition: av1_parser.c:32
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:269
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:176
#define td
Definition: regdef.h:70
uint8_t twelve_bit
Definition: cbs_av1.h:43
static int av1_parser_parse(AVCodecParserContext *ctx, AVCodecContext *avctx, const uint8_t **out_data, int *out_size, const uint8_t *data, int size)
Definition: av1_parser.c:52
AV1RawFrame frame
Definition: cbs_av1.h:395
also ITU-R BT1361 / IEC 61966-2-4 / SMPTE RP177 Annex B
Definition: pixfmt.h:457
union AV1RawOBU::@25 obu
#define AV_PIX_FMT_YUV444P10
Definition: pixfmt.h:400
static av_cold int av1_parser_init(AVCodecParserContext *ctx)
Definition: av1_parser.c:209
static void av1_parser_close(AVCodecParserContext *ctx)
Definition: av1_parser.c:224
static char * split(char *message, char delim)
Definition: af_channelmap.c:81
planar YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
Definition: pixfmt.h:70
AV1RawColorConfig color_config
Definition: cbs_av1.h:128
void * log_ctx
Logging context to be passed to all av_log() calls associated with this context.
Definition: cbs.h:173
uint8_t frame_type
Definition: cbs_av1.h:139
int width
picture width / height.
Definition: avcodec.h:699
AV1ReferenceFrameState * ref
Definition: cbs_av1.h:445
AV1RawOBUHeader header
Definition: cbs_av1.h:388
AVFormatContext * ctx
Definition: movenc.c:48
enum AVColorPrimaries color_primaries
Chromaticity coordinates of the source primaries.
Definition: avcodec.h:1140
#define s(width, name)
Definition: cbs_vp9.c:257
int level
level
Definition: avcodec.h:1982
uint8_t color_primaries
Definition: cbs_av1.h:47
#define FF_ARRAY_ELEMS(a)
the normal 2^n-1 "JPEG" YUV ranges
Definition: pixfmt.h:535
uint8_t subsampling_y
Definition: cbs_av1.h:53
int nb_decompose_unit_types
Length of the decompose_unit_types array.
Definition: cbs.h:201
Coded bitstream fragment structure, combining one or more units.
Definition: cbs.h:116
uint8_t subsampling_x
Definition: cbs_av1.h:52
main external API structure.
Definition: avcodec.h:526
int extradata_size
Definition: avcodec.h:628
#define AV_PIX_FMT_YUV420P10
Definition: pixfmt.h:397
Switching Predicted.
Definition: avutil.h:279
void ff_cbs_fragment_reset(CodedBitstreamContext *ctx, CodedBitstreamFragment *frag)
Free the units contained in a fragment as well as the fragment's own data buffer, but not the units a...
Definition: cbs.c:142
Context structure for coded bitstream operations.
Definition: cbs.h:168
enum AVColorSpace colorspace
YUV colorspace type.
Definition: avcodec.h:1154
Rational number (pair of numerator and denominator).
Definition: rational.h:58
enum AVColorTransferCharacteristic color_trc
Color Transfer Characteristic.
Definition: avcodec.h:1147
int type
Definition: av1_parse.h:48
uint8_t show_existing_frame
Definition: cbs_av1.h:134
CodedBitstreamContext * cbc
Definition: av1_parser.c:30
void ff_cbs_close(CodedBitstreamContext **ctx_ptr)
Close a context and free all internal state.
Definition: cbs.c:115
static enum AVPixelFormat pix_fmts_rgb[3]
Definition: av1_parser.c:48
AV1RawSequenceHeader * sequence_header
Definition: cbs_av1.h:419
uint8_t spatial_id
Definition: cbs_av1.h:37
#define AV_PIX_FMT_GBRP12
Definition: pixfmt.h:414
#define AV_PIX_FMT_YUV422P10
Definition: pixfmt.h:398
#define AV_PIX_FMT_YUV444P12
Definition: pixfmt.h:404
the normal 219*2^(n-8) "MPEG" YUV ranges
Definition: pixfmt.h:534
void * priv_data
Internal codec-specific data.
Definition: cbs.h:189
static av_always_inline AVRational av_inv_q(AVRational q)
Invert a rational.
Definition: rational.h:159
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
Definition: pixfmt.h:66
Y , 8bpp.
Definition: pixfmt.h:74
IEC 61966-2-1 (sRGB or sYCC)
Definition: pixfmt.h:494
common internal api header.
if(ret< 0)
Definition: vf_mcdeint.c:279
static int ref[MAX_W *MAX_W]
Definition: jpeg2000dwt.c:107
CodedBitstreamUnitType * decompose_unit_types
Array of unit types which should be decomposed when reading.
Definition: cbs.h:197
int len
int format
The format of the coded data, corresponds to enum AVPixelFormat for video and for enum AVSampleFormat...
Definition: avcodec.h:3517
AVRational av_mul_q(AVRational b, AVRational c)
Multiply two rationals.
Definition: rational.c:80
AV1RawFrameHeader frame_header
Definition: cbs_av1.h:394
uint8_t show_frame
Definition: cbs_av1.h:140
uint8_t frame_to_show_map_idx
Definition: cbs_av1.h:135
int ff_cbs_read(CodedBitstreamContext *ctx, CodedBitstreamFragment *frag, const uint8_t *data, size_t size)
Read a bitstream from a memory region into a fragment, then split into units and decompose.
Definition: cbs.c:269
AV1RawFrameHeader header
Definition: cbs_av1.h:300
AVPixelFormat
Pixel format.
Definition: pixfmt.h:64
int key_frame
Set by parser to 1 for key frames and 0 for non-key frames.
Definition: avcodec.h:3402
uint8_t seq_level_idx[AV1_MAX_OPERATING_POINTS]
Definition: cbs_av1.h:87
uint8_t transfer_characteristics
Definition: cbs_av1.h:48
Predicted.
Definition: avutil.h:275