FFmpeg coverage


Directory: ../../../ffmpeg/
File: src/libavformat/rtpdec_av1.c
Date: 2025-03-08 20:38:41
Exec Total Coverage
Lines: 0 188 0.0%
Functions: 0 5 0.0%
Branches: 0 126 0.0%

Line Branch Exec Source
1 /*
2 * Depacketization for RTP Payload Format For AV1 (v1.0)
3 * https://aomediacodec.github.io/av1-rtp-spec/
4 * Copyright (c) 2024 Axis Communications
5 *
6 * This file is part of FFmpeg.
7 *
8 * FFmpeg is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License as published by the Free Software Foundation; either
11 * version 2.1 of the License, or (at your option) any later version.
12 *
13 * FFmpeg is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 * Lesser General Public License for more details.
17 *
18 * You should have received a copy of the GNU Lesser General Public
19 * License along with FFmpeg; if not, write to the Free Software
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21 */
22
23 /**
24 * @file
25 * @brief AV1 / RTP depacketization code (RTP Payload Format For AV1 (v1.0))
26 * @author Chris Hodges <chris.hodges@axis.com>
27 * @note The process will restore TDs and put back size fields into headers.
28 * It will also try to keep complete OBUs and remove partial OBUs
29 * caused by packet drops and thus keep the stream syntactically intact.
30 */
31
32 #include "libavutil/avstring.h"
33 #include "libavutil/mem.h"
34 #include "avformat.h"
35
36 #include "rtpdec.h"
37 #include "libavcodec/av1.h"
38 #include "rtp_av1.h"
39
40 // enable tracing of packet data
41 //#define RTPDEC_AV1_VERBOSE_TRACE
42
43 /**
44 * RTP/AV1 specific private data.
45 */
46 struct PayloadContext {
47 uint32_t timestamp; ///< last received timestamp for frame
48 uint8_t profile; ///< profile (main/high/professional)
49 uint8_t level_idx; ///< level (0-31)
50 uint8_t tier; ///< main tier or high tier
51 uint16_t prev_seq; ///< sequence number of previous packet
52 unsigned int frag_obu_size; ///< current total size of fragmented OBU
53 unsigned int frag_pkt_leb_pos; ///< offset in buffer where OBU LEB starts
54 unsigned int frag_lebs_res; ///< number of bytes reserved for LEB
55 unsigned int frag_header_size; ///< size of OBU header (1 or 2)
56 int needs_td; ///< indicates that a TD should be output
57 int drop_fragment; ///< drop all fragments until next frame
58 int keyframe_seen; ///< keyframe was seen
59 int wait_for_keyframe; ///< message about waiting for keyframe has been issued
60 };
61
62 static int sdp_parse_fmtp_config_av1(AVFormatContext *s,
63 AVStream *stream,
64 PayloadContext *av1_data,
65 const char *attr, const char *value) {
66 if (!strcmp(attr, "profile")) {
67 av1_data->profile = atoi(value);
68 av_log(s, AV_LOG_DEBUG, "RTP AV1 profile: %u\n", av1_data->profile);
69 } else if (!strcmp(attr, "level-idx")) {
70 av1_data->level_idx = atoi(value);
71 av_log(s, AV_LOG_DEBUG, "RTP AV1 level: %u\n", av1_data->profile);
72 } else if (!strcmp(attr, "tier")) {
73 av1_data->tier = atoi(value);
74 av_log(s, AV_LOG_DEBUG, "RTP AV1 tier: %u\n", av1_data->tier);
75 }
76 return 0;
77 }
78
79 // return 0 on complete packet, -1 on partial packet
80 static int av1_handle_packet(AVFormatContext *ctx, PayloadContext *data,
81 AVStream *st, AVPacket *pkt, uint32_t *timestamp,
82 const uint8_t *buf, int len, uint16_t seq,
83 int flags) {
84 uint8_t aggr_hdr;
85 int result = 0;
86 int is_frag_cont;
87 int is_last_fragmented;
88 int is_first_pkt;
89 unsigned int num_obus;
90 unsigned int obu_cnt = 1;
91 unsigned int rem_pkt_size = len;
92 unsigned int pktpos;
93 const uint8_t *buf_ptr = buf;
94 uint16_t expected_seq = data->prev_seq + 1;
95 int16_t seq_diff = seq - expected_seq;
96
97 data->prev_seq = seq;
98
99 if (!len) {
100 av_log(ctx, AV_LOG_ERROR, "Empty AV1 RTP packet\n");
101 return AVERROR_INVALIDDATA;
102 }
103 if (len < 2) {
104 av_log(ctx, AV_LOG_ERROR, "AV1 RTP packet too short\n");
105 return AVERROR_INVALIDDATA;
106 }
107
108 /* The payload structure is supposed to be straight-forward, but there are a
109 * couple of edge cases which need to be tackled and make things a bit more
110 * complex.
111 * These are mainly due to:
112 * - To reconstruct the OBU size for fragmented packets and place it the OBU
113 * header, the final size will not be known until the last fragment has
114 * been parsed. However, the number LEBs in the header is variable
115 * depending on the length of the payload.
116 * - We are increasing the out-packet size while we are getting fragmented
117 * OBUs. If an RTP packet gets dropped, we would create corrupted OBUs.
118 * In this case we decide to drop the whole frame.
119 */
120
121 #ifdef RTPDEC_AV1_VERBOSE_TRACE
122 av_log(ctx, AV_LOG_TRACE, "RTP Packet %d in (%x), len=%d:\n",
123 seq, flags, len);
124 av_hex_dump_log(ctx, AV_LOG_TRACE, buf, FFMIN(len, 64));
125 av_log(ctx, AV_LOG_TRACE, "... end at offset %x:\n", FFMAX(len - 64, 0));
126 av_hex_dump_log(ctx, AV_LOG_TRACE, buf + FFMAX(len - 64, 0), FFMIN(len - 64, 64));
127 #endif
128
129 /* 8 bit aggregate header: Z Y W W N - - - */
130 aggr_hdr = *buf_ptr++;
131 rem_pkt_size--;
132
133 /* Z: MUST be set to 1 if the first OBU element is an OBU fragment that is a
134 * continuation of an OBU fragment from the previous packet, and MUST be set
135 * to 0 otherwise */
136 is_frag_cont = (aggr_hdr >> AV1B_AGGR_HDR_FRAG_CONT) & 1;
137
138 /* Y: MUST be set to 1 if the last OBU element is an OBU fragment that will
139 * continue in the next packet, and MUST be set to 0 otherwise */
140 is_last_fragmented = (aggr_hdr >> AV1B_AGGR_HDR_LAST_FRAG) & 1;
141
142 /* W: two bit field that describes the number of OBU elements in the packet.
143 * This field MUST be set equal to 0 or equal to the number of OBU elements
144 * contained in the packet.
145 * If set to 0, each OBU element MUST be preceded by a length field.
146 * If not set to 0 (i.e., W = 1, 2 or 3) the last OBU element MUST NOT be
147 * preceded by a length field (it's derived from RTP packet size minus other
148 * known lengths). */
149 num_obus = (aggr_hdr >> AV1S_AGGR_HDR_NUM_OBUS) & AV1M_AGGR_HDR_NUM_OBUS;
150
151 /* N: MUST be set to 1 if the packet is the first packet of a coded video
152 * sequence, and MUST be set to 0 otherwise.*/
153 is_first_pkt = (aggr_hdr >> AV1B_AGGR_HDR_FIRST_PKT) & 1;
154
155 if (is_frag_cont) {
156 if (data->drop_fragment) {
157 return AVERROR_INVALIDDATA;
158 }
159 if (is_first_pkt) {
160 av_log(ctx, AV_LOG_ERROR, "Illegal aggregation header in first AV1 RTP packet\n");
161 return AVERROR_INVALIDDATA;
162 }
163 if (seq_diff) {
164 av_log(ctx, AV_LOG_WARNING, "AV1 RTP frag packet sequence mismatch (%d != %d), dropping temporal unit\n",
165 seq, expected_seq);
166 goto drop_fragment;
167 }
168 if (!pkt->size || !data->frag_obu_size) {
169 av_log(ctx, AV_LOG_WARNING, "Unexpected fragment continuation in AV1 RTP packet\n");
170 goto drop_fragment; // avoid repeated output for the same fragment
171 }
172 } else {
173 if (!is_first_pkt && !data->keyframe_seen) {
174 if (!data->wait_for_keyframe) {
175 data->wait_for_keyframe = 1;
176 av_log(ctx, AV_LOG_WARNING, "AV1 RTP packet before keyframe, dropping and waiting for next keyframe\n");
177 }
178 goto drop_fragment;
179 }
180 if (seq_diff && !is_first_pkt) {
181 av_log(ctx, AV_LOG_WARNING, "AV1 RTP unfrag packet sequence mismatch (%d != %d), dropping temporal unit\n",
182 seq, expected_seq);
183 goto drop_fragment;
184 }
185 data->drop_fragment = 0;
186 if (!data->needs_td && ((data->timestamp != *timestamp) || is_first_pkt)) {
187 av_log(ctx, AV_LOG_TRACE, "Timestamp changed to %u (or first pkt %d), forcing TD\n", *timestamp, is_first_pkt);
188 data->needs_td = 1;
189 data->frag_obu_size = 0; // new temporal unit might have been caused by dropped packets
190 }
191 if (data->frag_obu_size) {
192 data->frag_obu_size = 0; // make sure we recover
193 av_log(ctx, AV_LOG_ERROR, "Missing fragment continuation in AV1 RTP packet\n");
194 return AVERROR_INVALIDDATA;
195 }
196 // update the timestamp in the frame packet with the one from the RTP packet
197 data->timestamp = *timestamp;
198 }
199 pktpos = pkt->size;
200
201 #ifdef RTPDEC_AV1_VERBOSE_TRACE
202 av_log(ctx, AV_LOG_TRACE, "Input buffer size %d, aggr head 0x%02x fc %d, lf %d, no %d, fp %d\n",
203 len, aggr_hdr, is_frag_cont, is_last_fragmented, num_obus, is_first_pkt);
204 #endif
205
206 if (is_first_pkt) {
207 pkt->flags |= AV_PKT_FLAG_KEY;
208 data->keyframe_seen = 1;
209 data->wait_for_keyframe = 0;
210 }
211
212 // loop over OBU elements
213 while (rem_pkt_size) {
214 uint32_t obu_size;
215 int num_lebs;
216 int needs_size_field;
217 int output_size;
218 unsigned int obu_payload_size;
219 uint8_t obu_hdr;
220
221 obu_size = rem_pkt_size;
222 if (!num_obus || obu_cnt < num_obus) {
223 // read out explicit OBU element size (which almost corresponds to the original OBU size)
224 num_lebs = parse_leb(ctx, buf_ptr, rem_pkt_size, &obu_size);
225 if (!num_lebs) {
226 return AVERROR_INVALIDDATA;
227 }
228 rem_pkt_size -= num_lebs;
229 buf_ptr += num_lebs;
230 }
231 // read first byte (which is the header byte only for non-fragmented elements)
232 obu_hdr = *buf_ptr;
233 if (obu_size > rem_pkt_size) {
234 av_log(ctx, AV_LOG_ERROR, "AV1 OBU size %u larger than remaining pkt size %d\n", obu_size, rem_pkt_size);
235 return AVERROR_INVALIDDATA;
236 }
237
238 if (!obu_size) {
239 av_log(ctx, AV_LOG_ERROR, "Unreasonable AV1 OBU size %u\n", obu_size);
240 return AVERROR_INVALIDDATA;
241 }
242
243 if (!is_frag_cont) {
244 uint8_t obu_type = (obu_hdr >> AV1S_OBU_TYPE) & AV1M_OBU_TYPE;
245 if (obu_hdr & AV1F_OBU_FORBIDDEN) {
246 av_log(ctx, AV_LOG_ERROR, "Forbidden bit set in AV1 OBU header (0x%02x)\n", obu_hdr);
247 return AVERROR_INVALIDDATA;
248 }
249 // ignore and remove OBUs according to spec
250 if ((obu_type == AV1_OBU_TEMPORAL_DELIMITER) ||
251 (obu_type == AV1_OBU_TILE_LIST)) {
252 pktpos += obu_size;
253 rem_pkt_size -= obu_size;
254 // TODO: This probably breaks if the OBU_TILE_LIST is fragmented
255 // into the next RTP packet, so at least check and fail here
256 if (rem_pkt_size == 0 && is_last_fragmented) {
257 avpriv_report_missing_feature(ctx, "AV1 OBU_TILE_LIST (should not be there!) to be ignored but is fragmented\n");
258 return AVERROR_PATCHWELCOME;
259 }
260 obu_cnt++;
261 continue;
262 }
263 }
264
265 // If we need to add a size field, out size will be different
266 output_size = obu_size;
267 // Spec says the OBUs should have their size fields removed,
268 // but this is not mandatory
269 if (is_frag_cont || (obu_hdr & AV1F_OBU_HAS_SIZE_FIELD)) {
270 needs_size_field = 0;
271 } else {
272 needs_size_field = 1;
273 // (re)calculate number of LEB bytes needed (if it was implicit, there were no LEBs)
274 output_size += calc_leb_size(obu_size - (1 + ((obu_hdr & AV1F_OBU_EXTENSION_FLAG) ? 1 : 0)));
275 }
276
277 if (!is_frag_cont && (obu_cnt == 1)) {
278 if (data->needs_td) {
279 output_size += 2; // for Temporal Delimiter (TD)
280 }
281 if (pkt->data) {
282 if ((result = av_grow_packet(pkt, output_size)) < 0)
283 return result;
284 } else {
285 if ((result = av_new_packet(pkt, output_size) < 0))
286 return result;
287 }
288
289 if (data->needs_td) {
290 // restore TD
291 pkt->data[pktpos++] = 0x12;
292 pkt->data[pktpos++] = 0x00;
293 }
294 data->needs_td = 0;
295 } else {
296 if ((result = av_grow_packet(pkt, output_size)) < 0)
297 return result;
298 }
299
300 obu_payload_size = obu_size;
301 // do we need to restore the OBU size field?
302 if (needs_size_field) {
303 // set obu_has_size_field in header byte
304 pkt->data[pktpos++] = *buf_ptr++ | AV1F_OBU_HAS_SIZE_FIELD;
305 data->frag_header_size = 1;
306 obu_payload_size--;
307
308 // copy extension byte, if available
309 if (obu_hdr & AV1F_OBU_EXTENSION_FLAG) {
310 /* TODO we cannot handle the edge case where last element is a
311 * fragment of exactly one byte AND the header has the extension
312 * flag set. Note that it would be more efficient to not send a
313 * fragment of one byte and instead drop the size field of the
314 * prior element */
315 if (!obu_payload_size) {
316 av_log(ctx, AV_LOG_ERROR, "AV1 OBU too short for extension byte (0x%02x)\n",
317 obu_hdr);
318 return AVERROR_INVALIDDATA;
319 }
320 pkt->data[pktpos++] = *buf_ptr++;
321 data->frag_header_size = 2;
322 obu_payload_size--;
323 }
324
325 // remember start position of LEB for possibly fragmented packet to
326 // fixup OBU size later
327 data->frag_pkt_leb_pos = pktpos;
328 // write intermediate OBU size field
329 num_lebs = write_leb(pkt->data + pktpos, obu_payload_size);
330 data->frag_lebs_res = num_lebs;
331 pktpos += num_lebs;
332 }
333 // copy verbatim or without above header size patch
334 memcpy(pkt->data + pktpos, buf_ptr, obu_payload_size);
335 pktpos += obu_payload_size;
336 buf_ptr += obu_payload_size;
337 rem_pkt_size -= obu_size;
338
339 // if we were handling a fragmented packet and this was the last
340 // fragment, correct OBU size field
341 if (data->frag_obu_size && (rem_pkt_size || !is_last_fragmented)) {
342 uint32_t final_obu_size = data->frag_obu_size + obu_size - data->frag_header_size;
343 uint8_t *lebptr = pkt->data + data->frag_pkt_leb_pos;
344 num_lebs = calc_leb_size(final_obu_size);
345
346 // check if we had allocated enough LEB bytes in header,
347 // otherwise make some extra space
348 if (num_lebs > data->frag_lebs_res) {
349 int extra_bytes = num_lebs - data->frag_lebs_res;
350 if ((result = av_grow_packet(pkt, extra_bytes)) < 0)
351 return result;
352 // update pointer in case buffer address changed
353 lebptr = pkt->data + data->frag_pkt_leb_pos;
354 // move existing data for OBU back a bit
355 memmove(lebptr + extra_bytes, lebptr,
356 pkt->size - extra_bytes - data->frag_pkt_leb_pos);
357 // move pktpos further down for following OBUs in same packet.
358 pktpos += extra_bytes;
359 }
360
361 // update OBU size field
362 write_leb(lebptr, final_obu_size);
363
364 data->frag_obu_size = 0; // signal end of fragment
365 } else if (is_last_fragmented && !rem_pkt_size) {
366 // add to total OBU size, so we can fix that in OBU header
367 // (but only if the OBU size was missing!)
368 if (needs_size_field || data->frag_obu_size) {
369 data->frag_obu_size += obu_size;
370 }
371 // fragment not yet finished!
372 result = -1;
373 }
374 is_frag_cont = 0;
375
376 if (!rem_pkt_size && !num_obus && (num_obus != obu_cnt)) {
377 av_log(ctx, AV_LOG_WARNING, "AV1 aggregation header indicated %u OBU elements, was %u\n",
378 num_obus, obu_cnt);
379 }
380 obu_cnt++;
381 }
382
383 if (flags & RTP_FLAG_MARKER) {
384 av_log(ctx, AV_LOG_TRACE, "TD on next packet due to marker\n");
385 data->needs_td = 1;
386 } else {
387 // fragment may be complete, but temporal unit is not yet finished
388 result = -1;
389 }
390
391 if (!is_last_fragmented) {
392 data->frag_obu_size = 0;
393 data->frag_pkt_leb_pos = 0;
394 }
395
396 #ifdef RTPDEC_AV1_VERBOSE_TRACE
397 if (!result) {
398 av_log(ctx, AV_LOG_TRACE, "AV1 out pkt-size: %d\n", pkt->size);
399 av_hex_dump_log(ctx, AV_LOG_TRACE, pkt->data, FFMIN(pkt->size, 64));
400 av_log(ctx, AV_LOG_TRACE, "... end at offset %x:\n", FFMAX(pkt->size - 64, 0));
401 av_hex_dump_log(ctx, AV_LOG_TRACE, pkt->data + FFMAX(pkt->size - 64, 0), FFMIN(pkt->size, 64));
402 }
403 #endif
404 pkt->stream_index = st->index;
405
406 return result;
407
408 drop_fragment:
409 data->keyframe_seen = 0;
410 data->drop_fragment = 1;
411 data->frag_obu_size = 0;
412 data->needs_td = 1;
413 if (pkt->size) {
414 av_log(ctx, AV_LOG_TRACE, "Dumping current AV1 frame packet\n");
415 // we can't seem to deallocate the fragmented packet, but we can shrink it to 0
416 av_shrink_packet(pkt, 0);
417 }
418 return AVERROR_INVALIDDATA;
419 }
420
421 static void av1_close_context(PayloadContext *data) {
422 }
423
424 static int av1_need_keyframe(PayloadContext *data)
425 {
426 return !data->keyframe_seen;
427 }
428
429 static int parse_av1_sdp_line(AVFormatContext *s, int st_index,
430 PayloadContext *av1_data, const char *line) {
431 AVStream * stream;
432 const char *p = line;
433 int result = 0;
434
435 if (st_index < 0)
436 return 0;
437
438 stream = s->streams[st_index];
439
440 /* Optional parameters are profile, level-idx, and tier.
441 * See Section 7.2.1 of https://aomediacodec.github.io/av1-rtp-spec/ */
442 if (av_strstart(p, "fmtp:", &p)) {
443 result = ff_parse_fmtp(s, stream, av1_data, p, sdp_parse_fmtp_config_av1);
444 av_log(s, AV_LOG_DEBUG, "RTP AV1 Profile: %u, Level: %u, Tier: %u\n",
445 av1_data->profile, av1_data->level_idx, av1_data->tier);
446 }
447
448 return result;
449 }
450
451 const RTPDynamicProtocolHandler ff_av1_dynamic_handler = {
452 .enc_name = "AV1",
453 .codec_type = AVMEDIA_TYPE_VIDEO,
454 .codec_id = AV_CODEC_ID_AV1,
455 .need_parsing = AVSTREAM_PARSE_FULL,
456 .priv_data_size = sizeof(PayloadContext),
457 .parse_sdp_a_line = parse_av1_sdp_line,
458 .close = av1_close_context,
459 .parse_packet = av1_handle_packet,
460 .need_keyframe = av1_need_keyframe,
461 };
462