FFmpeg coverage


Directory: ../../../ffmpeg/
File: src/libavutil/avstring.h
Date: 2025-01-20 09:27:23
Exec Total Coverage
Lines: 18 20 90.0%
Functions: 6 7 85.7%
Branches: 31 38 81.6%

Line Branch Exec Source
1 /*
2 * Copyright (c) 2007 Mans Rullgard
3 *
4 * This file is part of FFmpeg.
5 *
6 * FFmpeg is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
10 *
11 * FFmpeg is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
15 *
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with FFmpeg; if not, write to the Free Software
18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19 */
20
21 #ifndef AVUTIL_AVSTRING_H
22 #define AVUTIL_AVSTRING_H
23
24 #include <stddef.h>
25 #include <stdint.h>
26 #include "attributes.h"
27
28 /**
29 * @addtogroup lavu_string
30 * @{
31 */
32
33 /**
34 * Return non-zero if pfx is a prefix of str. If it is, *ptr is set to
35 * the address of the first character in str after the prefix.
36 *
37 * @param str input string
38 * @param pfx prefix to test
39 * @param ptr updated if the prefix is matched inside str
40 * @return non-zero if the prefix matches, zero otherwise
41 */
42 int av_strstart(const char *str, const char *pfx, const char **ptr);
43
44 /**
45 * Return non-zero if pfx is a prefix of str independent of case. If
46 * it is, *ptr is set to the address of the first character in str
47 * after the prefix.
48 *
49 * @param str input string
50 * @param pfx prefix to test
51 * @param ptr updated if the prefix is matched inside str
52 * @return non-zero if the prefix matches, zero otherwise
53 */
54 int av_stristart(const char *str, const char *pfx, const char **ptr);
55
56 /**
57 * Locate the first case-independent occurrence in the string haystack
58 * of the string needle. A zero-length string needle is considered to
59 * match at the start of haystack.
60 *
61 * This function is a case-insensitive version of the standard strstr().
62 *
63 * @param haystack string to search in
64 * @param needle string to search for
65 * @return pointer to the located match within haystack
66 * or a null pointer if no match
67 */
68 char *av_stristr(const char *haystack, const char *needle);
69
70 /**
71 * Locate the first occurrence of the string needle in the string haystack
72 * where not more than hay_length characters are searched. A zero-length
73 * string needle is considered to match at the start of haystack.
74 *
75 * This function is a length-limited version of the standard strstr().
76 *
77 * @param haystack string to search in
78 * @param needle string to search for
79 * @param hay_length length of string to search in
80 * @return pointer to the located match within haystack
81 * or a null pointer if no match
82 */
83 char *av_strnstr(const char *haystack, const char *needle, size_t hay_length);
84
85 /**
86 * Copy the string src to dst, but no more than size - 1 bytes, and
87 * null-terminate dst.
88 *
89 * This function is the same as BSD strlcpy().
90 *
91 * @param dst destination buffer
92 * @param src source string
93 * @param size size of destination buffer
94 * @return the length of src
95 *
96 * @warning since the return value is the length of src, src absolutely
97 * _must_ be a properly 0-terminated string, otherwise this will read beyond
98 * the end of the buffer and possibly crash.
99 */
100 size_t av_strlcpy(char *dst, const char *src, size_t size);
101
102 /**
103 * Append the string src to the string dst, but to a total length of
104 * no more than size - 1 bytes, and null-terminate dst.
105 *
106 * This function is similar to BSD strlcat(), but differs when
107 * size <= strlen(dst).
108 *
109 * @param dst destination buffer
110 * @param src source string
111 * @param size size of destination buffer
112 * @return the total length of src and dst
113 *
114 * @warning since the return value uses the length of src and dst, these
115 * absolutely _must_ be properly 0-terminated strings, otherwise this
116 * will read beyond the end of the buffer and possibly crash.
117 */
118 size_t av_strlcat(char *dst, const char *src, size_t size);
119
120 /**
121 * Append output to a string, according to a format. Never write out of
122 * the destination buffer, and always put a terminating 0 within
123 * the buffer.
124 * @param dst destination buffer (string to which the output is
125 * appended)
126 * @param size total size of the destination buffer
127 * @param fmt printf-compatible format string, specifying how the
128 * following parameters are used
129 * @return the length of the string that would have been generated
130 * if enough space had been available
131 */
132 size_t av_strlcatf(char *dst, size_t size, const char *fmt, ...) av_printf_format(3, 4);
133
134 /**
135 * Count the leading non-zero chars of s, examining at most len chars.
136 *
137 * @param s the string whose length to count
138 * @param len maximum number of characters to check in the string, that
139 * is the maximum value which is returned by the function
140 */
141 351 static inline size_t av_strnlen(const char *s, size_t len)
142 {
143 size_t i;
144
3/4
✓ Branch 0 taken 11904 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 11553 times.
✓ Branch 3 taken 351 times.
11904 for (i = 0; i < len && s[i]; i++)
145 ; /* empty body: the loop header does all the counting */
146 351 return i; /* equals len when no zero char was found in the first len chars */
147 }
148
149 /**
150 * Print arguments following specified format into a large enough auto
151 * allocated buffer. It is similar to GNU asprintf().
152 * @param fmt printf-compatible format string, specifying how the
153 * following parameters are used.
154 * @return the allocated string
155 * @note You have to free the string yourself with av_free().
156 */
157 char *av_asprintf(const char *fmt, ...) av_printf_format(1, 2);
158
159 /**
160 * Unescape the given string until a non escaped terminating char,
161 * and return the token corresponding to the unescaped string.
162 *
163 * The normal \ and ' escaping is supported. Leading and trailing
164 * whitespaces are removed, unless they are escaped with '\' or are
165 * enclosed between ''.
166 *
167 * @param buf the buffer to parse, buf will be updated to point to the
168 * terminating char
169 * @param term a 0-terminated list of terminating chars
170 * @return the malloced unescaped string, which must be av_freed by
171 * the user, NULL in case of allocation failure
172 */
173 char *av_get_token(const char **buf, const char *term);
174
175 /**
176 * Split the string into several tokens which can be accessed by
177 * successive calls to av_strtok().
178 *
179 * A token is defined as a sequence of characters not belonging to the
180 * set specified in delim.
181 *
182 * On the first call to av_strtok(), s should point to the string to
183 * parse, and the value of saveptr is ignored. In subsequent calls, s
184 * should be NULL, and saveptr should be unchanged since the previous
185 * call.
186 *
187 * This function is similar to strtok_r() defined in POSIX.1.
188 *
189 * @param s the string to parse, may be NULL
190 * @param delim 0-terminated list of token delimiters, must be non-NULL
191 * @param saveptr user-provided pointer which points to stored
192 * information necessary for av_strtok() to continue scanning the same
193 * string. saveptr is updated to point to the next character after the
194 * first delimiter found, or to NULL if the string was terminated
195 * @return the found token, or NULL when no token is found
196 */
197 char *av_strtok(char *s, const char *delim, char **saveptr);
198
199 /**
200 * Locale-independent ASCII isdigit(): non-zero if c is a decimal digit 0-9, zero otherwise.
201 */
202 7822360 static inline av_const int av_isdigit(int c)
203 {
204
4/4
✓ Branch 0 taken 7045854 times.
✓ Branch 1 taken 776506 times.
✓ Branch 2 taken 4136179 times.
✓ Branch 3 taken 2909675 times.
7822360 return c >= '0' && c <= '9';
205 }
206
207 /**
208 * Locale-independent ASCII isgraph(): non-zero if c is in the range 33 to 126 inclusive, zero otherwise.
209 */
210 static inline av_const int av_isgraph(int c)
211 {
212 return c > 32 && c < 127; /* 32 is the space character and 127 is DEL; both are excluded */
213 }
214
215 /**
216 * Locale-independent ASCII isspace(): non-zero if c is a space, form feed, newline, carriage return, horizontal tab or vertical tab, zero otherwise.
217 */
218 261747 static inline av_const int av_isspace(int c)
219 {
220
12/12
✓ Branch 0 taken 258120 times.
✓ Branch 1 taken 3627 times.
✓ Branch 2 taken 258118 times.
✓ Branch 3 taken 2 times.
✓ Branch 4 taken 257593 times.
✓ Branch 5 taken 525 times.
✓ Branch 6 taken 257590 times.
✓ Branch 7 taken 3 times.
✓ Branch 8 taken 257588 times.
✓ Branch 9 taken 2 times.
✓ Branch 10 taken 73 times.
✓ Branch 11 taken 257515 times.
261747 return c == ' ' || c == '\f' || c == '\n' || c == '\r' || c == '\t' ||
221 c == '\v';
222 }
223
224 /**
225 * Locale-independent conversion of ASCII characters to uppercase; any value outside a-z is returned unchanged.
226 */
227 14109569 static inline av_const int av_toupper(int c)
228 {
229
4/4
✓ Branch 0 taken 11099694 times.
✓ Branch 1 taken 3009875 times.
✓ Branch 2 taken 11092078 times.
✓ Branch 3 taken 7616 times.
14109569 if (c >= 'a' && c <= 'z')
230 11092078 c ^= 0x20; /* ASCII upper- and lowercase letters differ only in bit 0x20 */
231 14109569 return c;
232 }
233
234 /**
235 * Locale-independent conversion of ASCII characters to lowercase; any value outside A-Z is returned unchanged.
236 */
237 8620150 static inline av_const int av_tolower(int c)
238 {
239
4/4
✓ Branch 0 taken 8280165 times.
✓ Branch 1 taken 339985 times.
✓ Branch 2 taken 87670 times.
✓ Branch 3 taken 8192495 times.
8620150 if (c >= 'A' && c <= 'Z')
240 87670 c ^= 0x20; /* ASCII upper- and lowercase letters differ only in bit 0x20 */
241 8620150 return c;
242 }
243
244 /**
245 * Locale-independent ASCII isxdigit(): non-zero if c is a hexadecimal digit (0-9, a-f or A-F), zero otherwise.
246 */
247 8 static inline av_const int av_isxdigit(int c)
248 {
249 8 c = av_tolower(c); /* fold case so that only the a-f range needs checking below */
250
4/6
✓ Branch 0 taken 1 times.
✓ Branch 1 taken 7 times.
✓ Branch 2 taken 1 times.
✗ Branch 3 not taken.
✓ Branch 4 taken 1 times.
✗ Branch 5 not taken.
8 return av_isdigit(c) || (c >= 'a' && c <= 'f');
251 }
252
253 /**
254 * Locale-independent case-insensitive compare.
255 * @note This means only ASCII-range characters are case-insensitive
256 */
257 int av_strcasecmp(const char *a, const char *b);
258
259 /**
260 * Locale-independent case-insensitive compare.
261 * @note This means only ASCII-range characters are case-insensitive
262 */
263 int av_strncasecmp(const char *a, const char *b, size_t n);
264
265 /**
266 * Locale-independent string replacement.
267 * @note This means only ASCII-range characters are replaced.
268 */
269 char *av_strireplace(const char *str, const char *from, const char *to);
270
271 /**
272 * Thread safe basename.
273 * @param path the string to parse, on DOS both \ and / are considered separators.
274 * @return pointer to the basename substring.
275 * If path does not contain a slash, the function returns a copy of path.
276 * If path is a NULL pointer or points to an empty string, a pointer
277 * to a string "." is returned.
278 */
279 const char *av_basename(const char *path);
280
281 /**
282 * Thread safe dirname.
283 * @param path the string to parse, on DOS both \ and / are considered separators.
284 * @return A pointer to a string that's the parent directory of path.
285 * If path is a NULL pointer or points to an empty string, a pointer
286 * to a string "." is returned.
287 * @note the function may modify the contents of the path, so copies should be passed.
288 */
289 const char *av_dirname(char *path);
290
291 /**
292 * Match instances of a name in a comma-separated list of names.
293 * List entries are checked from the start to the end of the names list,
294 * the first match ends further processing. If an entry prefixed with '-'
295 * matches, then 0 is returned. The "ALL" list entry is considered to
296 * match all names.
297 *
298 * @param name Name to look for.
299 * @param names List of names.
300 * @return 1 on match, 0 otherwise.
301 */
302 int av_match_name(const char *name, const char *names);
303
304 /**
305 * Append path component to the existing path.
306 * Path separator '/' is placed between when needed.
307 * The resulting string has to be freed with av_free().
308 * @param path base path
309 * @param component component to be appended
310 * @return new path or NULL on error.
311 */
312 char *av_append_path_component(const char *path, const char *component);
313
314 enum AVEscapeMode { /* escaping modes accepted by the mode parameter of av_escape() */
315 AV_ESCAPE_MODE_AUTO, ///< Use auto-selected escaping mode.
316 AV_ESCAPE_MODE_BACKSLASH, ///< Use backslash escaping.
317 AV_ESCAPE_MODE_QUOTE, ///< Use single-quote escaping.
318 AV_ESCAPE_MODE_XML, ///< Use XML non-markup character data escaping.
319 };
320
321 /**
322 * Consider spaces special and escape them even in the middle of the
323 * string.
324 *
325 * This is equivalent to adding the whitespace characters to the special
326 * characters lists, except it is guaranteed to use the exact same list
327 * of whitespace characters as the rest of libavutil.
328 */
329 #define AV_ESCAPE_FLAG_WHITESPACE (1 << 0)
330
331 /**
332 * Escape only specified special characters.
333 * Without this flag, escape also any characters that may be considered
334 * special by av_get_token(), such as the single quote.
335 */
336 #define AV_ESCAPE_FLAG_STRICT (1 << 1)
337
338 /**
339 * Within AV_ESCAPE_MODE_XML, additionally escape single quotes for single
340 * quoted attributes.
341 */
342 #define AV_ESCAPE_FLAG_XML_SINGLE_QUOTES (1 << 2)
343
344 /**
345 * Within AV_ESCAPE_MODE_XML, additionally escape double quotes for double
346 * quoted attributes.
347 */
348 #define AV_ESCAPE_FLAG_XML_DOUBLE_QUOTES (1 << 3)
349
350
351 /**
352 * Escape string in src, and put the escaped string in an allocated
353 * string in *dst, which must be freed with av_free().
354 *
355 * @param dst pointer where an allocated string is put
356 * @param src string to escape, must be non-NULL
357 * @param special_chars string containing the special characters which
358 * need to be escaped, can be NULL
359 * @param mode escape mode to employ, see enum AVEscapeMode.
360 * Any unknown value for mode will be considered equivalent to
361 * AV_ESCAPE_MODE_BACKSLASH, but this behaviour can change without
362 * notice.
363 * @param flags flags which control how to escape, see AV_ESCAPE_FLAG_* macros
364 * @return the length of the allocated string, or a negative error code in case of error
365 * @see av_bprint_escape()
366 */
367 av_warn_unused_result
368 int av_escape(char **dst, const char *src, const char *special_chars,
369 enum AVEscapeMode mode, int flags);
370
371 #define AV_UTF8_FLAG_ACCEPT_INVALID_BIG_CODES 1 ///< accept codepoints over 0x10FFFF
372 #define AV_UTF8_FLAG_ACCEPT_NON_CHARACTERS 2 ///< accept non-characters - 0xFFFE and 0xFFFF
373 #define AV_UTF8_FLAG_ACCEPT_SURROGATES 4 ///< accept UTF-16 surrogates codes
374 #define AV_UTF8_FLAG_EXCLUDE_XML_INVALID_CONTROL_CODES 8 ///< exclude control codes not accepted by XML
375
/**
 * Combination of all three AV_UTF8_FLAG_ACCEPT_* flags.
 *
 * The expansion is parenthesized so that the macro behaves as a single
 * value inside larger expressions: '&' binds tighter than '|', so without
 * the parentheses (flags & AV_UTF8_FLAG_ACCEPT_ALL) would only mask the
 * first flag and then OR in the remaining ones unconditionally.
 */
#define AV_UTF8_FLAG_ACCEPT_ALL \
    (AV_UTF8_FLAG_ACCEPT_INVALID_BIG_CODES|AV_UTF8_FLAG_ACCEPT_NON_CHARACTERS|AV_UTF8_FLAG_ACCEPT_SURROGATES)
378
379 /**
380 * Read and decode a single UTF-8 code point (character) from the
381 * buffer in *bufp, and update *bufp to point to the next byte to
382 * decode.
383 *
384 * In case of an invalid byte sequence, the pointer will be updated to
385 * the next byte after the invalid sequence and the function will
386 * return an error code.
387 *
388 * Depending on the specified flags, the function will also fail in
389 * case the decoded code point does not belong to a valid range.
390 *
391 * @note For speed-relevant code a carefully implemented use of
392 * GET_UTF8() may be preferred.
393 *
394 * @param codep pointer used to return the parsed code in case of success.
395 * The value in *codep is set even in case the range check fails.
396 * @param bufp pointer to the address of the first byte of the sequence
397 * to decode, updated by the function to point to the
398 * byte immediately after the decoded sequence
399 * @param buf_end pointer to the end of the buffer, points to the next
400 * byte past the last in the buffer. This is used to
401 * avoid buffer overreads (in case of an unfinished
402 * UTF-8 sequence towards the end of the buffer).
403 * @param flags a collection of AV_UTF8_FLAG_* flags
404 * @return >= 0 in case a sequence was successfully read, a negative
405 * value in case of invalid sequence
406 */
407 av_warn_unused_result
408 int av_utf8_decode(int32_t *codep, const uint8_t **bufp, const uint8_t *buf_end,
409 unsigned int flags);
410
411 /**
412 * Check if a name is in a list.
413 * @returns 0 if not found, or the 1-based index where it has been found in the
414 * list.
415 */
416 int av_match_list(const char *name, const char *list, char separator);
417
418 /**
419 * See libc sscanf manual for more information.
420 * Locale-independent sscanf implementation.
421 */
422 int av_sscanf(const char *string, const char *format, ...);
423
424 /**
425 * @}
426 */
427
428 #endif /* AVUTIL_AVSTRING_H */
429