libavutil/avstring.c
fc78ce80
 /*
  * Copyright (c) 2000, 2001, 2002 Fabrice Bellard
  * Copyright (c) 2007 Mans Rullgard
  *
  * This file is part of FFmpeg.
  *
  * FFmpeg is free software; you can redistribute it and/or
  * modify it under the terms of the GNU Lesser General Public
  * License as published by the Free Software Foundation; either
  * version 2.1 of the License, or (at your option) any later version.
  *
  * FFmpeg is distributed in the hope that it will be useful,
  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  * Lesser General Public License for more details.
  *
  * You should have received a copy of the GNU Lesser General Public
  * License along with FFmpeg; if not, write to the Free Software
  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  */
 
1e7f3638
 #include <stdarg.h>
1d9c2dc8
 #include <stdint.h>
1e7f3638
 #include <stdio.h>
fc78ce80
 #include <string.h>
4333df63
 
d8fd06c3
 #include "config.h"
 #include "common.h"
64b12fc3
 #include "mem.h"
d4ec07df
 #include "avassert.h"
4333df63
 #include "avstring.h"
9767ec6b
 #include "bprint.h"
fc78ce80
 
 /**
  * Check whether str begins with the prefix pfx (case-sensitive).
  *
  * @param str string to examine
  * @param pfx prefix to look for
  * @param ptr if non-NULL and the prefix matches, receives the address of the
  *            first character of str that follows the prefix
  * @return 1 if str starts with pfx, 0 otherwise
  */
 int av_strstart(const char *str, const char *pfx, const char **ptr)
 {
     int matched;
 
     /* walk both strings in lockstep until the prefix ends or they diverge */
     for (; *pfx != '\0' && *str == *pfx; str++)
         pfx++;
 
     matched = (*pfx == '\0');
     if (matched && ptr)
         *ptr = str;
     return matched;
 }
 
 /**
  * Check whether str begins with the prefix pfx, comparing characters after
  * passing both through av_toupper().
  *
  * @param str string to examine
  * @param pfx prefix to look for
  * @param ptr if non-NULL and the prefix matches, receives the address of the
  *            first character of str that follows the prefix
  * @return 1 if str starts with pfx, 0 otherwise
  */
 int av_stristart(const char *str, const char *pfx, const char **ptr)
 {
     while (*pfx) {
         if (av_toupper((unsigned)*pfx) != av_toupper((unsigned)*str))
             break;
         pfx++;
         str++;
     }
 
     /* a leftover prefix character means the strings diverged */
     if (*pfx)
         return 0;
 
     if (ptr)
         *ptr = str;
     return 1;
 }
 
ac6ef868
 /**
  * Find the first occurrence of s2 in s1, using av_stristart() for the
  * comparison at each candidate position.
  *
  * @param s1 string to search in
  * @param s2 string to search for
  * @return pointer into s1 at the start of the match, s1 itself when s2 is
  *         empty, or NULL when there is no match
  */
 char *av_stristr(const char *s1, const char *s2)
 {
     const char *pos;
 
     if (*s2 == '\0')
         return (char*)(intptr_t)s1;
 
     /* try every start position, including the terminating NUL itself */
     for (pos = s1; ; pos++) {
         if (av_stristart(pos, s2, NULL))
             return (char*)(intptr_t)pos;
         if (*pos == '\0')
             break;
     }
 
     return NULL;
 }
 
b85a5e87
 /**
  * Find the first occurrence of needle within the first hay_length bytes of
  * haystack. Bytes are compared with memcmp(), so the search does not stop
  * at a NUL byte inside that range.
  *
  * @param haystack   buffer to search in
  * @param needle     NUL-terminated string to search for
  * @param hay_length number of bytes of haystack to consider
  * @return pointer to the start of the match, haystack itself when needle is
  *         empty, or NULL when there is no match
  */
 char *av_strnstr(const char *haystack, const char *needle, size_t hay_length)
 {
     const size_t needle_len = strlen(needle);
     const char *cur;
 
     if (needle_len == 0)
         return (char*)haystack;
 
     /* stop as soon as fewer bytes remain than the needle needs */
     for (cur = haystack; hay_length >= needle_len; cur++, hay_length--) {
         if (memcmp(cur, needle, needle_len) == 0)
             return (char*)cur;
     }
     return NULL;
 }
 
fc78ce80
 /**
  * Copy src into dst, writing at most size bytes including the terminating
  * NUL. When size is 0 nothing is written.
  *
  * @param dst  destination buffer
  * @param src  NUL-terminated source string
  * @param size size of the destination buffer in bytes
  * @return the length of src; a value >= size means the copy was truncated
  */
 size_t av_strlcpy(char *dst, const char *src, size_t size)
 {
     size_t copied = 0;
 
     if (size > 0) {
         /* leave one byte of room for the terminator */
         while (copied + 1 < size && src[copied] != '\0') {
             dst[copied] = src[copied];
             copied++;
         }
         dst[copied] = '\0';
     }
 
     /* what was copied plus whatever did not fit */
     return copied + strlen(src + copied);
 }
 
 /**
  * Append src to the NUL-terminated string in dst, never writing beyond
  * size bytes of dst in total (terminator included).
  *
  * @param dst  destination buffer holding a NUL-terminated string
  * @param src  NUL-terminated string to append
  * @param size total size of the destination buffer in bytes
  * @return strlen(dst) before the call plus strlen(src); a value >= size
  *         means the result was truncated
  */
 size_t av_strlcat(char *dst, const char *src, size_t size)
 {
     const size_t used = strlen(dst);
 
     /* only copy when at least one character plus the terminator fits */
     if (used + 1 < size)
         return used + av_strlcpy(dst + used, src, size - used);
 
     return used + strlen(src);
 }
1e7f3638
 
 /**
  * Append printf-style formatted output to the NUL-terminated string in dst,
  * never writing beyond size bytes of dst in total.
  *
  * @param dst  destination buffer holding a NUL-terminated string
  * @param size total size of the destination buffer in bytes
  * @param fmt  printf-compatible format string
  * @return strlen(dst) before the call plus the value returned by
  *         vsnprintf() for the formatted text
  */
 size_t av_strlcatf(char *dst, size_t size, const char *fmt, ...)
 {
     va_list args;
     size_t used = strlen(dst);
     size_t room = 0;
 
     /* no room at all when dst already fills (or exceeds) the buffer */
     if (size > used)
         room = size - used;
 
     va_start(args, fmt);
     used += vsnprintf(dst + used, room, fmt, args);
     va_end(args);
 
     return used;
 }
277c7332
 
61e2e296
 /**
  * Format a string printf-style into a buffer obtained from av_malloc().
  *
  * The text is formatted twice: once to measure it, once to write it.
  *
  * @param fmt printf-compatible format string
  * @return the newly allocated string, or NULL if formatting or allocation
  *         failed
  */
 char *av_asprintf(const char *fmt, ...)
 {
     va_list args;
     char *str;
     int needed, written;
 
     /* first pass: measure only */
     va_start(args, fmt);
     needed = vsnprintf(NULL, 0, fmt, args);
     va_end(args);
     if (needed < 0)
         return NULL;
 
     str = av_malloc(needed + 1);
     if (!str)
         return NULL;
 
     /* second pass: produce the text */
     va_start(args, fmt);
     written = vsnprintf(str, needed + 1, fmt, args);
     va_end(args);
     if (written < 0)
         av_freep(&str);
 
     return str;
 }
 
b3e88ae8
 /**
  * Convert a double to its "%f" textual representation in a buffer
  * obtained from av_malloc().
  *
  * The buffer is sized from the measured length of the formatted value, so
  * large magnitudes are no longer cut off (a fixed 16-byte buffer cannot hold
  * "%f" output for values with more than 8 integer digits).
  *
  * @param d value to convert
  * @return the newly allocated string, or NULL if formatting or allocation
  *         failed
  */
 char *av_d2str(double d)
 {
     char *str;
     /* measuring pass: snprintf reports the length it would have written */
     int len = snprintf(NULL, 0, "%f", d);
 
     if (len < 0)
         return NULL;
 
     str = av_malloc(len + 1);
     if (str)
         snprintf(str, len + 1, "%f", d);
     return str;
 }
372e2884
 
 /* Characters skipped at the start of a token and trimmed from its end. */
 #define WHITESPACES " \n\t"
 
 /**
  * Extract one token from the string *buf into a newly allocated buffer.
  *
  * Leading WHITESPACES are skipped. Characters are then copied until the end
  * of the string or the first unescaped, unquoted character contained in
  * term. A backslash followed by another character copies that character
  * literally; text between single quotes is copied verbatim. Trailing
  * WHITESPACES are removed from the result unless they were escaped or
  * inside a terminated quoted section.
  *
  * @param buf  in: address of the string to parse; out: updated to point at
  *             the terminating character (or the end of the string). Left
  *             unchanged when allocation fails.
  * @param term set of characters that end the token
  * @return the token, allocated with av_malloc(), or NULL on allocation
  *         failure
  */
 char *av_get_token(const char **buf, const char *term)
 {
4333df63
     /* the token can never be longer than the remaining input */
     char *out     = av_malloc(strlen(*buf) + 1);
     /* ret: start of the result; end: one past the last character that
      * must survive trailing-whitespace trimming */
     char *ret     = out, *end = out;
372e2884
     const char *p = *buf;
4333df63
     if (!out)
         return NULL;
372e2884
     p += strspn(p, WHITESPACES);
 
4333df63
     /* strspn(p, term) is nonzero exactly when *p is a terminator */
     while (*p && !strspn(p, term)) {
372e2884
         char c = *p++;
4333df63
         /* a backslash at the very end of the input falls through to the
          * last branch and is copied literally */
         if (c == '\\' && *p) {
372e2884
             *out++ = *p++;
4333df63
             end    = out;
         } else if (c == '\'') {
             while (*p && *p != '\'')
372e2884
                 *out++ = *p++;
4333df63
             /* only a closed quote protects its content from trimming */
             if (*p) {
372e2884
                 p++;
4333df63
                 end = out;
372e2884
             }
4333df63
         } else {
372e2884
             *out++ = c;
         }
     }
 
4333df63
     /* Terminate the string, then keep stepping backwards and overwriting
      * with NUL while the previous character is whitespace and lies at or
      * after end.
      * NOTE(review): when nothing was copied, out is decremented to one
      * position before the start of the buffer before the comparison. */
     do
372e2884
         *out-- = 0;
4333df63
     while (out >= end && strspn(out, WHITESPACES));
372e2884
 
     *buf = p;
 
     return ret;
 }
 
b35e9e19
 /**
  * Split a string into tokens separated by any of the characters in delim.
  * The input string is modified: the delimiter ending each token is
  * overwritten with NUL.
  *
  * @param s       string to tokenize on the first call, NULL on subsequent
  *                calls to continue from *saveptr
  * @param delim   set of delimiter characters
  * @param saveptr state kept between calls; set to NULL once the input is
  *                exhausted
  * @return the next token, or NULL when there are no more tokens
  */
 char *av_strtok(char *s, const char *delim, char **saveptr)
 {
     char *token, *stop;
 
     if (!s) {
         s = *saveptr;
         if (!s)
             return NULL;
     }
 
     /* the token starts at the first character that is not a delimiter */
     token = s + strspn(s, delim);
     if (*token == '\0') {
         *saveptr = NULL;
         return NULL;
     }
 
     /* token[0] is known to be a non-delimiter, so scan from token + 1 */
     stop = token + 1 + strcspn(token + 1, delim);
     if (*stop == '\0') {
         *saveptr = NULL;
     } else {
         *stop    = '\0';
         *saveptr = stop + 1;
     }
 
     return token;
 }
 
96949daf
 /**
  * Compare two strings after passing each character through av_tolower().
  *
  * @param a first string
  * @param b second string
  * @return 0 if the strings are equal, otherwise the difference between the
  *         first pair of differing lowercased characters, taken as unsigned
  *         8-bit values
  */
 int av_strcasecmp(const char *a, const char *b)
 {
     uint8_t ca, cb;
 
     for (;;) {
         ca = av_tolower(*a++);
         cb = av_tolower(*b++);
         /* stop at the end of a or at the first mismatch */
         if (!ca || ca != cb)
             break;
     }
     return ca - cb;
 }
 
 /**
  * Compare at most n characters of two strings after passing each character
  * through av_tolower().
  *
  * @param a first string
  * @param b second string
  * @param n maximum number of characters to compare
  * @return 0 if the compared ranges are equal (always the case for n == 0),
  *         otherwise the difference between the first pair of differing
  *         lowercased characters, taken as unsigned 8-bit values
  */
 int av_strncasecmp(const char *a, const char *b, size_t n)
 {
     uint8_t c1, c2;
 
     /* Nothing to compare: report equality without reading either string. */
     if (n == 0)
         return 0;
 
     /* Count n down instead of forming a + n, which may point far outside
      * the string when n is larger than its length. */
     do {
         c1 = av_tolower(*a++);
         c2 = av_tolower(*b++);
     } while (--n && c1 && c1 == c2);
     return c1 - c2;
 }
 
d8fd06c3
 /**
  * Return the part of path that follows the last directory separator.
  *
  * '/' is always treated as a separator; when HAVE_DOS_PATHS is set, the
  * last '\\' and the first ':' are considered as well.
  *
  * @param path NUL-terminated path
  * @return pointer into path just past the separator, or path itself when
  *         it contains no separator
  */
 const char *av_basename(const char *path)
 {
     char *sep = strrchr(path, '/');
 
 #if HAVE_DOS_PATHS
     char *bslash = strrchr(path, '\\');
     char *colon  = strchr(path, ':');
 
     sep = FFMAX3(sep, bslash, colon);
 #endif
 
     return sep ? sep + 1 : path;
 }
 
 /**
  * Return the directory part of path. The buffer is modified in place: the
  * last separator is overwritten with NUL.
  *
  * '/' is always treated as a separator; when HAVE_DOS_PATHS is set, the
  * last '\\' and the position after the first ':' are considered as well.
  *
  * @param path writable NUL-terminated path
  * @return path (now truncated at the separator), or the string "." when
  *         path contains no separator
  */
 const char *av_dirname(char *path)
 {
     char *sep = strrchr(path, '/');
 
 #if HAVE_DOS_PATHS
     char *bslash = strrchr(path, '\\');
     char *colon  = strchr(path, ':');
 
     /* cut after the colon so that the drive prefix is kept */
     if (colon)
         colon++;
 
     sep = FFMAX3(sep, bslash, colon);
 #endif
 
     if (sep) {
         *sep = '\0';
         return path;
     }
 
     return ".";
 }
 
9767ec6b
 /**
  * Escape src into a newly allocated string, delegating the escaping itself
  * to av_bprint_escape() on an unlimited-size AVBPrint buffer.
  *
  * @param dst           receives the escaped string on success
  * @param src           string to escape
  * @param special_chars forwarded unchanged to av_bprint_escape()
  * @param mode          forwarded unchanged to av_bprint_escape()
  * @param flags         forwarded unchanged to av_bprint_escape()
  * @return the length recorded in the print buffer on success,
  *         AVERROR(ENOMEM) if the buffer could not be completed
  */
 int av_escape(char **dst, const char *src, const char *special_chars,
               enum AVEscapeMode mode, int flags)
 {
     AVBPrint bp;
 
     av_bprint_init(&bp, 1, AV_BPRINT_SIZE_UNLIMITED);
     av_bprint_escape(&bp, src, special_chars, mode, flags);
 
     if (av_bprint_is_complete(&bp)) {
         av_bprint_finalize(&bp, dst);
         return bp.len;
     }
 
     /* incomplete buffer: release it without handing anything to the caller */
     av_bprint_finalize(&bp, NULL);
     return AVERROR(ENOMEM);
 }
 
12c5c1d3
 /**
  * Tell whether c is one of the characters '0' through '9'.
  *
  * @return 1 if so, 0 otherwise
  */
 int av_isdigit(int c)
 {
     if (c < '0')
         return 0;
     return c <= '9';
 }
 
 /**
  * Tell whether c lies strictly between 32 and 127.
  *
  * @return 1 if so, 0 otherwise
  */
 int av_isgraph(int c)
 {
     return !(c <= 32 || c >= 127);
 }
 
 /**
  * Tell whether c is a space, form feed, newline, carriage return,
  * horizontal tab or vertical tab.
  *
  * @return 1 if so, 0 otherwise
  */
 int av_isspace(int c)
 {
     switch (c) {
     case ' ':
     case '\f':
     case '\n':
     case '\r':
     case '\t':
     case '\v':
         return 1;
     default:
         return 0;
     }
 }
 
 /**
  * Tell whether c, after conversion with av_tolower(), is a decimal digit
  * or one of the letters 'a' through 'f'.
  *
  * @return 1 if so, 0 otherwise
  */
 int av_isxdigit(int c)
 {
     const int lc = av_tolower(c);
 
     if (av_isdigit(lc))
         return 1;
     return lc >= 'a' && lc <= 'f';
 }
 
69e7336b
 /**
  * Check whether name matches one of the entries of the comma-separated
  * list names, comparing with av_strncasecmp() / av_strcasecmp().
  *
  * @param name  name to look for; may be NULL
  * @param names comma-separated list of names; may be NULL
  * @return 1 on a match, 0 otherwise (including when either argument is
  *         NULL)
  */
 int av_match_name(const char *name, const char *names)
 {
     const char *comma;
     int name_len;
 
     if (!name || !names)
         return 0;
 
     name_len = strlen(name);
     for (comma = strchr(names, ','); comma; comma = strchr(names, ',')) {
         /* compare over the longer of the two so that a mere prefix of
          * either side does not count as a match */
         int cmp_len = FFMAX(comma - names, name_len);
 
         if (av_strncasecmp(name, names, cmp_len) == 0)
             return 1;
         names = comma + 1;
     }
 
     /* last (or only) entry: it runs to the end of the string */
     return av_strcasecmp(name, names) == 0;
 }
 
68590650
 int av_utf8_decode(int32_t *codep, const uint8_t **bufp, const uint8_t *buf_end,
                    unsigned int flags)
 {
     const uint8_t *p = *bufp;
     uint32_t top;
     uint64_t code;
d4ec07df
     int ret = 0, tail_len;
     uint32_t overlong_encoding_mins[6] = {
         0x00000000, 0x00000080, 0x00000800, 0x00010000, 0x00200000, 0x04000000,
     };
68590650
 
     if (p >= buf_end)
         return 0;
 
     code = *p++;
 
     /* first sequence byte starts with 10, or is 1111-1110 or 1111-1111,
        which is not admitted */
     if ((code & 0xc0) == 0x80 || code >= 0xFE) {
         ret = AVERROR(EILSEQ);
         goto end;
     }
     top = (code & 128) >> 1;
 
d4ec07df
     tail_len = 0;
68590650
     while (code & top) {
         int tmp;
d4ec07df
         tail_len++;
68590650
         if (p >= buf_end) {
a31547ce
             (*bufp) ++;
             return AVERROR(EILSEQ); /* incomplete sequence */
68590650
         }
 
         /* we assume the byte to be in the form 10xx-xxxx */
         tmp = *p++ - 128;   /* strip leading 1 */
         if (tmp>>6) {
a31547ce
             (*bufp) ++;
             return AVERROR(EILSEQ);
68590650
         }
         code = (code<<6) + tmp;
         top <<= 5;
     }
     code &= (top << 1) - 1;
 
d4ec07df
     /* check for overlong encodings */
     av_assert0(tail_len <= 5);
     if (code < overlong_encoding_mins[tail_len]) {
         ret = AVERROR(EILSEQ);
         goto end;
     }
 
68590650
     if (code >= 1<<31) {
         ret = AVERROR(EILSEQ);  /* out-of-range value */
         goto end;
     }
 
     *codep = code;
 
     if (code > 0x10FFFF &&
         !(flags & AV_UTF8_FLAG_ACCEPT_INVALID_BIG_CODES))
         ret = AVERROR(EILSEQ);
     if (code < 0x20 && code != 0x9 && code != 0xA && code != 0xD &&
         flags & AV_UTF8_FLAG_EXCLUDE_XML_INVALID_CONTROL_CODES)
         ret = AVERROR(EILSEQ);
     if (code >= 0xD800 && code <= 0xDFFF &&
         !(flags & AV_UTF8_FLAG_ACCEPT_SURROGATES))
         ret = AVERROR(EILSEQ);
9ab5cf54
     if ((code == 0xFFFE || code == 0xFFFF) &&
         !(flags & AV_UTF8_FLAG_ACCEPT_NON_CHARACTERS))
68590650
         ret = AVERROR(EILSEQ);
 
 end:
     *bufp = p;
     return ret;
 }
 
372e2884
 #ifdef TEST
 
 /*
  * Self-test driver: runs av_get_token() with ':' as the terminator over a
  * fixed list of inputs and prints, for each one, the input, the extracted
  * token and the unparsed remainder.
  */
 int main(void)
 {
     static const char * const strings[] = {
         "''",
         "",
         ":",
         "\\",
         "'",
         "    ''    :",
         "    ''  ''  :",
         "foo   '' :",
         "'foo'",
         "foo     ",
         "  '  foo  '  ",
         "foo\\",
         "foo':  blah:blah",
         "foo\\:  blah:blah",
         "foo\'",
         "'foo :  '  :blahblah",
         "\\ :blah",
         "     foo",
         "      foo       ",
         "      foo     \\ ",
         "foo ':blah",
         " foo   bar    :   blahblah",
         "\\f\\o\\o",
         "'foo : \\ \\  '   : blahblah",
         "'\\fo\\o:': blahblah",
         "\\'fo\\o\\:':  foo  '  :blahblah"
     };
     int n;
 
     printf("Testing av_get_token()\n");
     for (n = 0; n < FF_ARRAY_ELEMS(strings); n++) {
         const char *rest = strings[n];
         char *token;
 
         printf("|%s|", rest);
         /* rest is advanced to the terminator (or the end of the input) */
         token = av_get_token(&rest, ":");
         printf(" -> |%s|", token);
         printf(" + |%s|\n", rest);
         av_free(token);
     }
 
     return 0;
 }
 
 #endif /* TEST */