scrcpy/app/src/util/str_util.c

#include "str_util.h"

#include <errno.h>
#include <limits.h>
#include <stdlib.h>
#include <string.h>

#ifdef _WIN32
# include <windows.h>
# include <tchar.h>
#endif

// Bounded string copy that always NUL-terminates dest when n > 0.
//
// At most n - 1 characters of src are copied into dest, followed by a
// terminator.
//
// Returns the number of characters written (terminator excluded) if src fit
// entirely, or n if it had to be truncated. When n is 0, nothing is written
// and 0 is returned.
size_t
xstrncpy(char *dest, const char *src, size_t n) {
    if (n == 0) {
        // "n - 1" below would wrap around to SIZE_MAX, and the loop would
        // copy the whole of src into a buffer that has no room at all
        return 0;
    }

    size_t i;
    for (i = 0; i < n - 1 && src[i] != '\0'; ++i) {
        dest[i] = src[i];
    }
    dest[i] = '\0';

    // if the loop stopped before the end of src, the copy was truncated
    return src[i] == '\0' ? i : n;
}

// Join the NULL-terminated array of strings `tokens` into dst, inserting
// `sep` between consecutive tokens. dst has a capacity of n bytes.
//
// Whenever n > 0, dst is NUL-terminated on return (including when `tokens`
// is empty or the result is truncated).
//
// Returns the length of the joined string (terminator excluded) if it fit
// entirely, or n if it had to be truncated. When n is 0, nothing is written
// and 0 is returned.
size_t
xstrjoin(char *dst, const char *const tokens[], char sep, size_t n) {
    if (n == 0) {
        // not even room for the terminator: "dst[n - 1]" would be out of
        // bounds
        return 0;
    }

    // keep dst a valid string even if there is no token at all
    dst[0] = '\0';

    // invariant at the top of each iteration: i < n
    size_t i = 0;
    for (const char *const *cur = tokens; *cur; ++cur) {
        if (cur != tokens) {
            // a separator precedes every token but the first one, even when
            // the previous tokens were empty strings
            dst[i++] = sep;
            if (i == n)
                goto truncated;
        }

        size_t room = n - i; // >= 1, terminator included
        size_t len = strlen(*cur);
        if (len >= room) {
            // copy what fits, the terminator is written below
            memcpy(dst + i, *cur, room - 1);
            goto truncated;
        }

        memcpy(dst + i, *cur, len + 1); // terminator included
        i += len;
    }
    return i;

truncated:
    dst[n - 1] = '\0';
    return n;
}

// Return a newly allocated copy of src surrounded by double quotes.
//
// The content of src is copied verbatim (nothing is escaped). The caller
// owns the result and must release it with free(). Returns NULL if the
// allocation fails.
char *
strquote(const char *src) {
    const size_t src_len = strlen(src);

    // room for the two quote characters and the terminator
    char *result = malloc(src_len + 3);
    if (result == NULL) {
        return NULL;
    }

    char *cursor = result;
    *cursor++ = '"';
    memcpy(cursor, src, src_len);
    cursor += src_len;
    *cursor++ = '"';
    *cursor = '\0';

    return result;
}

// Parse the whole string s as a long integer.
//
// The base is auto-detected by strtol() (base argument 0). The string must
// be non-empty and must not contain anything after the number.
//
// On success, the value is stored in *out and true is returned. On failure
// (empty string, out-of-range value, trailing characters), false is returned
// and *out is left untouched.
bool
parse_integer(const char *s, long *out) {
    if (!*s) {
        return false;
    }

    char *end = NULL;
    errno = 0;
    const long parsed = strtol(s, &end, 0);

    // reject values that do not fit in a long and partially parsed strings
    const bool ok = errno != ERANGE && *end == '\0';
    if (ok) {
        *out = parsed;
    }
    return ok;
}

// Parse a list of integers separated by `sep` (for example "1234:5678").
//
// Each item is parsed by strtol() with an auto-detected base. At most
// max_items values are written to out.
//
// Returns the number of items parsed, or 0 on error: empty or malformed
// item, out-of-range value, more than max_items items, or max_items == 0.
// On error, the content of out is unspecified (some items may already have
// been written).
size_t
parse_integers(const char *s, const char sep, size_t max_items, long *out) {
    if (max_items == 0) {
        // out has no room at all, do not write out[0]
        return 0;
    }

    size_t count = 0;
    for (;;) {
        char *endptr;
        errno = 0;
        long value = strtol(s, &endptr, 0);
        if (errno == ERANGE) {
            return 0;
        }

        if (endptr == s || (*endptr != sep && *endptr != '\0')) {
            // nothing parsed, or unexpected character after the number
            return 0;
        }

        // count < max_items is guaranteed here
        out[count++] = value;

        // test the end of string before the separator, so that the parser
        // never steps past the terminator, even if sep is '\0'
        if (*endptr == '\0') {
            return count;
        }

        if (count >= max_items) {
            // max items already reached, could not accept a new item
            return 0;
        }

        // parse the next token during the next iteration
        s = endptr + 1;
    }
}

// Parse the whole string s as a long integer, optionally followed by a
// single multiplier suffix: 'k' or 'K' (x1000), 'm' or 'M' (x1000000).
//
// The base of the number is auto-detected by strtol() (base argument 0).
//
// On success, the (multiplied) value is stored in *out and true is returned.
// On failure (empty string, no digits, unknown or trailing characters,
// value out of the range of a long before or after multiplication), false
// is returned and *out is left untouched.
bool
parse_integer_with_suffix(const char *s, long *out) {
    if (!*s) {
        return false;
    }

    char *end;
    errno = 0;
    const long base = strtol(s, &end, 0);
    if (errno == ERANGE) {
        return false;
    }

    long factor = 1;
    if (*end) {
        // something follows the number: it must be exactly one suffix
        // character, and the number itself must not be empty
        if (end == s || end[1] != '\0') {
            return false;
        }

        switch (*end) {
            case 'M':
            case 'm':
                factor = 1000000;
                break;
            case 'K':
            case 'k':
                factor = 1000;
                break;
            default:
                return false;
        }
    }

    // detect the overflow before multiplying
    const bool overflow = base > 0 ? base > LONG_MAX / factor
                                   : base < LONG_MIN / factor;
    if (overflow) {
        return false;
    }

    *out = base * factor;
    return true;
}

// Indicate whether the list of tokens `list`, separated by `sep`, contains
// a token strictly equal to s.
//
// For example, with sep == ',', the list "a,bc,def" contains "bc" but
// neither "b" nor "bcd". An empty token (as in "a,,b" or in an empty list)
// only matches an empty s.
bool
strlist_contains(const char *list, char sep, const char *s) {
    const size_t s_len = strlen(s);

    const char *p;
    do {
        p = strchr(list, sep);

        size_t token_len = p ? (size_t) (p - list) : strlen(list);
        // compare the lengths too: comparing only the first token_len
        // characters would accept any s merely starting with the token
        if (token_len == s_len && !memcmp(list, s, token_len)) {
            return true;
        }

        if (p) {
            // continue after the separator
            list = p + 1;
        }
    } while (p);
    return false;
}

// Return the length, in bytes, at which the UTF-8 string utf8 may be cut so
// that the result is at most max_len bytes long and does not end in the
// middle of a multi-byte sequence.
//
// If the string is not longer than max_len, its full length is returned.
size_t
utf8_truncation_index(const char *utf8, size_t max_len) {
    size_t len = strlen(utf8);
    if (len <= max_len) {
        return len;
    }
    len = max_len;
    // see UTF-8 encoding <https://en.wikipedia.org/wiki/UTF-8#Description>
    // A continuation byte has the form 10xxxxxx. The "len > 0" bound stops
    // the scan on invalid input made only of continuation bytes, instead of
    // wrapping the index around below zero.
    while (len > 0 && (utf8[len] & 0xc0) == 0x80) {
        // the next byte is not the start of a new UTF-8 codepoint
        // so if we would cut there, the character would be truncated
        len--;
    }
    return len;
}

#ifdef _WIN32

// Convert a NUL-terminated UTF-8 string to a newly allocated wide char
// string.
//
// The caller owns the result and must release it with free(). Returns NULL
// if the conversion or the allocation fails.
wchar_t *
utf8_to_wide_char(const char *utf8) {
    // first call: only request the required size, in wide chars (the input
    // length is passed as -1, so the terminator is processed too)
    int len = MultiByteToWideChar(CP_UTF8, 0, utf8, -1, NULL, 0);
    if (len <= 0) {
        return NULL;
    }

    wchar_t *wide = malloc(len * sizeof(*wide));
    if (!wide) {
        return NULL;
    }

    // second call: actual conversion; on failure, do not return a buffer
    // with unspecified content
    if (!MultiByteToWideChar(CP_UTF8, 0, utf8, -1, wide, len)) {
        free(wide);
        return NULL;
    }
    return wide;
}

// Convert a NUL-terminated wide char string to a newly allocated UTF-8
// string.
//
// The caller owns the result and must release it with free(). Returns NULL
// if the conversion or the allocation fails.
char *
utf8_from_wide_char(const wchar_t *ws) {
    // first call: only request the required size, in bytes (the input
    // length is passed as -1, so the terminator is processed too)
    int len = WideCharToMultiByte(CP_UTF8, 0, ws, -1, NULL, 0, NULL, NULL);
    if (len <= 0) {
        return NULL;
    }

    char *utf8 = malloc(len);
    if (!utf8) {
        return NULL;
    }

    // second call: actual conversion; on failure, do not return a buffer
    // with unspecified content
    if (!WideCharToMultiByte(CP_UTF8, 0, ws, -1, utf8, len, NULL, NULL)) {
        free(utf8);
        return NULL;
    }
    return utf8;
}

#endif
Separate multi-words filenames by '_' Rename foobar.ext to foo_bar.ext. <https://github.com/Genymobile/scrcpy/pull/226#discussion_r209454865> 2018-08-15 23:01:54 +08:00			`#include "str_util.h"`
Initial commit Start a new clean history from here. 2017-12-12 22:12:07 +08:00
Factorize integer argument parsing Add util functions for integer parsing (with tests), and factorize integer argument parsing to avoid code duplication. 2019-12-07 18:01:55 +08:00			`#include <errno.h>`
			`#include <limits.h>`
Support paths containing spaces on Windows Quote the arguments of "adb push" to support paths which contain spaces on Windows. Fixes <https://github.com/Genymobile/scrcpy/issues/288>. 2018-10-05 02:47:53 +08:00			`#include <stdlib.h>`
			`#include <string.h>`

Create process with wide chars on Windows Windows does not support UTF-8, so pushing a file with non-ASCII characters failed. Convert the UTF-8 command line to a wide characters string and call CreateProcessW(). Fixes <https://github.com/Genymobile/scrcpy/issues/422> 2019-02-10 19:53:03 +08:00			`#ifdef _WIN32`
			`# include <windows.h>`
			`# include <tchar.h>`
			`#endif`

Update code style Limit source code to 80 chars, and declare functions return type and modifiers on a separate line. This allows to avoid very long lines, and all function names are aligned. (We do this on VLC, and I like it.) 2019-03-03 03:09:56 +08:00			`size_t`
			`xstrncpy(char *dest, const char *src, size_t n) {`
Initial commit Start a new clean history from here. 2017-12-12 22:12:07 +08:00			`size_t i;`
			`for (i = 0; i < n - 1 && src[i] != '\0'; ++i)`
			`dest[i] = src[i];`
			`if (n)`
			`dest[i] = '\0';`
			`return src[i] == '\0' ? i : n;`
			`}`

Update code style Limit source code to 80 chars, and declare functions return type and modifiers on a separate line. This allows to avoid very long lines, and all function names are aligned. (We do this on VLC, and I like it.) 2019-03-03 03:09:56 +08:00			`size_t`
			`xstrjoin(char *dst, const char *const tokens[], char sep, size_t n) {`
Initial commit Start a new clean history from here. 2017-12-12 22:12:07 +08:00			`const char *const *remaining = tokens;`
			`const char *token = *remaining++;`
			`size_t i = 0;`
			`while (token) {`
			`if (i) {`
			`dst[i++] = sep;`
			`if (i == n)`
			`goto truncated;`
			`}`
			`size_t w = xstrncpy(dst + i, token, n - i);`
			`if (w >= n - i)`
			`goto truncated;`
			`i += w;`
			`token = *remaining++;`
			`}`
			`return i;`

			`truncated:`
			`dst[n - 1] = '\0';`
			`return n;`
			`}`
Support paths containing spaces on Windows Quote the arguments of "adb push" to support paths which contain spaces on Windows. Fixes <https://github.com/Genymobile/scrcpy/issues/288>. 2018-10-05 02:47:53 +08:00
Update code style Limit source code to 80 chars, and declare functions return type and modifiers on a separate line. This allows to avoid very long lines, and all function names are aligned. (We do this on VLC, and I like it.) 2019-03-03 03:09:56 +08:00			`char *`
			`strquote(const char *src) {`
Support paths containing spaces on Windows Quote the arguments of "adb push" to support paths which contain spaces on Windows. Fixes <https://github.com/Genymobile/scrcpy/issues/288>. 2018-10-05 02:47:53 +08:00			`size_t len = strlen(src);`
Replace SDL_strdup() by strdup() The functions SDL_malloc(), SDL_free() and SDL_strdup() were used only because strdup() was not available everywhere. Now that it is available, use the native version of these functions. 2021-01-24 22:14:53 +08:00			`char *quoted = malloc(len + 3);`
Support paths containing spaces on Windows Quote the arguments of "adb push" to support paths which contain spaces on Windows. Fixes <https://github.com/Genymobile/scrcpy/issues/288>. 2018-10-05 02:47:53 +08:00			`if (!quoted) {`
			`return NULL;`
			`}`
			`memcpy(&quoted[1], src, len);`
			`quoted[0] = '"';`
			`quoted[len + 1] = '"';`
			`quoted[len + 2] = '\0';`
			`return quoted;`
			`}`
Create process with wide chars on Windows Windows does not support UTF-8, so pushing a file with non-ASCII characters failed. Convert the UTF-8 command line to a wide characters string and call CreateProcessW(). Fixes <https://github.com/Genymobile/scrcpy/issues/422> 2019-02-10 19:53:03 +08:00
Factorize integer argument parsing Add util functions for integer parsing (with tests), and factorize integer argument parsing to avoid code duplication. 2019-12-07 18:01:55 +08:00			`bool`
			`parse_integer(const char *s, long *out) {`
			`char *endptr;`
			`if (*s == '\0') {`
			`return false;`
			`}`
			`errno = 0;`
			`long value = strtol(s, &endptr, 0);`
			`if (errno == ERANGE) {`
			`return false;`
			`}`
			`if (*endptr != '\0') {`
			`return false;`
			`}`

			`*out = value;`
			`return true;`
			`}`

Add util function to parse a list of integers This will help parsing arguments like '1234:5678' into a list of integers. 2019-12-09 21:32:59 +08:00			`size_t`
			`parse_integers(const char *s, const char sep, size_t max_items, long *out) {`
			`size_t count = 0;`
			`char *endptr;`
			`do {`
			`errno = 0;`
			`long value = strtol(s, &endptr, 0);`
			`if (errno == ERANGE) {`
			`return 0;`
			`}`

			`if (endptr == s || (*endptr != sep && *endptr != '\0')) {`
			`return 0;`
			`}`

			`out[count++] = value;`
			`if (*endptr == sep) {`
			`if (count >= max_items) {`
			`// max items already reached, could not accept a new item`
			`return 0;`
			`}`
			`// parse the next token during the next iteration`
			`s = endptr + 1;`
			`}`
			`} while (*endptr != '\0');`

			`return count;`
			`}`

Factorize integer argument parsing Add util functions for integer parsing (with tests), and factorize integer argument parsing to avoid code duplication. 2019-12-07 18:01:55 +08:00			`bool`
			`parse_integer_with_suffix(const char *s, long *out) {`
			`char *endptr;`
			`if (*s == '\0') {`
			`return false;`
			`}`
			`errno = 0;`
			`long value = strtol(s, &endptr, 0);`
			`if (errno == ERANGE) {`
			`return false;`
			`}`
			`int mul = 1;`
			`if (*endptr != '\0') {`
			`if (s == endptr) {`
			`return false;`
			`}`
			`if ((*endptr == 'M' || *endptr == 'm') && endptr[1] == '\0') {`
			`mul = 1000000;`
			`} else if ((*endptr == 'K' || *endptr == 'k') && endptr[1] == '\0') {`
			`mul = 1000;`
			`} else {`
			`return false;`
			`}`
			`}`

			`if ((value < 0 && LONG_MIN / mul > value) ||`
			`(value > 0 && LONG_MAX / mul < value)) {`
			`return false;`
			`}`

			`*out = value * mul;`
			`return true;`
			`}`

Add strlist_contains() Add a function to know if a string list, using some separator, contains a specific string. 2021-04-19 15:22:53 +08:00			`bool`
			`strlist_contains(const char *list, char sep, const char *s) {`
			`char *p;`
			`do {`
			`p = strchr(list, sep);`

			`size_t token_len = p ? (size_t) (p - list) : strlen(list);`
			`if (!strncmp(list, s, token_len)) {`
			`return true;`
			`}`

			`if (p) {`
			`list = p + 1;`
			`}`
			`} while (p);`
			`return false;`
			`}`

Add helpers to truncate UTF-8 at code points This will help to avoid truncating a UTF-8 string in the middle of a code point, producing an invalid UTF-8 result. 2019-05-31 01:01:08 +08:00			`size_t`
			`utf8_truncation_index(const char *utf8, size_t max_len) {`
			`size_t len = strlen(utf8);`
			`if (len <= max_len) {`
			`return len;`
			`}`
			`len = max_len;`
			`// see UTF-8 encoding <https://en.wikipedia.org/wiki/UTF-8#Description>`
			`while ((utf8[len] & 0x80) != 0 && (utf8[len] & 0xc0) != 0xc0) {`
			`// the next byte is not the start of a new UTF-8 codepoint`
			`// so if we would cut there, the character would be truncated`
			`len--;`
			`}`
			`return len;`
			`}`

Create process with wide chars on Windows Windows does not support UTF-8, so pushing a file with non-ASCII characters failed. Convert the UTF-8 command line to a wide characters string and call CreateProcessW(). Fixes <https://github.com/Genymobile/scrcpy/issues/422> 2019-02-10 19:53:03 +08:00			`#ifdef _WIN32`

Update code style Limit source code to 80 chars, and declare functions return type and modifiers on a separate line. This allows to avoid very long lines, and all function names are aligned. (We do this on VLC, and I like it.) 2019-03-03 03:09:56 +08:00			`wchar_t *`
			`utf8_to_wide_char(const char *utf8) {`
Create process with wide chars on Windows Windows does not support UTF-8, so pushing a file with non-ASCII characters failed. Convert the UTF-8 command line to a wide characters string and call CreateProcessW(). Fixes <https://github.com/Genymobile/scrcpy/issues/422> 2019-02-10 19:53:03 +08:00			`int len = MultiByteToWideChar(CP_UTF8, 0, utf8, -1, NULL, 0);`
			`if (!len) {`
			`return NULL;`
			`}`

Replace SDL_strdup() by strdup() The functions SDL_malloc(), SDL_free() and SDL_strdup() were used only because strdup() was not available everywhere. Now that it is available, use the native version of these functions. 2021-01-24 22:14:53 +08:00			`wchar_t *wide = malloc(len * sizeof(wchar_t));`
Create process with wide chars on Windows Windows does not support UTF-8, so pushing a file with non-ASCII characters failed. Convert the UTF-8 command line to a wide characters string and call CreateProcessW(). Fixes <https://github.com/Genymobile/scrcpy/issues/422> 2019-02-10 19:53:03 +08:00			`if (!wide) {`
			`return NULL;`
			`}`

			`MultiByteToWideChar(CP_UTF8, 0, utf8, -1, wide, len);`
			`return wide;`
			`}`

Add functions to convert wide char to UTF-8 There was already utf8_to_wide_char(), used to correctly execute commands on Windows. Add the reverse converter: utf8_from_wide_char(). We will need it to build the scrcpy-server path based on the executable directory. 2019-06-10 21:44:45 +08:00			`char *`
			`utf8_from_wide_char(const wchar_t *ws) {`
			`int len = WideCharToMultiByte(CP_UTF8, 0, ws, -1, NULL, 0, NULL, NULL);`
			`if (!len) {`
			`return NULL;`
			`}`

Replace SDL_strdup() by strdup() The functions SDL_malloc(), SDL_free() and SDL_strdup() were used only because strdup() was not available everywhere. Now that it is available, use the native version of these functions. 2021-01-24 22:14:53 +08:00			`char *utf8 = malloc(len);`
Add functions to convert wide char to UTF-8 There was already utf8_to_wide_char(), used to correctly execute commands on Windows. Add the reverse converter: utf8_from_wide_char(). We will need it to build the scrcpy-server path based on the executable directory. 2019-06-10 21:44:45 +08:00			`if (!utf8) {`
			`return NULL;`
			`}`

			`WideCharToMultiByte(CP_UTF8, 0, ws, -1, utf8, len, NULL, NULL);`
			`return utf8;`
			`}`

Create process with wide chars on Windows Windows does not support UTF-8, so pushing a file with non-ASCII characters failed. Convert the UTF-8 command line to a wide characters string and call CreateProcessW(). Fixes <https://github.com/Genymobile/scrcpy/issues/422> 2019-02-10 19:53:03 +08:00			`#endif`