2020-09-06 16:53:08 +00:00
|
|
|
/*
|
|
|
|
* C utilities
|
2023-11-12 09:01:40 +00:00
|
|
|
*
|
2020-09-06 16:53:08 +00:00
|
|
|
* Copyright (c) 2017 Fabrice Bellard
|
|
|
|
* Copyright (c) 2018 Charlie Gordon
|
|
|
|
*
|
|
|
|
* Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
|
|
* of this software and associated documentation files (the "Software"), to deal
|
|
|
|
* in the Software without restriction, including without limitation the rights
|
|
|
|
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
|
|
* copies of the Software, and to permit persons to whom the Software is
|
|
|
|
* furnished to do so, subject to the following conditions:
|
|
|
|
*
|
|
|
|
* The above copyright notice and this permission notice shall be included in
|
|
|
|
* all copies or substantial portions of the Software.
|
|
|
|
*
|
|
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
|
|
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
|
|
* THE SOFTWARE.
|
|
|
|
*/
|
|
|
|
#ifndef CUTILS_H
|
|
|
|
#define CUTILS_H
|
|
|
|
|
|
|
|
#include <stdlib.h>
|
2024-02-18 12:39:33 +00:00
|
|
|
#include <string.h>
|
2020-09-06 16:53:08 +00:00
|
|
|
#include <inttypes.h>
|
2024-09-03 18:32:17 +00:00
|
|
|
#include <math.h>
|
2020-09-06 16:53:08 +00:00
|
|
|
|
2024-07-01 10:30:20 +00:00
|
|
|
#ifdef __cplusplus
|
|
|
|
extern "C" {
|
|
|
|
#endif
|
|
|
|
|
2024-04-02 19:50:42 +00:00
|
|
|
#if defined(_MSC_VER)
|
2023-11-22 08:36:53 +00:00
|
|
|
#include <winsock2.h>
|
|
|
|
#include <malloc.h>
|
|
|
|
#define alloca _alloca
|
|
|
|
#define ssize_t ptrdiff_t
|
|
|
|
#endif
|
2023-12-05 09:46:40 +00:00
|
|
|
#if defined(__APPLE__)
|
|
|
|
#include <malloc/malloc.h>
|
2024-03-12 08:06:07 +00:00
|
|
|
#elif defined(__linux__) || defined(__ANDROID__) || defined(__CYGWIN__)
|
2023-12-05 09:46:40 +00:00
|
|
|
#include <malloc.h>
|
|
|
|
#elif defined(__FreeBSD__)
|
|
|
|
#include <malloc_np.h>
|
2024-09-09 19:48:05 +00:00
|
|
|
#elif defined(_WIN32)
|
|
|
|
#include <windows.h>
|
2023-12-05 09:46:40 +00:00
|
|
|
#endif
|
2024-10-07 20:08:31 +00:00
|
|
|
#if !defined(_WIN32) && !defined(EMSCRIPTEN) && !defined(__wasi__)
|
2024-04-02 19:50:42 +00:00
|
|
|
#include <errno.h>
|
|
|
|
#include <pthread.h>
|
|
|
|
#endif
|
2024-01-16 11:42:05 +00:00
|
|
|
|
2024-10-29 18:54:33 +00:00
|
|
|
#if defined(__SANITIZE_ADDRESS__)
|
|
|
|
# define __ASAN__ 1
|
|
|
|
#elif defined(__has_feature)
|
|
|
|
# if __has_feature(address_sanitizer)
|
|
|
|
# define __ASAN__ 1
|
|
|
|
# endif
|
|
|
|
#endif
|
|
|
|
|
2024-01-16 11:42:05 +00:00
|
|
|
#if defined(_MSC_VER) && !defined(__clang__)
|
|
|
|
# define likely(x) (x)
|
|
|
|
# define unlikely(x) (x)
|
|
|
|
# define force_inline __forceinline
|
|
|
|
# define no_inline __declspec(noinline)
|
|
|
|
# define __maybe_unused
|
|
|
|
# define __attribute__(x)
|
|
|
|
# define __attribute(x)
|
|
|
|
# include <intrin.h>
|
|
|
|
static void *__builtin_frame_address(unsigned int level) {
|
|
|
|
return (void *)((char*)_AddressOfReturnAddress() - sizeof(int *) - level * sizeof(int *));
|
|
|
|
}
|
|
|
|
#else
|
|
|
|
# define likely(x) __builtin_expect(!!(x), 1)
|
|
|
|
# define unlikely(x) __builtin_expect(!!(x), 0)
|
|
|
|
# define force_inline inline __attribute__((always_inline))
|
|
|
|
# define no_inline __attribute__((noinline))
|
|
|
|
# define __maybe_unused __attribute__((unused))
|
|
|
|
#endif
|
|
|
|
|
|
|
|
// https://stackoverflow.com/a/6849629
|
|
|
|
#undef FORMAT_STRING
|
|
|
|
#if _MSC_VER >= 1400
|
|
|
|
# include <sal.h>
|
|
|
|
# if _MSC_VER > 1400
|
|
|
|
# define FORMAT_STRING(p) _Printf_format_string_ p
|
|
|
|
# else
|
|
|
|
# define FORMAT_STRING(p) __format_string p
|
|
|
|
# endif /* FORMAT_STRING */
|
|
|
|
#else
|
|
|
|
# define FORMAT_STRING(p) p
|
|
|
|
#endif /* _MSC_VER */
|
|
|
|
|
|
|
|
#if defined(_MSC_VER) && !defined(__clang__)
|
|
|
|
#include <math.h>
|
|
|
|
#define INF INFINITY
|
|
|
|
#define NEG_INF -INFINITY
|
|
|
|
#else
|
|
|
|
#define INF (1.0/0.0)
|
|
|
|
#define NEG_INF (-1.0/0.0)
|
|
|
|
#endif
|
2020-09-06 16:53:08 +00:00
|
|
|
|
|
|
|
#ifndef offsetof
|
|
|
|
#define offsetof(type, field) ((size_t) &((type *)0)->field)
|
|
|
|
#endif
|
|
|
|
#ifndef countof
|
|
|
|
#define countof(x) (sizeof(x) / sizeof((x)[0]))
|
2023-11-29 08:12:02 +00:00
|
|
|
#ifndef endof
|
|
|
|
#define endof(x) ((x) + countof(x))
|
|
|
|
#endif
|
2020-09-06 16:53:08 +00:00
|
|
|
#endif
|
2023-12-22 20:51:53 +00:00
|
|
|
#ifndef container_of
|
|
|
|
/* return the pointer of type 'type *' containing 'ptr' as field 'member' */
|
|
|
|
#define container_of(ptr, type, member) ((type *)((uint8_t *)(ptr) - offsetof(type, member)))
|
|
|
|
#endif
|
2020-09-06 16:53:08 +00:00
|
|
|
|
2024-10-11 07:36:11 +00:00
|
|
|
#if defined(_MSC_VER)
|
|
|
|
#define minimum_length(n) n
|
2024-03-10 09:34:26 +00:00
|
|
|
#else
|
2024-10-11 07:36:11 +00:00
|
|
|
#define minimum_length(n) static n
|
2024-03-10 09:34:26 +00:00
|
|
|
#endif
|
|
|
|
|
2020-09-06 16:53:08 +00:00
|
|
|
typedef int BOOL;
|
|
|
|
|
|
|
|
#ifndef FALSE
|
|
|
|
enum {
|
|
|
|
FALSE = 0,
|
|
|
|
TRUE = 1,
|
|
|
|
};
|
|
|
|
#endif
|
|
|
|
|
2024-12-15 10:01:16 +00:00
|
|
|
void js__pstrcpy(char *buf, int buf_size, const char *str);
|
|
|
|
char *js__pstrcat(char *buf, int buf_size, const char *s);
|
|
|
|
int js__strstart(const char *str, const char *val, const char **ptr);
|
|
|
|
int js__has_suffix(const char *str, const char *suffix);
|
2020-09-06 16:53:08 +00:00
|
|
|
|
2024-04-19 09:35:44 +00:00
|
|
|
static inline uint8_t is_be(void) {
|
|
|
|
union {
|
|
|
|
uint16_t a;
|
|
|
|
uint8_t b;
|
|
|
|
} u = { 0x100 };
|
|
|
|
return u.b;
|
|
|
|
}
|
|
|
|
|
2020-09-06 16:53:08 +00:00
|
|
|
static inline int max_int(int a, int b)
|
|
|
|
{
|
|
|
|
if (a > b)
|
|
|
|
return a;
|
|
|
|
else
|
|
|
|
return b;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline int min_int(int a, int b)
|
|
|
|
{
|
|
|
|
if (a < b)
|
|
|
|
return a;
|
|
|
|
else
|
|
|
|
return b;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline uint32_t max_uint32(uint32_t a, uint32_t b)
|
|
|
|
{
|
|
|
|
if (a > b)
|
|
|
|
return a;
|
|
|
|
else
|
|
|
|
return b;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline uint32_t min_uint32(uint32_t a, uint32_t b)
|
|
|
|
{
|
|
|
|
if (a < b)
|
|
|
|
return a;
|
|
|
|
else
|
|
|
|
return b;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline int64_t max_int64(int64_t a, int64_t b)
|
|
|
|
{
|
|
|
|
if (a > b)
|
|
|
|
return a;
|
|
|
|
else
|
|
|
|
return b;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline int64_t min_int64(int64_t a, int64_t b)
|
|
|
|
{
|
|
|
|
if (a < b)
|
|
|
|
return a;
|
|
|
|
else
|
|
|
|
return b;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* WARNING: undefined if a = 0 */
|
|
|
|
static inline int clz32(unsigned int a)
|
|
|
|
{
|
2024-01-16 11:42:05 +00:00
|
|
|
#if defined(_MSC_VER) && !defined(__clang__)
|
|
|
|
unsigned long index;
|
|
|
|
_BitScanReverse(&index, a);
|
|
|
|
return 31 - index;
|
|
|
|
#else
|
2020-09-06 16:53:08 +00:00
|
|
|
return __builtin_clz(a);
|
2024-01-16 11:42:05 +00:00
|
|
|
#endif
|
2020-09-06 16:53:08 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/* WARNING: undefined if a = 0 */
|
|
|
|
static inline int clz64(uint64_t a)
|
|
|
|
{
|
2024-01-16 11:42:05 +00:00
|
|
|
#if defined(_MSC_VER) && !defined(__clang__)
|
2024-06-15 13:04:42 +00:00
|
|
|
#if INTPTR_MAX == INT64_MAX
|
2024-01-16 11:42:05 +00:00
|
|
|
unsigned long index;
|
|
|
|
_BitScanReverse64(&index, a);
|
|
|
|
return 63 - index;
|
2024-06-15 13:04:42 +00:00
|
|
|
#else
|
|
|
|
if (a >> 32)
|
|
|
|
return clz32((unsigned)(a >> 32));
|
|
|
|
else
|
|
|
|
return clz32((unsigned)a) + 32;
|
2024-07-01 10:30:20 +00:00
|
|
|
#endif
|
2024-01-16 11:42:05 +00:00
|
|
|
#else
|
2020-09-06 16:53:08 +00:00
|
|
|
return __builtin_clzll(a);
|
2024-01-16 11:42:05 +00:00
|
|
|
#endif
|
2020-09-06 16:53:08 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/* WARNING: undefined if a = 0 */
|
|
|
|
static inline int ctz32(unsigned int a)
|
|
|
|
{
|
2024-01-16 11:42:05 +00:00
|
|
|
#if defined(_MSC_VER) && !defined(__clang__)
|
|
|
|
unsigned long index;
|
|
|
|
_BitScanForward(&index, a);
|
|
|
|
return index;
|
|
|
|
#else
|
2020-09-06 16:53:08 +00:00
|
|
|
return __builtin_ctz(a);
|
2024-01-16 11:42:05 +00:00
|
|
|
#endif
|
2020-09-06 16:53:08 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/* WARNING: undefined if a = 0 */
|
|
|
|
static inline int ctz64(uint64_t a)
|
|
|
|
{
|
2024-01-16 11:42:05 +00:00
|
|
|
#if defined(_MSC_VER) && !defined(__clang__)
|
|
|
|
unsigned long index;
|
|
|
|
_BitScanForward64(&index, a);
|
|
|
|
return index;
|
|
|
|
#else
|
2020-09-06 16:53:08 +00:00
|
|
|
return __builtin_ctzll(a);
|
2024-01-16 11:42:05 +00:00
|
|
|
#endif
|
2020-09-06 16:53:08 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline uint64_t get_u64(const uint8_t *tab)
|
|
|
|
{
|
2024-02-18 12:39:33 +00:00
|
|
|
uint64_t v;
|
|
|
|
memcpy(&v, tab, sizeof(v));
|
|
|
|
return v;
|
2020-09-06 16:53:08 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline int64_t get_i64(const uint8_t *tab)
|
|
|
|
{
|
2024-02-18 12:39:33 +00:00
|
|
|
int64_t v;
|
|
|
|
memcpy(&v, tab, sizeof(v));
|
|
|
|
return v;
|
2020-09-06 16:53:08 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline void put_u64(uint8_t *tab, uint64_t val)
|
|
|
|
{
|
2024-02-18 12:39:33 +00:00
|
|
|
memcpy(tab, &val, sizeof(val));
|
2020-09-06 16:53:08 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline uint32_t get_u32(const uint8_t *tab)
|
|
|
|
{
|
2024-02-18 12:39:33 +00:00
|
|
|
uint32_t v;
|
|
|
|
memcpy(&v, tab, sizeof(v));
|
|
|
|
return v;
|
2020-09-06 16:53:08 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline int32_t get_i32(const uint8_t *tab)
|
|
|
|
{
|
2024-02-18 12:39:33 +00:00
|
|
|
int32_t v;
|
|
|
|
memcpy(&v, tab, sizeof(v));
|
|
|
|
return v;
|
2020-09-06 16:53:08 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline void put_u32(uint8_t *tab, uint32_t val)
|
|
|
|
{
|
2024-02-18 12:39:33 +00:00
|
|
|
memcpy(tab, &val, sizeof(val));
|
2020-09-06 16:53:08 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline uint32_t get_u16(const uint8_t *tab)
|
|
|
|
{
|
2024-02-18 12:39:33 +00:00
|
|
|
uint16_t v;
|
|
|
|
memcpy(&v, tab, sizeof(v));
|
|
|
|
return v;
|
2020-09-06 16:53:08 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline int32_t get_i16(const uint8_t *tab)
|
|
|
|
{
|
2024-02-18 12:39:33 +00:00
|
|
|
int16_t v;
|
|
|
|
memcpy(&v, tab, sizeof(v));
|
|
|
|
return v;
|
2020-09-06 16:53:08 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline void put_u16(uint8_t *tab, uint16_t val)
|
|
|
|
{
|
2024-02-18 12:39:33 +00:00
|
|
|
memcpy(tab, &val, sizeof(val));
|
2020-09-06 16:53:08 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline uint32_t get_u8(const uint8_t *tab)
|
|
|
|
{
|
|
|
|
return *tab;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline int32_t get_i8(const uint8_t *tab)
|
|
|
|
{
|
|
|
|
return (int8_t)*tab;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void put_u8(uint8_t *tab, uint8_t val)
|
|
|
|
{
|
|
|
|
*tab = val;
|
|
|
|
}
|
|
|
|
|
2023-12-07 14:48:31 +00:00
|
|
|
#ifndef bswap16
|
2020-09-06 16:53:08 +00:00
|
|
|
static inline uint16_t bswap16(uint16_t x)
|
|
|
|
{
|
|
|
|
return (x >> 8) | (x << 8);
|
|
|
|
}
|
2023-12-07 14:48:31 +00:00
|
|
|
#endif
|
2020-09-06 16:53:08 +00:00
|
|
|
|
2023-12-07 14:48:31 +00:00
|
|
|
#ifndef bswap32
|
2020-09-06 16:53:08 +00:00
|
|
|
static inline uint32_t bswap32(uint32_t v)
|
|
|
|
{
|
|
|
|
return ((v & 0xff000000) >> 24) | ((v & 0x00ff0000) >> 8) |
|
|
|
|
((v & 0x0000ff00) << 8) | ((v & 0x000000ff) << 24);
|
|
|
|
}
|
2023-12-07 14:48:31 +00:00
|
|
|
#endif
|
2020-09-06 16:53:08 +00:00
|
|
|
|
2023-12-07 14:48:31 +00:00
|
|
|
#ifndef bswap64
|
2020-09-06 16:53:08 +00:00
|
|
|
static inline uint64_t bswap64(uint64_t v)
|
|
|
|
{
|
2023-11-12 09:01:40 +00:00
|
|
|
return ((v & ((uint64_t)0xff << (7 * 8))) >> (7 * 8)) |
|
|
|
|
((v & ((uint64_t)0xff << (6 * 8))) >> (5 * 8)) |
|
|
|
|
((v & ((uint64_t)0xff << (5 * 8))) >> (3 * 8)) |
|
|
|
|
((v & ((uint64_t)0xff << (4 * 8))) >> (1 * 8)) |
|
|
|
|
((v & ((uint64_t)0xff << (3 * 8))) << (1 * 8)) |
|
|
|
|
((v & ((uint64_t)0xff << (2 * 8))) << (3 * 8)) |
|
|
|
|
((v & ((uint64_t)0xff << (1 * 8))) << (5 * 8)) |
|
2020-09-06 16:53:08 +00:00
|
|
|
((v & ((uint64_t)0xff << (0 * 8))) << (7 * 8));
|
|
|
|
}
|
2023-12-07 14:48:31 +00:00
|
|
|
#endif
|
2020-09-06 16:53:08 +00:00
|
|
|
|
2023-11-29 07:50:53 +00:00
|
|
|
static inline void inplace_bswap16(uint8_t *tab) {
|
|
|
|
put_u16(tab, bswap16(get_u16(tab)));
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void inplace_bswap32(uint8_t *tab) {
|
|
|
|
put_u32(tab, bswap32(get_u32(tab)));
|
|
|
|
}
|
|
|
|
|
2024-09-03 18:32:17 +00:00
|
|
|
static inline double fromfp16(uint16_t v) {
|
|
|
|
double d, s;
|
|
|
|
int e;
|
|
|
|
if ((v & 0x7C00) == 0x7C00) {
|
|
|
|
d = (v & 0x3FF) ? NAN : INFINITY;
|
|
|
|
} else {
|
|
|
|
d = (v & 0x3FF) / 1024.;
|
|
|
|
e = (v & 0x7C00) >> 10;
|
|
|
|
if (e == 0) {
|
|
|
|
e = -14;
|
|
|
|
} else {
|
|
|
|
d += 1;
|
|
|
|
e -= 15;
|
|
|
|
}
|
|
|
|
d = scalbn(d, e);
|
|
|
|
}
|
|
|
|
s = (v & 0x8000) ? -1.0 : 1.0;
|
|
|
|
return d * s;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline uint16_t tofp16(double d) {
|
|
|
|
uint16_t f, s;
|
|
|
|
double t;
|
|
|
|
int e;
|
|
|
|
s = 0;
|
|
|
|
if (copysign(1, d) < 0) { // preserve sign when |d| is negative zero
|
|
|
|
d = -d;
|
|
|
|
s = 0x8000;
|
|
|
|
}
|
|
|
|
if (isinf(d))
|
|
|
|
return s | 0x7C00;
|
|
|
|
if (isnan(d))
|
|
|
|
return s | 0x7C01;
|
|
|
|
if (d == 0)
|
|
|
|
return s | 0;
|
|
|
|
d = 2 * frexp(d, &e);
|
|
|
|
e--;
|
|
|
|
if (e > 15)
|
|
|
|
return s | 0x7C00; // out of range, return +/-infinity
|
|
|
|
if (e < -25) {
|
|
|
|
d = 0;
|
|
|
|
e = 0;
|
|
|
|
} else if (e < -14) {
|
|
|
|
d = scalbn(d, e + 14);
|
|
|
|
e = 0;
|
|
|
|
} else {
|
|
|
|
d -= 1;
|
|
|
|
e += 15;
|
|
|
|
}
|
|
|
|
d *= 1024.;
|
|
|
|
f = (uint16_t)d;
|
|
|
|
t = d - f;
|
|
|
|
if (t < 0.5)
|
|
|
|
goto done;
|
|
|
|
if (t == 0.5)
|
|
|
|
if ((f & 1) == 0)
|
|
|
|
goto done;
|
|
|
|
// adjust for rounding
|
|
|
|
if (++f == 1024) {
|
|
|
|
f = 0;
|
|
|
|
if (++e == 31)
|
|
|
|
return s | 0x7C00; // out of range, return +/-infinity
|
|
|
|
}
|
|
|
|
done:
|
|
|
|
return s | (e << 10) | f;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline int isfp16nan(uint16_t v) {
|
|
|
|
return (v & 0x7FFF) > 0x7C00;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline int isfp16zero(uint16_t v) {
|
|
|
|
return (v & 0x7FFF) == 0;
|
|
|
|
}
|
|
|
|
|
2020-09-06 16:53:08 +00:00
|
|
|
/* XXX: should take an extra argument to pass slack information to the caller */
|
|
|
|
typedef void *DynBufReallocFunc(void *opaque, void *ptr, size_t size);
|
|
|
|
|
|
|
|
typedef struct DynBuf {
|
|
|
|
uint8_t *buf;
|
|
|
|
size_t size;
|
|
|
|
size_t allocated_size;
|
|
|
|
BOOL error; /* true if a memory allocation error occurred */
|
|
|
|
DynBufReallocFunc *realloc_func;
|
|
|
|
void *opaque; /* for realloc_func */
|
|
|
|
} DynBuf;
|
|
|
|
|
|
|
|
void dbuf_init(DynBuf *s);
|
|
|
|
void dbuf_init2(DynBuf *s, void *opaque, DynBufReallocFunc *realloc_func);
|
|
|
|
int dbuf_realloc(DynBuf *s, size_t new_size);
|
2023-12-16 00:01:26 +00:00
|
|
|
int dbuf_write(DynBuf *s, size_t offset, const void *data, size_t len);
|
|
|
|
int dbuf_put(DynBuf *s, const void *data, size_t len);
|
2020-09-06 16:53:08 +00:00
|
|
|
int dbuf_put_self(DynBuf *s, size_t offset, size_t len);
|
|
|
|
int dbuf_putc(DynBuf *s, uint8_t c);
|
|
|
|
int dbuf_putstr(DynBuf *s, const char *str);
|
|
|
|
static inline int dbuf_put_u16(DynBuf *s, uint16_t val)
|
|
|
|
{
|
|
|
|
return dbuf_put(s, (uint8_t *)&val, 2);
|
|
|
|
}
|
|
|
|
static inline int dbuf_put_u32(DynBuf *s, uint32_t val)
|
|
|
|
{
|
|
|
|
return dbuf_put(s, (uint8_t *)&val, 4);
|
|
|
|
}
|
|
|
|
static inline int dbuf_put_u64(DynBuf *s, uint64_t val)
|
|
|
|
{
|
|
|
|
return dbuf_put(s, (uint8_t *)&val, 8);
|
|
|
|
}
|
|
|
|
int __attribute__((format(printf, 2, 3))) dbuf_printf(DynBuf *s,
|
2024-01-16 11:42:05 +00:00
|
|
|
FORMAT_STRING(const char *fmt), ...);
|
2020-09-06 16:53:08 +00:00
|
|
|
void dbuf_free(DynBuf *s);
|
|
|
|
static inline BOOL dbuf_error(DynBuf *s) {
|
|
|
|
return s->error;
|
|
|
|
}
|
2020-09-06 17:07:30 +00:00
|
|
|
static inline void dbuf_set_error(DynBuf *s)
|
|
|
|
{
|
|
|
|
s->error = TRUE;
|
|
|
|
}
|
2020-09-06 16:53:08 +00:00
|
|
|
|
Improve UTF-8 decoding and encoding functions (#410)
Ensure proper UTF-8 encoding (1 to 4 bytes).
Handle invalid encodings (return 0xFFFD and consume a single byte)
Individually encoded surrogate code points are accepted.
- add `utf8_scan()` to analyze a byte array for UTF-8 contents
detects invalid encoding, computes number of codepoints and content kind:
plain ASCII, 8-bit, 16-bit or larger codepoints.
- add `utf8_encode_len(c)` to compute the number of bytes to encode `c`
- rename `unicode_to_utf8` as `utf8_encode`
- rename `unicode_from_utf8` as `utf8_decode`
- add `utf8_decode_buf8(dest, size, src, len)` to decode a UTF-8 encoded
byte array known to contain only ASCII and 8-bit codepoints.
- add `utf8_decode_buf16(dest, size, src, len)` to decode a UTF-8 encoded
byte array into an array of 16-bit codepoints using UTF-16 surrogate pairs
for non-BMP1 codepoints.
- add `utf8_encode_buf8(dest, size, src, len)` to encode an array of 8-bit
codepoints as a UTF-8 encoded null terminated string
- add `utf16_encode_buf8(dest, size, src, len)` to decode an array of 16-bit
codepoints (including surrogate pairs) as a UTF-8 encoded null terminated string
- detect invalid UTF-8 encoding in RegExp parser
- simplify `JS_AtomGetStrRT`, `JS_NewStringLen` using the above functions
- simplify UTF-8 decoding and error testing
2024-05-21 12:08:33 +00:00
|
|
|
/*---- UTF-8 and UTF-16 handling ----*/
|
2020-09-06 16:53:08 +00:00
|
|
|
|
Improve UTF-8 decoding and encoding functions (#410)
Ensure proper UTF-8 encoding (1 to 4 bytes).
Handle invalid encodings (return 0xFFFD and consume a single byte)
Individually encoded surrogate code points are accepted.
- add `utf8_scan()` to analyze a byte array for UTF-8 contents
detects invalid encoding, computes number of codepoints and content kind:
plain ASCII, 8-bit, 16-bit or larger codepoints.
- add `utf8_encode_len(c)` to compute the number of bytes to encode `c`
- rename `unicode_to_utf8` as `utf8_encode`
- rename `unicode_from_utf8` as `utf8_decode`
- add `utf8_decode_buf8(dest, size, src, len)` to decode a UTF-8 encoded
byte array known to contain only ASCII and 8-bit codepoints.
- add `utf8_decode_buf16(dest, size, src, len)` to decode a UTF-8 encoded
byte array into an array of 16-bit codepoints using UTF-16 surrogate pairs
for non-BMP1 codepoints.
- add `utf8_encode_buf8(dest, size, src, len)` to encode an array of 8-bit
codepoints as a UTF-8 encoded null terminated string
- add `utf16_encode_buf8(dest, size, src, len)` to decode an array of 16-bit
codepoints (including surrogate pairs) as a UTF-8 encoded null terminated string
- detect invalid UTF-8 encoding in RegExp parser
- simplify `JS_AtomGetStrRT`, `JS_NewStringLen` using the above functions
- simplify UTF-8 decoding and error testing
2024-05-21 12:08:33 +00:00
|
|
|
#define UTF8_CHAR_LEN_MAX 4
|
|
|
|
|
|
|
|
enum {
|
|
|
|
UTF8_PLAIN_ASCII = 0, // 7-bit ASCII plain text
|
|
|
|
UTF8_NON_ASCII = 1, // has non ASCII code points (8-bit or more)
|
|
|
|
UTF8_HAS_16BIT = 2, // has 16-bit code points
|
|
|
|
UTF8_HAS_NON_BMP1 = 4, // has non-BMP1 code points, needs UTF-16 surrogate pairs
|
|
|
|
UTF8_HAS_ERRORS = 8, // has encoding errors
|
|
|
|
};
|
|
|
|
int utf8_scan(const char *buf, size_t len, size_t *plen);
|
|
|
|
size_t utf8_encode_len(uint32_t c);
|
2024-10-10 16:55:42 +00:00
|
|
|
size_t utf8_encode(uint8_t buf[minimum_length(UTF8_CHAR_LEN_MAX)], uint32_t c);
|
2024-05-27 06:15:52 +00:00
|
|
|
uint32_t utf8_decode_len(const uint8_t *p, size_t max_len, const uint8_t **pp);
|
|
|
|
uint32_t utf8_decode(const uint8_t *p, const uint8_t **pp);
|
Improve UTF-8 decoding and encoding functions (#410)
Ensure proper UTF-8 encoding (1 to 4 bytes).
Handle invalid encodings (return 0xFFFD and consume a single byte)
Individually encoded surrogate code points are accepted.
- add `utf8_scan()` to analyze a byte array for UTF-8 contents
detects invalid encoding, computes number of codepoints and content kind:
plain ASCII, 8-bit, 16-bit or larger codepoints.
- add `utf8_encode_len(c)` to compute the number of bytes to encode `c`
- rename `unicode_to_utf8` as `utf8_encode`
- rename `unicode_from_utf8` as `utf8_decode`
- add `utf8_decode_buf8(dest, size, src, len)` to decode a UTF-8 encoded
byte array known to contain only ASCII and 8-bit codepoints.
- add `utf8_decode_buf16(dest, size, src, len)` to decode a UTF-8 encoded
byte array into an array of 16-bit codepoints using UTF-16 surrogate pairs
for non-BMP1 codepoints.
- add `utf8_encode_buf8(dest, size, src, len)` to encode an array of 8-bit
codepoints as a UTF-8 encoded null terminated string
- add `utf16_encode_buf8(dest, size, src, len)` to decode an array of 16-bit
codepoints (including surrogate pairs) as a UTF-8 encoded null terminated string
- detect invalid UTF-8 encoding in RegExp parser
- simplify `JS_AtomGetStrRT`, `JS_NewStringLen` using the above functions
- simplify UTF-8 decoding and error testing
2024-05-21 12:08:33 +00:00
|
|
|
size_t utf8_decode_buf8(uint8_t *dest, size_t dest_len, const char *src, size_t src_len);
|
|
|
|
size_t utf8_decode_buf16(uint16_t *dest, size_t dest_len, const char *src, size_t src_len);
|
|
|
|
size_t utf8_encode_buf8(char *dest, size_t dest_len, const uint8_t *src, size_t src_len);
|
|
|
|
size_t utf8_encode_buf16(char *dest, size_t dest_len, const uint16_t *src, size_t src_len);
|
2020-09-06 16:53:08 +00:00
|
|
|
|
2024-04-07 16:19:55 +00:00
|
|
|
static inline BOOL is_surrogate(uint32_t c)
|
|
|
|
{
|
|
|
|
return (c >> 11) == (0xD800 >> 11); // 0xD800-0xDFFF
|
|
|
|
}
|
|
|
|
|
2023-11-20 08:46:02 +00:00
|
|
|
static inline BOOL is_hi_surrogate(uint32_t c)
|
|
|
|
{
|
2024-04-07 16:19:55 +00:00
|
|
|
return (c >> 10) == (0xD800 >> 10); // 0xD800-0xDBFF
|
2023-11-20 08:46:02 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline BOOL is_lo_surrogate(uint32_t c)
|
|
|
|
{
|
2024-04-07 16:19:55 +00:00
|
|
|
return (c >> 10) == (0xDC00 >> 10); // 0xDC00-0xDFFF
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline uint32_t get_hi_surrogate(uint32_t c)
|
|
|
|
{
|
|
|
|
return (c >> 10) - (0x10000 >> 10) + 0xD800;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline uint32_t get_lo_surrogate(uint32_t c)
|
|
|
|
{
|
|
|
|
return (c & 0x3FF) | 0xDC00;
|
2023-11-20 08:46:02 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline uint32_t from_surrogate(uint32_t hi, uint32_t lo)
|
|
|
|
{
|
|
|
|
return 65536 + 1024 * (hi & 1023) + (lo & 1023);
|
|
|
|
}
|
|
|
|
|
2020-09-06 16:53:08 +00:00
|
|
|
static inline int from_hex(int c)
|
|
|
|
{
|
|
|
|
if (c >= '0' && c <= '9')
|
|
|
|
return c - '0';
|
|
|
|
else if (c >= 'A' && c <= 'F')
|
|
|
|
return c - 'A' + 10;
|
|
|
|
else if (c >= 'a' && c <= 'f')
|
|
|
|
return c - 'a' + 10;
|
|
|
|
else
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
2024-04-19 09:35:44 +00:00
|
|
|
static inline uint8_t is_upper_ascii(uint8_t c) {
|
|
|
|
return c >= 'A' && c <= 'Z';
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline uint8_t to_upper_ascii(uint8_t c) {
|
|
|
|
return c >= 'a' && c <= 'z' ? c - 'a' + 'A' : c;
|
|
|
|
}
|
|
|
|
|
|
|
|
extern char const digits36[36];
|
|
|
|
size_t u32toa(char buf[minimum_length(11)], uint32_t n);
|
|
|
|
size_t i32toa(char buf[minimum_length(12)], int32_t n);
|
|
|
|
size_t u64toa(char buf[minimum_length(21)], uint64_t n);
|
|
|
|
size_t i64toa(char buf[minimum_length(22)], int64_t n);
|
|
|
|
size_t u32toa_radix(char buf[minimum_length(33)], uint32_t n, unsigned int base);
|
2024-05-26 06:06:36 +00:00
|
|
|
size_t i32toa_radix(char buf[minimum_length(34)], int32_t n, unsigned base);
|
2024-04-19 09:35:44 +00:00
|
|
|
size_t u64toa_radix(char buf[minimum_length(65)], uint64_t n, unsigned int base);
|
|
|
|
size_t i64toa_radix(char buf[minimum_length(66)], int64_t n, unsigned int base);
|
|
|
|
|
2020-09-06 16:53:08 +00:00
|
|
|
void rqsort(void *base, size_t nmemb, size_t size,
|
|
|
|
int (*cmp)(const void *, const void *, void *),
|
|
|
|
void *arg);
|
|
|
|
|
2023-11-22 08:36:53 +00:00
|
|
|
int64_t js__gettimeofday_us(void);
|
|
|
|
uint64_t js__hrtime_ns(void);
|
|
|
|
|
2023-12-05 09:46:40 +00:00
|
|
|
static inline size_t js__malloc_usable_size(const void *ptr)
|
|
|
|
{
|
|
|
|
#if defined(__APPLE__)
|
|
|
|
return malloc_size(ptr);
|
|
|
|
#elif defined(_WIN32)
|
|
|
|
return _msize((void *)ptr);
|
2024-03-12 08:06:07 +00:00
|
|
|
#elif defined(__linux__) || defined(__ANDROID__) || defined(__CYGWIN__) || defined(__FreeBSD__)
|
2023-12-05 09:46:40 +00:00
|
|
|
return malloc_usable_size((void *)ptr);
|
|
|
|
#else
|
|
|
|
return 0;
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
2024-04-02 19:50:42 +00:00
|
|
|
/* Cross-platform threading APIs. */
|
|
|
|
|
|
|
|
#if !defined(EMSCRIPTEN) && !defined(__wasi__)
|
|
|
|
|
|
|
|
#if defined(_WIN32)
|
|
|
|
#define JS_ONCE_INIT INIT_ONCE_STATIC_INIT
|
|
|
|
typedef INIT_ONCE js_once_t;
|
|
|
|
typedef CRITICAL_SECTION js_mutex_t;
|
|
|
|
typedef CONDITION_VARIABLE js_cond_t;
|
|
|
|
#else
|
|
|
|
#define JS_ONCE_INIT PTHREAD_ONCE_INIT
|
|
|
|
typedef pthread_once_t js_once_t;
|
|
|
|
typedef pthread_mutex_t js_mutex_t;
|
|
|
|
typedef pthread_cond_t js_cond_t;
|
|
|
|
#endif
|
|
|
|
|
|
|
|
void js_once(js_once_t *guard, void (*callback)(void));
|
|
|
|
|
|
|
|
void js_mutex_init(js_mutex_t *mutex);
|
|
|
|
void js_mutex_destroy(js_mutex_t *mutex);
|
|
|
|
void js_mutex_lock(js_mutex_t *mutex);
|
|
|
|
void js_mutex_unlock(js_mutex_t *mutex);
|
|
|
|
|
|
|
|
void js_cond_init(js_cond_t *cond);
|
|
|
|
void js_cond_destroy(js_cond_t *cond);
|
|
|
|
void js_cond_signal(js_cond_t *cond);
|
|
|
|
void js_cond_broadcast(js_cond_t *cond);
|
|
|
|
void js_cond_wait(js_cond_t *cond, js_mutex_t *mutex);
|
|
|
|
int js_cond_timedwait(js_cond_t *cond, js_mutex_t *mutex, uint64_t timeout);
|
|
|
|
|
|
|
|
#endif /* !defined(EMSCRIPTEN) && !defined(__wasi__) */
|
|
|
|
|
2024-07-01 10:30:20 +00:00
|
|
|
#ifdef __cplusplus
|
|
|
|
} /* extern "C" { */
|
|
|
|
#endif
|
|
|
|
|
2020-09-06 16:53:08 +00:00
|
|
|
#endif /* CUTILS_H */
|