util.c | searchcode

/user/firefly/mt-daapd-svn/src/util.c

https://bitbucket.org/altlc/wive-rtnl-ralink-rt305x-routers-firmware-amod · C · 725 lines · 515 code · 125 blank · 85 comment · 137 complexity · fe59051f8b056a3babbcf80a101d7ff1 MD5 · raw file

/*
 * simple utility functions
 */

#ifdef HAVE_CONFIG_H
#  include "config.h"
#endif

#include <errno.h>
#include <pthread.h>

#ifdef HAVE_STDINT_H
# include <stdint.h>
#endif

#include <stdio.h>
#include <stdarg.h>
#include <stdlib.h>
#include <string.h>
#include <sys/types.h>

#ifdef HAVE_ICONV
# include <iconv.h>
#endif

#include "daapd.h"
#include "err.h"
#include "util.h"


/* Globals */
/* One mutex per ff_lock_t value below l_last; set up by _util_mutex_init() */
pthread_mutex_t util_locks[(int)l_last];
/* Serializes the one-time initialization of util_locks */
pthread_mutex_t util_mutex = PTHREAD_MUTEX_INITIALIZER;
/* Becomes 1 once every entry of util_locks has been initialized */
int _util_initialized=0;


/* Forwards */
void _util_mutex_init(void);

/**
 * Hash a block of bytes: start from 5381 and, for every byte,
 * multiply the running value by 33 and add the byte.
 *
 * @param data bytes to hash
 * @param len number of bytes of data to fold into the hash
 * @returns the 32-bit hash (5381 when len is zero)
 */
uint32_t util_djb_hash_block(unsigned char *data, uint32_t len) {
    uint32_t result = 5381;
    uint32_t i;

    for(i = 0; i < len; i++) {
        /* unsigned arithmetic, so overflow simply wraps modulo 2^32 */
        result = result * 33 + data[i];
    }

    return result;
}

/**
 * Hash a NUL-terminated string by handing its bytes (terminator
 * excluded) to util_djb_hash_block().
 *
 * @param str NUL-terminated string to hash
 * @returns the 32-bit hash of the string contents
 */
uint32_t util_djb_hash_str(char *str) {
    return util_djb_hash_block((unsigned char *)str,(uint32_t)strlen(str));
}

/**
 * Report the current value of the global stop flag (config.stop).
 * Dumb utility function that should probably live somewhere else.
 *
 * @returns the value of config.stop
 */
int util_must_exit(void) {
    int stop_flag = config.stop;

    return stop_flag;
}

#ifdef HAVE_ICONV
/**
 * Convert UTF-8 to UTF-16LE by delegating to util_xtoy(), logging the
 * request and the outcome at debug level.
 *
 * @param utf16 destination buffer
 * @param dlen size of the destination buffer in bytes
 * @param utf8 source text (also printed with %s in the debug log)
 * @param slen number of source bytes to convert
 * @returns whatever util_xtoy() returns
 */
int util_utf8toutf16(unsigned char *utf16, int dlen, unsigned char *utf8, int slen) {
    int ok;

    DPRINTF(E_DBG,L_MISC,"Converting %s to utf-16le (slen=%d, dlen=%d)\n",utf8,slen,dlen);

    ok = util_xtoy(utf16, dlen, utf8, slen, "UTF-8", "UTF-16LE");

    DPRINTF(E_DBG,L_MISC,"Result: %d\n",ok);
    return ok;
}

/**
 * Convert UTF-16LE to UTF-8 by delegating to util_xtoy(), logging the
 * request and the converted text at debug level.
 *
 * @param utf8 destination buffer
 * @param dlen size of the destination buffer in bytes
 * @param utf16 source text
 * @param slen number of source bytes to convert
 * @returns whatever util_xtoy() returns
 */
int util_utf16toutf8(unsigned char *utf8, int dlen, unsigned char *utf16, int slen) {
    int ok;

    DPRINTF(E_DBG,L_MISC,"Converting *something* to utf-8 (slen=%d, dlen=%d)\n",slen,dlen);

    ok = util_xtoy(utf8, dlen, utf16, slen, "UTF-16LE", "UTF-8");

    DPRINTF(E_DBG,L_MISC,"Converted to %s\n",utf8);
    return ok;
}

/**
 * Count the bytes of a UTF-16 string, up to but not including its
 * two-byte NUL terminator.
 *
 * The scan moves one 16-bit unit at a time, so the terminator must be
 * a pair of zero bytes at an even offset from the start.
 *
 * @param utf16 NUL-terminated UTF-16 string (NULL is tolerated)
 * @returns length in bytes, or 0 for a NULL pointer
 */
int util_utf16_byte_len(unsigned char *utf16) {
    int len = 0;

    if(!utf16)
        return 0;

    while(utf16[len] || utf16[len + 1])
        len += 2;

    return len;
}


/**
 * Convert a NUL-terminated UTF-8 string into a newly allocated
 * UTF-16LE buffer using util_xtoy().
 *
 * @param utf8 NUL-terminated UTF-8 string
 * @returns buffer the caller must free(), or NULL if utf8 is NULL,
 *          allocation fails, or the conversion fails
 */
unsigned char *util_utf8toutf16_alloc(unsigned char *utf8) {
    unsigned char *utf16;
    size_t slen;
    size_t dlen;

    if(!utf8)
        return NULL;

    slen = strlen((char*)utf8);

    /* Four output bytes per input byte is a generous bound; the extra
     * two bytes guarantee room for a full 16-bit terminator even when
     * the input is empty (the buffer is zero-filled). */
    dlen = slen * 4 + 2;

    utf16 = calloc(1,dlen);
    if(!utf16)
        return NULL;

    if(util_xtoy(utf16,(int)dlen,utf8,(int)slen,"UTF-8","UTF-16LE")) {
        return utf16;
    }

    free(utf16);
    return NULL;
}

/**
 * Convert slen bytes of UTF-16LE into a newly allocated UTF-8 buffer
 * using util_xtoy().
 *
 * @param utf16 UTF-16LE source bytes
 * @param slen number of source bytes
 * @returns zero-terminated buffer the caller must free(), or NULL if
 *          the arguments are invalid, allocation fails, or the
 *          conversion fails
 */
unsigned char *util_utf16toutf8_alloc(unsigned char *utf16, int slen) {
    unsigned char *utf8;
    int dlen;

    if(!utf16 || slen < 0)
        return NULL;

    dlen = slen * 2 + 1;

    utf8=calloc(1,dlen);
    if(!utf8)
        return NULL;

    if(util_xtoy(utf8,dlen,utf16,slen,"UTF-16LE","UTF-8")) {
        return utf8;
    }

    free(utf8);
    return NULL;
}

/**
 * Convert slen bytes in an arbitrary source encoding into a newly
 * allocated UTF-8 buffer using util_xtoy().
 *
 * @param x source bytes
 * @param slen number of source bytes
 * @param from name of the source encoding, passed through to util_xtoy()
 * @returns zero-terminated buffer the caller must free(), or NULL if
 *          the arguments are invalid, allocation fails, or the
 *          conversion fails
 */
unsigned char *util_xtoutf8_alloc(unsigned char *x, int slen, char *from) {
    unsigned char *utf8;
    int dlen;

    if(!x || !from || slen < 0)
        return NULL;

    dlen = slen * 4 + 1;

    utf8 = calloc(1,dlen);
    if(!utf8)
        return NULL;

    if(util_xtoy(utf8,dlen,x,slen,from,"UTF-8")) {
        return utf8;
    }

    free(utf8);
    return NULL;
}

/**
 * Convert a buffer from one character encoding to another with iconv.
 *
 * The destination buffer is zero-filled before conversion, so any
 * bytes iconv does not write remain zero.
 *
 * @param dbuffer destination buffer
 * @param dlen size of the destination buffer in bytes
 * @param sbuffer source bytes
 * @param slen number of source bytes
 * @param from name of the source encoding
 * @param to name of the destination encoding
 * @returns nonzero on success, 0 if the converter could not be opened
 *          or the conversion failed
 */
int util_xtoy(unsigned char *dbuffer, int dlen, unsigned char *sbuffer, int slen, char *from, char *to) {
    iconv_t iv;
    size_t csize;
    int saved_errno;

    /* type punning warnings */
    size_t st_dlen = (size_t)dlen;
    size_t st_slen = (size_t)slen;
    char *st_dbuffer = (char*)dbuffer;
    ICONV_CONST char *st_sbuffer = (char*)sbuffer;

    memset(dbuffer,0,dlen);

    iv=iconv_open(to,from);
    if(iv == (iconv_t)-1) {
        DPRINTF(E_LOG,L_MISC,"iconv error: iconv_open failed with %d\n",errno);
        /* no valid descriptor: must not reach iconv()/iconv_close() */
        return 0;
    }

    csize = iconv(iv,&st_sbuffer,&st_slen,
                  &st_dbuffer,&st_dlen);
    if(csize == (size_t)-1) {
        /* capture errno before any logging call can disturb it */
        saved_errno = errno;
        switch(saved_errno) {
            case EILSEQ:
                DPRINTF(E_LOG,L_MISC,"iconv error: Invalid multibyte sequence\n");
                break;
            case EINVAL:
                DPRINTF(E_LOG,L_MISC,"iconv error: Incomplete multibyte sequence\n");
                break;
            case E2BIG:
                DPRINTF(E_LOG,L_MISC,"iconv error: Insufficient buffer size\n");
                break;
            default:
                DPRINTF(E_LOG,L_MISC,"iconv error: unknown (%d)\n",saved_errno);
                break;
        }
    }
    iconv_close(iv);

    return (csize != (size_t)-1);
}

#else

/* homerolled conversions */
/**
 * Count the bytes of a UTF-16 string, up to but not including its
 * two-byte NUL terminator.
 *
 * The scan moves one 16-bit unit at a time, so the terminator must be
 * a pair of zero bytes at an even offset from the start.
 *
 * @param utf16 NUL-terminated UTF-16 string (NULL is tolerated)
 * @returns length in bytes, or 0 for a NULL pointer
 */
int util_utf16_byte_len(unsigned char *utf16) {
    int len = 0;

    if(!utf16)
        return 0;

    while(utf16[len] || utf16[len + 1])
        len += 2;

    return len;
}

/**
 * Work out how many UTF-8 bytes a UTF-16LE buffer needs once
 * converted (terminator not included).
 *
 * A unit in the high-surrogate range is assumed to start a pair: it
 * consumes the following unit as well and counts as four bytes.
 *
 * @param utf16 UTF-16LE bytes
 * @param len number of bytes in utf16; a trailing odd byte is ignored
 * @returns UTF-8 byte count, or -1 if a high surrogate is the last
 *          complete unit in the buffer
 */
int util_utf16toutf8_len(unsigned char *utf16, int len) {
    int total = 0;
    int pos = 0;
    uint32_t unit;

    while(len - pos >= 2) {
        unit = ((uint32_t)utf16[pos + 1] << 8) | utf16[pos];
        pos += 2;

        if((unit & 0xFC00) == 0xD800) {
            /* the second half of the pair has to be present */
            if(len - pos < 2)
                return -1;
            total += 4;
            pos += 2;
            continue;
        }

        if(unit <= 0x7F) {
            total += 1;
        } else if(unit <= 0x7FF) {
            total += 2;
        } else {
            total += 3;
        }
    }

    return total;
}

/**
 * Convert a UTF-16LE buffer to a NUL-terminated UTF-8 string in a
 * caller-supplied buffer.
 *
 * The required size is computed first with util_utf16toutf8_len();
 * the destination must hold that many bytes plus the terminator.
 *
 * We assume this is utf-16LE, as it comes from windows
 *
 * @param utf8 destination buffer
 * @param dlen size of the destination buffer in bytes
 * @param utf16 utf-16 to convert
 * @param len length of utf-16 string in bytes
 * @returns number of UTF-8 bytes written (terminator excluded), or
 *          FALSE when len is zero, the destination is too small, or
 *          the input contains a broken surrogate pair
 */

int util_utf16toutf8(unsigned char *utf8, int dlen, unsigned char *utf16, int len) {
    unsigned char *src=utf16;
    unsigned char *end;
    unsigned char *dst;
    unsigned int w1, w2;
    int bytes;
    int new_len;

    if(!len)
        return FALSE;

    new_len = util_utf16toutf8_len(utf16,len);
    if((new_len == -1) || (dlen <= new_len)) {
        /* the destination has not been written yet, so it must not be
         * printed as a string here */
        DPRINTF(E_LOG,L_MISC,"Cannot convert utf16 to utf8; E2BIG (%d vs %d)\n",new_len,dlen);
        return FALSE;
    }

    end = utf16 + len;
    dst=utf8;
    while((end - src) >= 2) {
        w1=src[1] << 8 | src[0];
        src += 2;
        if((w1 & 0xFC00) == 0xD800) { // could be surrogate pair
            if((end - src) < 2) {
                DPRINTF(E_INF,L_SCAN,"Invalid utf-16 in file\n");
                return FALSE;
            }
            /* src already points at the second unit of the pair */
            w2 = src[1] << 8 | src[0];
            if((w2 & 0xFC00) != 0xDC00) {
                DPRINTF(E_INF,L_SCAN,"Invalid utf-16 in file\n");
                return FALSE;
            }
            /* consume the low surrogate so it is not encoded again */
            src += 2;

            // bottom 10 bits of each half, then add back the 0x10000
            w1 = (((w1 & 0x03FF) << 10) | (w2 & 0x03FF)) + 0x10000;
        }

        // now encode the code point in utf-8: lead byte first...
        if (w1 < 0x80) {
            *dst++ = w1;
            bytes=0;
        } else if (w1 < 0x800) {
            *dst++ = 0xC0 | (w1 >> 6);
            bytes=1;
        } else if (w1 < 0x10000) {
            *dst++ = 0xE0 | (w1 >> 12);
            bytes=2;
        } else {
            *dst++ = 0xF0 | (w1 >> 18);
            bytes=3;
        }

        // ...then the continuation bytes, most significant bits first
        while(bytes) {
            *dst++ = 0x80 | ((w1 >> (6*(bytes-1))) & 0x3f);
            bytes--;
        }
    }

    *dst = '\x0';

    return new_len;
}

/**
 * Calculate how long a utf8 string will be once converted to UTF-16.
 *
 * Each sequence is sized from its lead byte alone: a four-byte
 * sequence counts as a surrogate pair (4 bytes), everything else as
 * one 16-bit unit (2 bytes). Continuation bytes are not validated.
 *
 * @param utf8 NUL-terminated UTF-8 string
 * @returns number of UTF-16 bytes needed plus one, or -1 if the
 *          string ends in the middle of a multi-byte sequence
 */
int util_utf8toutf16_len(unsigned char *utf8) {
    int len,out_len,trailing_bytes;
    int pos = 0;

    len=(int)strlen((char *)utf8);
    out_len = 0;

    while(pos < len) {
        trailing_bytes = 0;
        if((utf8[pos] & 0xE0) == 0xC0) trailing_bytes = 1;
        else if((utf8[pos] & 0xF0) == 0xE0) trailing_bytes = 2;
        else if((utf8[pos] & 0xF8) == 0xF0) trailing_bytes = 3;

        /* the last continuation byte sits at pos + trailing_bytes and
         * must come before the NUL terminator at index len */
        if(pos + trailing_bytes >= len)
            return -1;

        out_len += 2;
        if(trailing_bytes == 3) /* surrogate pair */
            out_len += 2;

        pos += (1 + trailing_bytes);
    }

    out_len += 1;
    return out_len;
}

/**
 * Convert a NUL-terminated UTF-8 string into a newly allocated
 * UTF-16LE buffer.
 *
 * Because util_utf8toutf16() returns FALSE for an empty string, an
 * empty input yields NULL here as well.
 *
 * @param utf8 NUL-terminated UTF-8 string
 * @returns buffer the caller must free(), or NULL if utf8 is NULL,
 *          the input is truncated, allocation fails, or the
 *          conversion fails
 */
unsigned char *util_utf8toutf16_alloc(unsigned char *utf8) {
    unsigned char *out;
    int new_len;

    if(!utf8)
        return NULL;

    new_len = util_utf8toutf16_len(utf8);
    if(new_len == -1)
        return NULL;

    out = calloc(1,new_len + 2);
    if(!out)
        return NULL;

    if(!util_utf8toutf16(out,new_len + 2,utf8,(int)strlen((char*)utf8))) {
        free(out);
        return NULL;
    }

    return out;
}

/**
 * Convert len bytes of UTF-16LE into a newly allocated,
 * NUL-terminated UTF-8 string.
 *
 * Because util_utf16toutf8() returns FALSE when len is zero, an empty
 * input yields NULL here as well.
 *
 * NOTE(review): this function is spelled "touft8", while the iconv
 * build of this file defines util_utf16toutf8_alloc -- confirm which
 * spelling the header and callers expect before renaming.
 *
 * @param utf16 UTF-16LE source bytes
 * @param len number of source bytes
 * @returns buffer the caller must free(), or NULL if utf16 is NULL,
 *          the input ends inside a surrogate pair, allocation fails,
 *          or the conversion fails
 */
unsigned char *util_utf16touft8_alloc(unsigned char *utf16, int len) {
    unsigned char *out;
    int new_len;

    if(!utf16)
        return NULL;

    new_len = util_utf16toutf8_len(utf16,len);
    if(new_len == -1)
        return NULL;

    out = calloc(1,new_len + 1);
    if(!out)
        return NULL;

    if(!util_utf16toutf8(out,new_len + 1,utf16,len)) {
        free(out);
        return NULL;
    }
    return out;
}

/**
 * Convert a NUL-terminated UTF-8 string to UTF-16LE in a
 * caller-supplied buffer, terminated with two zero bytes.
 *
 * @param utf16 destination buffer
 * @param dlen size of the destination buffer in bytes; must exceed
 *             util_utf8toutf16_len(utf8) + 1
 * @param utf8 NUL-terminated UTF-8 string
 * @param len ignored; the length is always recomputed with strlen()
 * @returns the value of util_utf8toutf16_len(utf8) on success, FALSE
 *          if the string is empty, truncated, encodes a code point
 *          above U+10FFFF, or does not fit in the destination
 */
int util_utf8toutf16(unsigned char *utf16, int dlen, unsigned char *utf8, int len) {
    unsigned char *src=utf8;
    unsigned char *dst;
    int new_len;
    int trailing_bytes;
    uint32_t utf32;
    uint16_t temp_word;

    len=(int)strlen((char*)utf8); /* ignore passed length, might be wrong! */
    if(!len)
        return FALSE;

    new_len = util_utf8toutf16_len(utf8);
    if((new_len == -1) || (dlen <= (new_len+1))) {
        DPRINTF(E_LOG,L_MISC,"Cannot convert %s to utf16; E2BIG (%d vs %d)\n",utf8,new_len,dlen);
        return FALSE;
    }

    dst=utf16;

    while(src < utf8 + len) {
        utf32=0;
        trailing_bytes=0;

        if((*src & 0xE0) == 0xC0) trailing_bytes = 1;
        else if((*src & 0xF0) == 0xE0) trailing_bytes = 2;
        else if((*src & 0xF8) == 0xF0) trailing_bytes = 3;

        /* every continuation byte must come before the terminator */
        if(src + trailing_bytes >= utf8 + len) {
            DPRINTF(E_LOG,L_SCAN,"Invalid UTF8 string\n");
            return FALSE;
        }

        switch(trailing_bytes) {
        case 0:
            utf32 = *src;
            break;
        case 1:
            utf32 = ((src[0] & 0x1F) << 6) |
                (src[1] & 0x3F);
            break;
        case 2:
            utf32 = ((src[0] & 0x0F) << 12) |
                ((src[1] & 0x3F) << 6) |
                ((src[2] & 0x3F));
            break;
        case 3:
            utf32 = ((src[0] & 0x07) << 18) |
                ((src[1] & 0x3F) << 12) |
                ((src[2] & 0x3F) << 6) |
                ((src[3] & 0x3F));
            break;
        }

        if(utf32 <= 0xFFFF) {
            /* we are encoding LE style... */
            *dst++ = utf32 & 0xFF;
            *dst++ = (utf32 & 0xFF00) >> 8;
        } else if(utf32 <= 0x10FFFF) {
            /* Encode with surrogates: the pair carries the 20-bit
             * offset from 0x10000, not the code point itself */
            utf32 -= 0x10000;
            temp_word = 0xD800 | ((utf32 >> 10) & 0x3FF);
            *dst++ = temp_word & 0xFF;
            *dst++ = (temp_word & 0xFF00) >> 8;
            temp_word = 0xDC00 | (utf32 & 0x3FF);
            *dst++ = temp_word & 0xFF;
            *dst++ = (temp_word & 0xFF00) >> 8;
        } else {
            /* beyond the range UTF-16 can represent */
            DPRINTF(E_LOG,L_SCAN,"Invalid UTF8 string\n");
            return FALSE;
        }

        src += (trailing_bytes + 1);
    }

    *dst++ = '\x0';
    *dst = '\x0';
    return new_len;
}

#endif

/**
 * Log a block of memory as rows of 16 bytes: a hex offset, the bytes
 * in hex, then the same bytes as characters, with anything outside
 * ' '..'~' shown as '.'. A short final row is padded with spaces.
 *
 * @param block bytes to dump (nothing is logged if NULL)
 * @param len number of bytes to dump (nothing is logged if <= 0)
 */
void util_hexdump(unsigned char *block, int len) {
    char output[80];
    size_t pos;
    int rows;
    int row, offset;
    int remaining;
    unsigned char byte;

    if(!block || len <= 0)
        return;

    rows = len / 16 + ((len % 16) ? 1 : 0);

    for(row=0;row<rows;row++) {
        /* bytes of this row that actually exist in block */
        remaining = len - row*16;

        /* worst case is 10 + 16*3 + 16 = 74 characters, so the
         * bounded writes below never truncate */
        pos = (size_t)snprintf(output,sizeof(output),"%04X: ",(unsigned int)(row*16));

        for(offset=0; offset < 16; offset++) {
            if(offset < remaining) {
                pos += (size_t)snprintf(output+pos,sizeof(output)-pos,
                                        "%02X ",block[row*16 + offset]);
            } else {
                pos += (size_t)snprintf(output+pos,sizeof(output)-pos,"   ");
            }
        }

        for(offset=0; offset < 16; offset++) {
            if(offset < remaining) {
                byte = block[row*16 + offset];
                output[pos++] = ((byte >= ' ') && (byte <= '~')) ? (char)byte : '.';
            } else {
                output[pos++] = ' ';
            }
        }
        output[pos] = '\0';

        DPRINTF(E_LOG,L_MISC,"%s\n",output);
    }
}

/**
 * Acquire one of the utility locks, setting up the lock table first
 * if that has not happened yet. Prints a message and exits with -1
 * when the lock cannot be taken.
 *
 * @param which lock to acquire
 */
void util_mutex_lock(ff_lock_t which) {
    pthread_mutex_t *target = &util_locks[(int)which];

    if(!_util_initialized)
        _util_mutex_init();

    if(pthread_mutex_lock(target) != 0) {
        fprintf(stderr,"Cannot lock mutex\n");
        exit(-1);
    }
}

/**
 * Release one of the utility locks. Prints a message and exits with
 * -1 when the unlock fails.
 *
 * @param which lock to release
 */
void util_mutex_unlock(ff_lock_t which) {
    pthread_mutex_t *target = &util_locks[(int)which];

    if(pthread_mutex_unlock(target) != 0) {
        fprintf(stderr,"Cannot unlock mutex\n");
        exit(-1);
    }
}

/**
 * Initialize every entry of util_locks exactly once, under the
 * protection of util_mutex. Calls after the first find
 * _util_initialized set and do nothing. Any locking or
 * initialization failure prints a message and exits with -1.
 *
 * This might should be done from the main thread.
 */
void _util_mutex_init(void) {
    int idx;

    if(pthread_mutex_lock(&util_mutex) != 0) {
        fprintf(stderr,"Error locking mutex\n");
        exit(-1);
    }

    if(!_util_initialized) {
        /* set up each lock slot with default attributes */
        for(idx = 0; idx < (int)l_last; idx++) {
            if(pthread_mutex_init(&util_locks[idx],NULL) != 0) {
                fprintf(stderr,"Error initializing mutex\n");
                exit(-1);
            }
        }
        _util_initialized=1;
    }

    pthread_mutex_unlock(&util_mutex);
}

/**
 * split a string on delimiter boundaries, filling
 * a string-pointer array.
 *
 * Leading delimiters are skipped. Inside the string, a delimiter
 * character immediately followed by the same character is an escape:
 * the pair does not split and is collapsed to a single character in
 * the resulting token.
 *
 * All tokens live in one allocation, so the user must free both the
 * first element in the array, and the array itself (see
 * util_dispose_split).
 *
 * @param s string to split
 * @param delimiters boundaries to split on
 * @param argvp an argv array to be filled; NULL-terminated on success
 * @returns number of tokens (always at least 1), or -1 on a NULL
 *          argument or allocation failure
 */
int util_split(char *s, char *delimiters, char ***argvp) {
    int i;
    int numtokens;
    const char *snew;
    char *t;
    char *tokptr;
    char *tmp;
    char *fix_src, *fix_dst;

    if ((s == NULL) || (delimiters == NULL) || (argvp == NULL))
        return -1;
    *argvp = NULL;
    snew = s + strspn(s, delimiters);
    if ((t = malloc(strlen(snew) + 1)) == NULL)
        return -1;

    strcpy(t, snew);

    /* Count on the stripped copy, the same text that gets split
     * below.  Counting on s would over-count whenever s starts with
     * delimiters and send the split loop past the end of t. */
    numtokens = 1;
    tmp = t;
    while(*tmp) {
        if(strchr(delimiters,*tmp) && (*(tmp+1) == *tmp)) {
            tmp += 2;           /* escaped delimiter */
        } else if(strchr(delimiters,*tmp)) {
            numtokens++;
            tmp++;
        } else {
            tmp++;
        }
    }

    DPRINTF(E_DBG,L_CONF,"Found %d tokens in %s\n",numtokens,s);

    if ((*argvp = malloc((numtokens + 1)*sizeof(char *))) == NULL) {
        free(t);
        return -1;
    }

    tokptr = t;
    tmp = t;
    for (i = 0; i < numtokens; i++) {
        /* find the unescaped delimiter (or end of string) that
         * finishes this token */
        while(*tmp) {
            if(strchr(delimiters,*tmp) && (*(tmp+1) != *tmp))
                break;
            if(strchr(delimiters,*tmp)) {
                tmp += 2;
            } else {
                tmp++;
            }
        }

        /* cut the token; never step beyond the terminator */
        if(*tmp) {
            *tmp = '\0';
            tmp++;
        }
        (*argvp)[i] = tokptr;

        /* collapse escaped (doubled) delimiters in place */
        fix_src = fix_dst = tokptr;
        while(*fix_src) {
            if(strchr(delimiters,*fix_src) && (*(fix_src+1) == *fix_src)) {
                fix_src++;
            }
            *fix_dst++ = *fix_src++;
        }
        *fix_dst = '\0';

        tokptr = tmp;
        DPRINTF(E_DBG,L_CONF,"Token %d: %s\n",i+1,(*argvp)[i]);
    }

    *((*argvp) + numtokens) = NULL;
    return numtokens;
}

/**
 * Release an argv set produced by util_split: the token storage that
 * the first element points to, then the pointer array itself.
 *
 * @param argv string array to delete (NULL is ignored)
 */
void util_dispose_split(char **argv) {
    if(argv != NULL) {
        /* free(NULL) is a no-op, so an empty first slot needs no check */
        free(argv[0]);
        free(argv);
    }
}

/**
 * printf-style formatting into a newly allocated string; the actual
 * work is done by util_vasprintf.
 *
 * @param fmt format string, followed by its arguments
 * @returns the string produced by util_vasprintf, or NULL if fmt is
 *          NULL
 */
char *util_asprintf(char *fmt, ...) {
    char *formatted = NULL;
    va_list args;

    ASSERT(fmt);

    if(fmt) {
        va_start(args,fmt);
        formatted = util_vasprintf(fmt, args);
        va_end(args);
    }

    return formatted;
}

/**
 * Write a formatted string to an allocated string.  This deals with
 * versions of vsnprintf that return either the C99 way, or the pre-C99
 * way, by increasing the buffer until it works.
 *
 * The caller's va_list is never consumed directly: every formatting
 * attempt runs on a fresh copy, so retries always see the arguments
 * from the start.
 *
 * @param fmt format string of print (compatible with printf(2))
 * @param ap arguments for the format string
 * @returns newly allocated string that the caller must free()
 */

/* C99 defines va_copy as a macro, so use it whenever <stdarg.h>
 * provides it, even if configure did not set HAVE_VA_COPY.  The
 * memcpy fallback is a last resort for older toolchains. */
#if defined(HAVE_VA_COPY) || defined(va_copy)
# define VA_COPY(a,b) va_copy((a),(b))
#else
# ifdef HAVE___VA_COPY
#  define VA_COPY(a,b) __va_copy((a),(b))
# else
#  define VA_COPY(a,b) memcpy((&a),(&b),sizeof(b))
# endif
#endif

char *util_vasprintf(char *fmt, va_list ap) {
    char *outbuf;
    char *newbuf;
    va_list ap2;
    int size=200;
    int new_size;

    outbuf = (char*)malloc(size);
    if(!outbuf) {
        DPRINTF(E_FATAL,L_MISC,"Could not allocate buffer in vasprintf\n");
        /* same policy as the realloc failure below; never continue
         * with a NULL buffer */
        exit(1);
    }

    while(1) {
        /* format from a private copy so ap stays pristine for retries */
        VA_COPY(ap2,ap);
        new_size=vsnprintf(outbuf,size,fmt,ap2);
        va_end(ap2);

        if(new_size > -1 && new_size < size)
            break;

        if(new_size > -1)
            size = new_size + 1;    /* C99: exact size is known */
        else
            size *= 2;              /* pre-C99: just grow and retry */

        if((newbuf = realloc(outbuf,size)) == NULL) {
            free(outbuf);
            DPRINTF(E_FATAL,L_MISC,"malloc error in vasprintf\n");
            exit(1);
        }
        outbuf = newbuf;
    }

    return outbuf;
}


#ifdef DEBUG_MEM
/*
 * Prototypes for allocator wrappers, declared only when DEBUG_MEM is
 * defined.  The allocating variants take file and line arguments in
 * addition to the usual malloc/calloc/realloc parameters.
 * NOTE(review): no definitions are visible in this part of the file,
 * and line is declared as char * rather than an integer -- confirm
 * against the implementation.
 */
void *util_malloc(char *file, char *line, size_t size);
void *util_calloc(char *file, char *line, size_t count, size_t size);
void *util_realloc(char *file, char *line, void *ptr, size_t size);
void util_free(void *ptr);
#endif