diff options
Diffstat (limited to 'src/recompiler/cutils.c')
-rw-r--r-- | src/recompiler/cutils.c | 752 |
1 files changed, 752 insertions, 0 deletions
diff --git a/src/recompiler/cutils.c b/src/recompiler/cutils.c new file mode 100644 index 00000000..5fbf70bd --- /dev/null +++ b/src/recompiler/cutils.c @@ -0,0 +1,752 @@ +/* + * Simple C functions to supplement the C library + * + * Copyright (c) 2006 Fabrice Bellard + * + * Permission is hereby granted, free of charge, to any person obtaining a copy + * of this software and associated documentation files (the "Software"), to deal + * in the Software without restriction, including without limitation the rights + * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the Software is + * furnished to do so, subject to the following conditions: + * + * The above copyright notice and this permission notice shall be included in + * all copies or substantial portions of the Software. + * + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, + * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN + * THE SOFTWARE. + */ +#include "qemu-common.h" +#include "host-utils.h" + +#ifdef VBOX +# include "osdep.h" + + +static inline int toupper(int ch) { + if ( (unsigned int)(ch - 'a') < 26u ) + ch += 'A' - 'a'; + return ch; +} + +/* Quick sort from OpenSolaris: + http://src.opensolaris.org/source/raw/onnv/onnv-gate/usr/src/common/util/qsort.c */ +/* + * choose a median of 3 values + * + * note: cstyle specifically prohibits nested conditional operators + * but this is the only way to do the median of 3 function in-line + */ +#define med3(a, b, c) (cmp((a), (b)) < 0) \ + ? ((cmp((b), (c)) < 0) ? (b) : (cmp((a), (c)) < 0) ? (c) : (a)) \ + : ((cmp((b), (c)) > 0) ? (b) : (cmp((a), (c)) > 0) ? (c) : (a)) + +#define THRESH_L 5 /* threshold for insertion sort */ +#define THRESH_M3 20 /* threshold for median of 3 */ +#define THRESH_M9 50 /* threshold for median of 9 */ + +typedef struct { + char *b_lim; + size_t nrec; +} stk_t; + +/* + * The following swap functions should not create a stack frame + * the SPARC call / return instruction will be executed + * but the a save / restore will not be executed + * which means we won't do a window turn with the spill / fill overhead + * verify this by examining the assembly code + */ + +/* ARGSUSED */ +static void +swapp32(uint32_t *r1, uint32_t *r2, size_t cnt) +{ + uint32_t temp; + + temp = *r1; + *r1++ = *r2; + *r2++ = temp; +} + +/* ARGSUSED */ +static void +swapp64(uint64_t *r1, uint64_t *r2, size_t cnt) +{ + uint64_t temp; + + temp = *r1; + *r1++ = *r2; + *r2++ = temp; +} + +static void +swapi(uint32_t *r1, uint32_t *r2, size_t cnt) +{ + uint32_t temp; + + /* character by character */ + while (cnt--) { + temp = *r1; + *r1++ = *r2; + *r2++ = temp; + } +} + +static void +swapb(char *r1, char *r2, size_t cnt) +{ + char temp; + + /* character by character */ + while (cnt--) { + temp = *r1; + *r1++ = *r2; + *r2++ = temp; + } +} + +/* + * qsort() is a general purpose, in-place sorting routine using a + * user provided call back function for comparisons. This implementation + * utilizes a ternary quicksort algorithm, and cuts over to an + * insertion sort for partitions involving fewer than THRESH_L records. + * + * Potential User Errors + * There is no return value from qsort, this function has no method + * of alerting the user that a sort did not work or could not work. + * We do not print an error message or exit the process or thread, + * Even if we can detect an error, We CANNOT silently return without + * sorting the data, if we did so the user could never be sure the + * sort completed successfully. + * It is possible we could change the return value of sort from void + * to int and return success or some error codes, but this gets into + * standards and compatibility issues. + * + * Examples of qsort parameter errors might be + * 1) record size (rsiz) equal to 0 + * qsort will loop and never return. + * 2) record size (rsiz) less than 0 + * rsiz is unsigned, so a negative value is insanely large + * 3) number of records (nrec) is 0 + * This is legal - qsort will return without examining any records + * 4) number of records (nrec) is less than 0 + * nrec is unsigned, so a negative value is insanely large. + * 5) nrec * rsiz > memory allocation for sort array + * a segment violation may occur + * corruption of other memory may occur + * 6) The base address of the sort array is invalid + * a segment violation may occur + * corruption of other memory may occur + * 7) The user call back function is invalid + * we may get alignment errors or segment violations + * we may jump into never-never land + * + * Some less obvious errors might be + * 8) The user compare function is not comparing correctly + * 9) The user compare function modifies the data records + */ + +void +qemu_qsort( + void *basep, + size_t nrec, + size_t rsiz, + int (*cmp)(const void *, const void *)) +{ + size_t i; /* temporary variable */ + + /* variables used by swap */ + void (*swapf)(char *, char *, size_t); + size_t loops; + + /* variables used by sort */ + stk_t stack[8 * sizeof (nrec) + 1]; + stk_t *sp; + char *b_lim; /* bottom limit */ + char *b_dup; /* bottom duplicate */ + char *b_par; /* bottom partition */ + char *t_lim; /* top limit */ + char *t_dup; /* top duplicate */ + char *t_par; /* top partition */ + char *m1, *m2, *m3; /* median pointers */ + uintptr_t d_bytelength; /* byte length of duplicate records */ + int b_nrec; + int t_nrec; + int cv; /* results of compare (bottom / top) */ + + /* + * choose a swap function based on alignment and size + * + * The qsort function sorts an array of fixed length records. + * We have very limited knowledge about the data record itself. + * It may be that the data record is in the array we are sorting + * or it may be that the array contains pointers or indexes to + * the actual data record and all that we are sorting is the indexes. + * + * The following decision will choose an optimal swap function + * based on the size and alignment of the data records + * swapp64 will swap 64 bit pointers + * swapp32 will swap 32 bit pointers + * swapi will swap an array of 32 bit integers + * swapb will swap an array of 8 bit characters + * + * swapi and swapb will also require the variable loops to be set + * to control the length of the array being swapped + */ + if ((((uintptr_t)basep & (sizeof (uint64_t) - 1)) == 0) && + (rsiz == sizeof (uint64_t))) { + loops = 1; + swapf = (void (*)(char *, char *, size_t))swapp64; + } else if ((((uintptr_t)basep & (sizeof (uint32_t) - 1)) == 0) && + (rsiz == sizeof (uint32_t))) { + loops = 1; + swapf = (void (*)(char *, char *, size_t))swapp32; + } else if ((((uintptr_t)basep & (sizeof (uint32_t) - 1)) == 0) && + ((rsiz & (sizeof (uint32_t) - 1)) == 0)) { + loops = rsiz / sizeof (int); + swapf = (void (*)(char *, char *, size_t))swapi; + } else { + loops = rsiz; + swapf = swapb; + } + + /* + * qsort is a partitioning sort + * + * the stack is the bookkeeping mechanism to keep track of all + * the partitions. + * + * each sort pass takes one partition and sorts it into two partitions. + * at the top of the loop we simply take the partition on the top + * of the stack and sort it. See the comments at the bottom + * of the loop regarding which partitions to add in what order. + * + * initially put the whole partition on the stack + */ + sp = stack; + sp->b_lim = (char *)basep; + sp->nrec = nrec; + sp++; + while (sp > stack) { + sp--; + b_lim = sp->b_lim; + nrec = sp->nrec; + + /* + * a linear insertion sort i faster than a qsort for + * very small number of records (THRESH_L) + * + * if number records < threshold use linear insertion sort + * + * this also handles the special case where the partition + * 0 or 1 records length. + */ + if (nrec < THRESH_L) { + /* + * Linear insertion sort + */ + t_par = b_lim; + for (i = 1; i < nrec; i++) { + t_par += rsiz; + b_par = t_par; + while (b_par > b_lim) { + b_par -= rsiz; + if ((*cmp)(b_par, b_par + rsiz) <= 0) { + break; + } + (*swapf)(b_par, b_par + rsiz, loops); + } + } + + /* + * a linear insertion sort will put all records + * in their final position and will not create + * subpartitions. + * + * therefore when the insertion sort is complete + * just go to the top of the loop and get the + * next partition to sort. + */ + continue; + } + + /* quicksort */ + + /* + * choose a pivot record + * + * Ideally the pivot record will divide the partition + * into two equal parts. however we have to balance the + * work involved in selecting the pivot record with the + * expected benefit. + * + * The choice of pivot record depends on the number of + * records in the partition + * + * for small partitions (nrec < THRESH_M3) + * we just select the record in the middle of the partition + * + * if (nrec >= THRESH_M3 && nrec < THRESH_M9) + * we select three values and choose the median of 3 + * + * if (nrec >= THRESH_M9) + * then we use an approximate median of 9 + * 9 records are selected and grouped in 3 groups of 3 + * the median of each of these 3 groups is fed into another + * median of 3 decision. + * + * Each median of 3 decision is 2 or 3 compares, + * so median of 9 costs between 8 and 12 compares. + * + * i is byte distance between two consecutive samples + * m2 will point to the pivot record + */ + if (nrec < THRESH_M3) { + m2 = b_lim + (nrec / 2) * rsiz; + } else if (nrec < THRESH_M9) { + /* use median of 3 */ + i = ((nrec - 1) / 2) * rsiz; + m2 = med3(b_lim, b_lim + i, b_lim + 2 * i); + } else { + /* approx median of 9 */ + i = ((nrec - 1) / 8) * rsiz; + m1 = med3(b_lim, b_lim + i, b_lim + 2 * i); + m2 = med3(b_lim + 3 * i, b_lim + 4 * i, b_lim + 5 * i); + m3 = med3(b_lim + 6 * i, b_lim + 7 * i, b_lim + 8 * i); + m2 = med3(m1, m2, m3); + } + + /* + * quick sort partitioning + * + * The partition limits are defined by bottom and top pointers + * b_lim and t_lim. + * + * qsort uses a fairly standard method of moving the + * partitioning pointers, b_par and t_par, to the middle of + * the partition and exchanging records that are in the + * wrong part of the partition. + * + * Two enhancements have been made to the basic algorithm. + * One for handling duplicate records and one to minimize + * the number of swaps. + * + * Two duplicate records pointers are (b_dup and t_dup) are + * initially set to b_lim and t_lim. Each time a record + * whose sort key value is equal to the pivot record is found + * it will be swapped with the record pointed to by + * b_dup or t_dup and the duplicate pointer will be + * incremented toward the center. + * When partitioning is complete, all the duplicate records + * will have been collected at the upper and lower limits of + * the partition and can easily be moved adjacent to the + * pivot record. + * + * The second optimization is to minimize the number of swaps. + * The pointer m2 points to the pivot record. + * During partitioning, if m2 is ever equal to the partitioning + * pointers, b_par or t_par, then b_par or t_par just moves + * onto the next record without doing a compare. + * If as a result of duplicate record detection, + * b_dup or t_dup is ever equal to m2, + * then m2 is changed to point to the duplicate record and + * b_dup or t_dup is incremented with out swapping records. + * + * When partitioning is done, we may not have the same pivot + * record that we started with, but we will have one with + * an equal sort key. + */ + b_dup = b_par = b_lim; + t_dup = t_par = t_lim = b_lim + rsiz * (nrec - 1); + for (;;) { + + /* move bottom pointer up */ + for (; b_par <= t_par; b_par += rsiz) { + if (b_par == m2) { + continue; + } + cv = cmp(b_par, m2); + if (cv > 0) { + break; + } + if (cv == 0) { + if (b_dup == m2) { + m2 = b_par; + } else if (b_dup != b_par) { + (*swapf)(b_dup, b_par, loops); + } + b_dup += rsiz; + } + } + + /* move top pointer down */ + for (; b_par < t_par; t_par -= rsiz) { + if (t_par == m2) { + continue; + } + cv = cmp(t_par, m2); + if (cv < 0) { + break; + } + if (cv == 0) { + if (t_dup == m2) { + m2 = t_par; + } else if (t_dup != t_par) { + (*swapf)(t_dup, t_par, loops); + } + t_dup -= rsiz; + } + } + + /* break if we are done partitioning */ + if (b_par >= t_par) { + break; + } + + /* exchange records at upper and lower break points */ + (*swapf)(b_par, t_par, loops); + b_par += rsiz; + t_par -= rsiz; + } + + /* + * partitioning is now complete + * + * there are two termination conditions from the partitioning + * loop above. Either b_par or t_par have crossed or + * they are equal. + * + * we need to swap the pivot record to its final position + * m2 could be in either the upper or lower partitions + * or it could already be in its final position + */ + /* + * R[b_par] > R[m2] + * R[t_par] < R[m2] + */ + if (t_par < b_par) { + if (m2 < t_par) { + (*swapf)(m2, t_par, loops); + m2 = b_par = t_par; + } else if (m2 > b_par) { + (*swapf)(m2, b_par, loops); + m2 = t_par = b_par; + } else { + b_par = t_par = m2; + } + } else { + if (m2 < t_par) { + t_par = b_par = t_par - rsiz; + } + if (m2 != b_par) { + (*swapf)(m2, b_par, loops); + } + m2 = t_par; + } + + /* + * move bottom duplicates next to pivot + * optimized to eliminate overlap + */ + d_bytelength = b_dup - b_lim; + if (b_par - b_dup < d_bytelength) { + b_dup = b_lim + (b_par - b_dup); + } + while (b_dup > b_lim) { + b_dup -= rsiz; + b_par -= rsiz; + (*swapf)(b_dup, b_par, loops); + } + b_par = m2 - d_bytelength; + + /* + * move top duplicates next to pivot + */ + d_bytelength = t_lim - t_dup; + if (t_dup - t_par < d_bytelength) { + t_dup = t_lim - (t_dup - t_par); + } + while (t_dup < t_lim) { + t_dup += rsiz; + t_par += rsiz; + (*swapf)(t_dup, t_par, loops); + } + t_par = m2 + d_bytelength; + + /* + * when a qsort pass completes there are three partitions + * 1) the lower contains all records less than pivot + * 2) the upper contains all records greater than pivot + * 3) the pivot partition contains all record equal to pivot + * + * all records in the pivot partition are in their final + * position and do not need to be accounted for by the stack + * + * when adding partitions to the stack + * it is important to add the largest partition first + * to prevent stack overflow. + * + * calculate number of unsorted records in top and bottom + * push resulting partitions on stack + */ + b_nrec = (b_par - b_lim) / rsiz; + t_nrec = (t_lim - t_par) / rsiz; + if (b_nrec < t_nrec) { + sp->b_lim = t_par + rsiz; + sp->nrec = t_nrec; + sp++; + sp->b_lim = b_lim; + sp->nrec = b_nrec; + sp++; + } else { + sp->b_lim = b_lim; + sp->nrec = b_nrec; + sp++; + sp->b_lim = t_par + rsiz; + sp->nrec = t_nrec; + sp++; + } + } +} + +#endif /* VBOX */ + +void pstrcpy(char *buf, int buf_size, const char *str) +{ + int c; + char *q = buf; + + if (buf_size <= 0) + return; + + for(;;) { + c = *str++; + if (c == 0 || q >= buf + buf_size - 1) + break; + *q++ = c; + } + *q = '\0'; +} + +/* strcat and truncate. */ +char *pstrcat(char *buf, int buf_size, const char *s) +{ + int len; + len = strlen(buf); + if (len < buf_size) + pstrcpy(buf + len, buf_size - len, s); + return buf; +} + +int strstart(const char *str, const char *val, const char **ptr) +{ + const char *p, *q; + p = str; + q = val; + while (*q != '\0') { + if (*p != *q) + return 0; + p++; + q++; + } + if (ptr) + *ptr = p; + return 1; +} + +int stristart(const char *str, const char *val, const char **ptr) +{ + const char *p, *q; + p = str; + q = val; + while (*q != '\0') { + if (qemu_toupper(*p) != qemu_toupper(*q)) + return 0; + p++; + q++; + } + if (ptr) + *ptr = p; + return 1; +} + +/* XXX: use host strnlen if available ? */ +int qemu_strnlen(const char *s, int max_len) +{ + int i; + + for(i = 0; i < max_len; i++) { + if (s[i] == '\0') { + break; + } + } + return i; +} + +#ifndef VBOX +time_t mktimegm(struct tm *tm) +{ + time_t t; + int y = tm->tm_year + 1900, m = tm->tm_mon + 1, d = tm->tm_mday; + if (m < 3) { + m += 12; + y--; + } + t = 86400 * (d + (153 * m - 457) / 5 + 365 * y + y / 4 - y / 100 + + y / 400 - 719469); + t += 3600 * tm->tm_hour + 60 * tm->tm_min + tm->tm_sec; + return t; +} +#endif /* !VBOX */ + +int qemu_fls(int i) +{ + return 32 - clz32(i); +} + +#ifndef VBOX + +/* + * Make sure data goes on disk, but if possible do not bother to + * write out the inode just for timestamp updates. + * + * Unfortunately even in 2009 many operating systems do not support + * fdatasync and have to fall back to fsync. + */ +int qemu_fdatasync(int fd) +{ +#ifdef CONFIG_FDATASYNC + return fdatasync(fd); +#else + return fsync(fd); +#endif +} + +/* io vectors */ + +void qemu_iovec_init(QEMUIOVector *qiov, int alloc_hint) +{ + qiov->iov = qemu_malloc(alloc_hint * sizeof(struct iovec)); + qiov->niov = 0; + qiov->nalloc = alloc_hint; + qiov->size = 0; +} + +void qemu_iovec_init_external(QEMUIOVector *qiov, struct iovec *iov, int niov) +{ + int i; + + qiov->iov = iov; + qiov->niov = niov; + qiov->nalloc = -1; + qiov->size = 0; + for (i = 0; i < niov; i++) + qiov->size += iov[i].iov_len; +} + +void qemu_iovec_add(QEMUIOVector *qiov, void *base, size_t len) +{ + assert(qiov->nalloc != -1); + + if (qiov->niov == qiov->nalloc) { + qiov->nalloc = 2 * qiov->nalloc + 1; + qiov->iov = qemu_realloc(qiov->iov, qiov->nalloc * sizeof(struct iovec)); + } + qiov->iov[qiov->niov].iov_base = base; + qiov->iov[qiov->niov].iov_len = len; + qiov->size += len; + ++qiov->niov; +} + +/* + * Copies iovecs from src to the end dst until src is completely copied or the + * total size of the copied iovec reaches size. The size of the last copied + * iovec is changed in order to fit the specified total size if it isn't a + * perfect fit already. + */ +void qemu_iovec_concat(QEMUIOVector *dst, QEMUIOVector *src, size_t size) +{ + int i; + size_t done; + + assert(dst->nalloc != -1); + + done = 0; + for (i = 0; (i < src->niov) && (done != size); i++) { + if (done + src->iov[i].iov_len > size) { + qemu_iovec_add(dst, src->iov[i].iov_base, size - done); + break; + } else { + qemu_iovec_add(dst, src->iov[i].iov_base, src->iov[i].iov_len); + } + done += src->iov[i].iov_len; + } +} + +void qemu_iovec_destroy(QEMUIOVector *qiov) +{ + assert(qiov->nalloc != -1); + + qemu_free(qiov->iov); +} + +void qemu_iovec_reset(QEMUIOVector *qiov) +{ + assert(qiov->nalloc != -1); + + qiov->niov = 0; + qiov->size = 0; +} + +void qemu_iovec_to_buffer(QEMUIOVector *qiov, void *buf) +{ + uint8_t *p = (uint8_t *)buf; + int i; + + for (i = 0; i < qiov->niov; ++i) { + memcpy(p, qiov->iov[i].iov_base, qiov->iov[i].iov_len); + p += qiov->iov[i].iov_len; + } +} + +void qemu_iovec_from_buffer(QEMUIOVector *qiov, const void *buf, size_t count) +{ + const uint8_t *p = (const uint8_t *)buf; + size_t copy; + int i; + + for (i = 0; i < qiov->niov && count; ++i) { + copy = count; + if (copy > qiov->iov[i].iov_len) + copy = qiov->iov[i].iov_len; + memcpy(qiov->iov[i].iov_base, p, copy); + p += copy; + count -= copy; + } +} + +#ifndef _WIN32 +/* Sets a specific flag */ +int fcntl_setfl(int fd, int flag) +{ + int flags; + + flags = fcntl(fd, F_GETFL); + if (flags == -1) + return -errno; + + if (fcntl(fd, F_SETFL, flags | flag) == -1) + return -errno; + + return 0; +} +#endif + +#endif /* !VBOX */ + |