| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346 |
- /*
- Copyright (c) 2013 Daniele Bartolini, Michele Rossi
- Copyright (c) 2012 Daniele Bartolini, Simone Boscaratto
- Permission is hereby granted, free of charge, to any person
- obtaining a copy of this software and associated documentation
- files (the "Software"), to deal in the Software without
- restriction, including without limitation the rights to use,
- copy, modify, merge, publish, distribute, sublicense, and/or sell
- copies of the Software, and to permit persons to whom the
- Software is furnished to do so, subject to the following
- conditions:
- The above copyright notice and this permission notice shall be
- included in all copies or substantial portions of the Software.
- THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
- EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
- OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
- NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
- HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
- WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
- FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
- OTHER DEALINGS IN THE SOFTWARE.
- */
- #pragma once
- #include <cstdio>
- #include <cstring>
- #include "assert.h"
- #include "types.h"
- #include "config.h"
- #include "macros.h"
- namespace crown
- {
- namespace string
- {
/// Returns true when @a c is an ASCII letter ('a'-'z' or 'A'-'Z').
inline bool is_alpha(char c)
{
	const bool lowercase = ('a' <= c && c <= 'z');
	const bool uppercase = ('A' <= c && c <= 'Z');

	return lowercase || uppercase;
}
/// Returns true when @a c is one of the decimal digits '0'-'9'.
inline bool is_digit(char c)
{
	return ('0' <= c && c <= '9');
}
/// Returns true when @a c is an ASCII upper-case letter ('A'-'Z').
inline bool is_upper(char c)
{
	if (c < 'A')
	{
		return false;
	}

	return c <= 'Z';
}
/// Returns true when @a c is an ASCII lower-case letter ('a'-'z').
inline bool is_lower(char c)
{
	const bool outside_range = (c < 'a' || c > 'z');

	return !outside_range;
}
/// Returns true when @a c is a space, horizontal tab, line feed or
/// carriage return. No other character is treated as whitespace.
inline bool is_whitespace(char c)
{
	switch (c)
	{
		case ' ':
		case '\t':
		case '\n':
		case '\r':
			return true;
		default:
			return false;
	}
}
/// Returns the length of @a str as reported by the C library ::strlen
/// (number of characters before the terminating NUL).
inline size_t strlen(const char* str)
{
	const size_t length = ::strlen(str);
	return length;
}
/// Forwards to the C library ::strstr: returns a pointer to the first
/// occurrence of @a str2 inside @a str1, or whatever ::strstr returns
/// when there is no match.
inline const char* strstr(const char* str1, const char* str2)
{
	const char* const match = ::strstr(str1, str2);
	return match;
}
/// Forwards to the C library ::strcmp and returns its result as int32_t.
inline int32_t strcmp(const char* str1, const char* str2)
{
	const int32_t order = ::strcmp(str1, str2);
	return order;
}
/// Forwards to the C library ::strncmp, comparing at most @a len
/// characters of @a s1 and @a s2, and returns its result as int32_t.
inline int32_t strncmp(const char* s1, const char* s2, size_t len)
{
	const int32_t order = ::strncmp(s1, s2, len);
	return order;
}
/// Copies at most @a len characters from @a src into @a dest through the
/// C library ::strncpy and then forces dest[len - 1] to '\0', so the
/// first @a len bytes of @a dest always contain a terminated string.
///
/// @note
/// When @a len is 0 nothing is written and @a dest is returned untouched;
/// previously the terminator store indexed dest[len - 1] with an
/// underflowed size_t and wrote far outside the buffer.
///
/// @return @a dest.
inline char* strncpy(char* dest, const char* src, size_t len)
{
	// A zero-sized destination has no room for a terminator at all.
	if (len == 0)
	{
		return dest;
	}

	char* ret = ::strncpy(dest, src, len);

	// ::strncpy does not terminate when src has len or more characters.
	dest[len - 1] = '\0';

	return ret;
}
/// Forwards to the C library ::strcat, appending @a src to @a dest, and
/// returns the pointer ::strcat returns.
inline char* strcat(char* dest, const char* src)
{
	char* const joined = ::strcat(dest, src);
	return joined;
}
/// Forwards to the C library ::strncat, appending at most @a len
/// characters of @a src to @a dest, and returns the pointer ::strncat
/// returns.
inline char* strncat(char* dest, const char* src, size_t len)
{
	char* const joined = ::strncat(dest, src, len);
	return joined;
}
- inline const char* begin(const char* str)
- {
- CE_ASSERT(str != NULL, "Str must be != NULL");
- return str;
- }
- inline const char* end(const char* str)
- {
- CE_ASSERT(str != NULL, "Str must be != NULL");
- return str + string::strlen(str) + 1;
- }
- inline const char* find_first(const char* str, char c)
- {
- CE_ASSERT(str != NULL, "Str must be != NULL");
- const char* str_begin = string::begin(str);
- while (str_begin != string::end(str))
- {
- if ((*str_begin) == c)
- {
- return str_begin;
- }
- str_begin++;
- }
- return string::end(str);
- }
- inline const char* find_last(const char* str, char c)
- {
- CE_ASSERT(str != NULL, "Str must be != NULL");
- const char* str_end = string::end(str) - 1;
- while (str_end != string::begin(str) - 1)
- {
- if ((*str_end) == c)
- {
- return str_end;
- }
- str_end--;
- }
- return string::end(str);
- }
- inline void substring(const char* begin, const char* end, char* out, size_t len)
- {
- CE_ASSERT(begin != NULL, "Begin must be != NULL");
- CE_ASSERT(end != NULL, "End must be != NULL");
- CE_ASSERT(out != NULL, "Out must be != NULL");
- size_t i = 0;
- char* out_iterator = out;
- while (begin != end && i < len)
- {
- (*out_iterator) = (*begin);
- begin++;
- out_iterator++;
- i++;
- }
- out[i] = '\0';
- }
- inline int32_t parse_int(const char* string)
- {
- int val;
- int ok = sscanf(string, "%d", &val);
- CE_ASSERT(ok == 1, "Failed to parse int: %s", string);
- CE_UNUSED(ok);
- return val;
- }
- inline uint32_t parse_uint(const char* string)
- {
- unsigned int val;
- int ok = sscanf(string, "%u", &val);
- CE_ASSERT(ok == 1, "Failed to parse uint: %s", string);
- CE_UNUSED(ok);
- return val;
- }
- inline float parse_float(const char* string)
- {
- float val;
- int ok = sscanf(string, "%f", &val);
- CE_ASSERT(ok == 1, "Failed to parse float: %s", string);
- CE_UNUSED(ok);
- return val;
- }
- inline double parse_double(const char* string)
- {
- double val;
- int ok = sscanf(string, "%lf", &val);
- CE_ASSERT(ok == 1, "Failed to parse float: %s", string);
- CE_UNUSED(ok);
- return val;
- }
- /// MurmurHash2, by Austin Appleby
- ///
- /// @note
- /// This code makes a few assumptions about how your machine behaves
- ///
- /// 1. We can read a 4-byte value from any address without crashing
- /// 2. sizeof(int) == 4
- ///
- /// And it has a few limitations -
- ///
- /// 1. It will not work incrementally.
- /// 2. It will not produce the same results on little-endian and big-endian
- /// machines.
- inline uint32_t murmur2_32(const void* key, size_t len, uint32_t seed = 0)
- {
- CE_ASSERT_NOT_NULL(key);
- // 'm' and 'r' are mixing constants generated offline.
- // They're not really 'magic', they just happen to work well.
- const unsigned int m = 0x5bd1e995;
- const int r = 24;
- // Initialize the hash to a 'random' value
- unsigned int h = seed ^ len;
- // Mix 4 bytes at a time into the hash
- const unsigned char * data = (const unsigned char *)key;
- while(len >= 4)
- {
- unsigned int k = *(unsigned int *)data;
- k *= m;
- k ^= k >> r;
- k *= m;
- h *= m;
- h ^= k;
- data += 4;
- len -= 4;
- }
- // Handle the last few bytes of the input array
- switch(len)
- {
- case 3: h ^= data[2] << 16;
- case 2: h ^= data[1] << 8;
- case 1: h ^= data[0];
- h *= m;
- };
- // Do a few final mixes of the hash to ensure the last few
- // bytes are well-incorporated.
- h ^= h >> 13;
- h *= m;
- h ^= h >> 15;
- return h;
- }
/// 64-bit MurmurHash2 variant (multiplier 0xc6a4a7935bd1e995, shift 47).
///
/// Computes a 64-bit hash of the @a len bytes starting at @a key, mixed
/// with @a seed.
///
/// @note
/// Input words are loaded with memcpy, so @a key may have any alignment.
/// Words are read in native byte order, so the result differs between
/// little-endian and big-endian machines.
inline uint64_t murmur2_64(const void* key, int len, uint64_t seed = 0)
{
	const uint64_t m = 0xc6a4a7935bd1e995ull;
	const int r = 47;

	uint64_t h = seed ^ (len * m);

	const unsigned char* data = static_cast<const unsigned char*>(key);
	const unsigned char* const body_end = data + (len / 8) * 8;

	// Mix 8 bytes at a time into the hash
	while (data != body_end)
	{
		// memcpy yields the same native-endian word as reading through
		// a uint64_t pointer, without alignment or aliasing requirements.
		uint64_t k;
		::memcpy(&k, data, sizeof(k));
		data += sizeof(k);

		k *= m;
		k ^= k >> r;
		k *= m;

		h ^= k;
		h *= m;
	}

	// Handle the remaining 0-7 bytes; 'data' now points at the tail.
	switch (len & 7)
	{
		case 7: h ^= uint64_t(data[6]) << 48; // fall through
		case 6: h ^= uint64_t(data[5]) << 40; // fall through
		case 5: h ^= uint64_t(data[4]) << 32; // fall through
		case 4: h ^= uint64_t(data[3]) << 24; // fall through
		case 3: h ^= uint64_t(data[2]) << 16; // fall through
		case 2: h ^= uint64_t(data[1]) << 8;  // fall through
		case 1: h ^= uint64_t(data[0]);
			h *= m;
	}

	// Final mixes so the last bytes are well incorporated.
	h ^= h >> r;
	h *= m;
	h ^= h >> r;

	return h;
}
#if defined(CROWN_DEBUG)

/// Returns @a value after asserting that it equals the 32-bit murmur2
/// hash (seed 0) of the NUL-terminated string @a s.
inline uint32_t HASH32(const char *s, uint32_t value)
{
	CE_ASSERT(murmur2_32(s, string::strlen(s), 0) == value, "Hash mismatch");

	return value;
}

/// Returns @a value after asserting that it equals the 64-bit murmur2
/// hash (seed 0) of the NUL-terminated string @a s.
inline uint64_t HASH64(const char* s, uint64_t value)
{
	CE_ASSERT(murmur2_64(s, string::strlen(s), 0) == value, "Hash mismatch");

	return value;
}

#else

// Without CROWN_DEBUG the helpers are macros that expand to the
// precomputed hash; the string argument is discarded unevaluated.
#define HASH32(s, v) (v)
#define HASH64(s, v) (v)

#endif
- } // namespace string
- } // namespace crown
|