123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401 |
- //-----------------------------------------------------------------------------
- // Copyright (c) 2012 GarageGames, LLC
- //
- // Permission is hereby granted, free of charge, to any person obtaining a copy
- // of this software and associated documentation files (the "Software"), to
- // deal in the Software without restriction, including without limitation the
- // rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
- // sell copies of the Software, and to permit persons to whom the Software is
- // furnished to do so, subject to the following conditions:
- //
- // The above copyright notice and this permission notice shall be included in
- // all copies or substantial portions of the Software.
- //
- // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
- // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
- // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
- // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
- // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
- // FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
- // IN THE SOFTWARE.
- //-----------------------------------------------------------------------------
- #ifndef _TORQUE_STRING_H_
- #define _TORQUE_STRING_H_
- #include <cstdarg>
- #ifndef _TORQUE_TYPES_H_
- #include "platform/types.h"
- #endif
- #include <string.h>
- template< class T > class Vector;
- typedef UTF8 StringChar;
- /// The String class represents a 0-terminated array of characters.
- class String
- {
- public:
- class StringData;
- /// Default mode is case sensitive starting from the left
- enum Mode
- {
- Case = 0, ///< Case sensitive
- NoCase = 1, ///< Case insensitive
- Left = 0, ///< Start at left end of string
- Right = 2, ///< Start at right end of string
- };
- typedef U32 SizeType;
- typedef StringChar ValueType;
- static const SizeType NPos; ///< Indicates 'not found' when using find() functions
- /// A predefined empty string.
- static const String EmptyString;
- String();
- String(const String &str);
- String(const StringChar *str);
- String(const StringChar *str, SizeType size); ///< Copy from raw data
- String(const UTF16 *str);
- ~String();
- const UTF8 *c_str() const; ///< Return the string as a native type
- const UTF16 *utf16() const;
- const UTF8* utf8() const { return c_str(); }
- SizeType length() const; ///< Returns the length of the string in bytes.
- SizeType size() const; ///< Returns the length of the string in bytes including the NULL terminator.
- SizeType numChars() const; ///< Returns the length of the string in characters.
- bool isEmpty() const; ///< Is this an empty string [""]?
- static bool isEmpty(const char*); // is the input empty?
- bool isNotEmpty() const { return !isEmpty(); } ///< Is this not an empty string [""]?
- /// Erases all characters in a string.
- void clear() { *this = EmptyString; }
- bool isShared() const; ///< Is this string's reference count greater than 1?
- bool isSame( const String& str ) const; ///< Return true if both strings refer to the same shared data.
- U32 getHashCaseSensitive() const; ///< Get the case-sensitive hash of the string [only calculates the hash as necessary]
- U32 getHashCaseInsensitive() const; ///< Get the case-insensitive hash of the string [only calculates the hash as necessary]
- String& operator=(StringChar);
- String& operator+=(StringChar);
- String& operator=(const StringChar*);
- String& operator+=(const StringChar*);
- String& operator=(const String&);
- String& operator+=(const String&);
-
- /**
- Compare this string with another.
- @param str The string to compare against.
- @param len If len is non-zero, then at most len characters are compared.
- @param mode Comparison mode.
- @return Difference between the first two characters that don't match.
- */
- S32 compare(const StringChar *str, SizeType len = 0, U32 mode = Case|Left) const;
- S32 compare(const String &str, SizeType len = 0, U32 mode = Case|Left) const; ///< @see compare(const StringChar *, SizeType, U32) const
- /**
- Compare two strings for equality.
- It will use the string hashes to determine inequality.
- @param str The string to compare against.
- @param mode Comparison mode - case sensitive or not.
- */
- bool equal(const String &str, U32 mode = Case) const;
- SizeType find(StringChar c, SizeType pos = 0, U32 mode = Case|Left) const;
- SizeType find(const StringChar *str, SizeType pos = 0, U32 mode = Case|Left) const;
- SizeType find(const String &str, SizeType pos = 0, U32 mode = Case|Left) const;
-
- String &insert(SizeType pos, const StringChar c) { return insert(pos,&c,1); }
- String &insert(SizeType pos, const StringChar *str);
- String &insert(SizeType pos, const String &str);
- String &insert(SizeType pos, const StringChar *str, SizeType len);
- String &erase(SizeType pos, SizeType len);
- String &replace(SizeType pos, SizeType len, const StringChar *str);
- String &replace(SizeType pos, SizeType len, const String &str);
-
- /// Replace all occurrences of character 'c1' with 'c2'
- String &replace( StringChar c1, StringChar c2 );
- /// Replace all occurrences of StringData 's1' with StringData 's2'
- String &replace(const String &s1, const String &s2);
- String substr( SizeType pos, SizeType len = -1 ) const;
-
- /// Remove leading and trailing whitespace.
- String trim() const;
-
- /// Replace all characters that need to be escaped for the string to be a valid string literal with their
- /// respective escape sequences.
- String expandEscapes() const;
-
- /// Replace all escape sequences in with their respective character codes.
- String collapseEscapes() const;
-
- /// Split the string into its components separated by the given delimiter.
- void split( const char* delimiter, Vector< String >& outElements ) const;
-
- /// Return true if the string starts with the given text.
- bool startsWith( const char* text ) const;
-
- /// Return true if the string ends with the given text.
- bool endsWith( const char* text ) const;
- operator const StringChar*() const { return c_str(); }
- StringChar operator []( U32 i ) const { return c_str()[i]; }
- StringChar operator []( S32 i ) const { return c_str()[i]; }
- bool operator==(const String &str) const;
- bool operator!=(const String &str) const { return !(*this == str); }
- bool operator==( StringChar c ) const;
- bool operator!=( StringChar c ) const { return !(*this == c); }
- bool operator<(const String &str) const;
- bool operator>(const String &str) const;
- bool operator<=(const String &str) const;
- bool operator>=(const String &str) const;
- friend String operator+(const String &a, StringChar c);
- friend String operator+(StringChar c, const String &a);
- friend String operator+(const String &a, const StringChar *b);
- friend String operator+(const String &a, const String &b);
- friend String operator+(const StringChar *a, const String &b);
- public:
- /// @name String Utility routines
- /// @{
- static String ToString(const char *format, ...);
- static String VToString(const char* format, va_list args);
- static String ToString( bool v );
- static inline String ToString( U32 v ) { return ToString( "%u", v ); }
- static inline String ToString( S32 v ) { return ToString( "%d", v ); }
- static inline String ToString( F32 v ) { return ToString( "%g", v ); }
- static inline String ToString( F64 v ) { return ToString( "%Lg", v ); }
- static String SpanToString(const char* start, const char* end);
- static String ToLower(const String &string);
- static String ToUpper(const String &string);
- static String GetTrailingNumber(const char* str, S32& number);
- static String GetFirstNumber(const char* str, U32& startPos, U32& endPos);
- /// @}
- /// @name Interning
- ///
- /// Interning maps identical strings to unique instances so that equality
- /// amounts to simple pointer comparisons.
- ///
- /// Note that using interned strings within global destructors is not safe
- /// as table destruction runs within this phase as well. Uses o interned
- /// strings in global destructors is thus dependent on object file ordering.
- ///
- /// Also, interned strings are not reference-counted. Once interned, a
- /// string will persist until shutdown. This is to avoid costly concurrent
- /// reference counting that would otherwise be necessary.
- ///
- /// @{
-
- /// Return the interned version of the string.
- /// @note Interning is case-sensitive.
- String intern() const;
-
- /// Return true if this string is interned.
- bool isInterned() const;
-
- /// @}
- /** An internal support class for ToString().
- StrFormat manages the formatting of arbitrary length strings.
- The class starts with a default internal fixed size buffer and
- moves to dynamic allocation from the heap when that is exceeded.
- Constructing the class on the stack will result in its most
- efficient use. This class is meant to be used as a helper class,
- and not for the permanent storage of string data.
- @code
- char* indexString(U32 index)
- {
- StrFormat format("Index: %d",index);
- char* str = new char[format.size()];
- format.copy(str);
- return str;
- }
- @endcode
- */
- class StrFormat
- {
- public:
- StrFormat()
- : _dynamicBuffer( NULL ),
- _dynamicSize( 0 ),
- _len( 0 )
- {
- strncpy(_fixedBuffer, "", 2048);
- }
- StrFormat(const char *formatStr, va_list args)
- : _dynamicBuffer( NULL ),
- _dynamicSize( 0 ),
- _len( 0 )
- {
- format(formatStr, args);
- }
- ~StrFormat();
- S32 format( const char *format, va_list args );
- S32 formatAppend( const char *format, va_list args );
- S32 append(const char * str, S32 len);
- S32 append(const char * str);
- String getString() { return String(c_str(),_len); }
- const char * c_str() const { return _dynamicBuffer ? _dynamicBuffer : _fixedBuffer; }
- void reset()
- {
- _len = 0;
- strncpy(_fixedBuffer, "", 2048);
- }
- /// Copy the formatted string into the output buffer which must be at least size() characters.
- char *copy(char* buffer) const;
- /// Return the length of the formated string (does not include the terminating 0)
- U32 length() const { return _len; };
- public:
- char _fixedBuffer[2048]; //< Fixed size buffer
- char *_dynamicBuffer; //< Temporary format buffer
- U32 _dynamicSize; //< Dynamic buffer size
- U32 _len; //< Len of the formatted string
- };
- private:
- String(StringData *str)
- : _string( str ) {}
- // Generate compile error if operator bool is used. Without this we use
- // operator const char *, which is always true...including operator bool
- // causes an ambiguous cast compile error. Making it private is simply
- // more insurance that it isn't used on different compilers.
- // NOTE: disable on GCC since it causes hyper casting to U32 on gcc.
- #if !defined(TORQUE_COMPILER_GCC) && !defined(__clang__)
- operator const bool() const { return false; }
- #endif
- static void copy(StringChar *dst, const StringChar *src, U32 size);
- StringData *_string;
- };
- // Utility class for formatting strings.
- class StringBuilder
- {
- protected:
- ///
- String::StrFormat mFormat;
- public:
- StringBuilder() {}
-
- U32 length() const
- {
- return mFormat.length();
- }
-
- void copy( char* buffer ) const
- {
- mFormat.copy( buffer );
- }
- const char* data() const
- {
- return mFormat.c_str();
- }
- String end()
- {
- return mFormat.getString();
- }
- S32 append( char ch )
- {
- char str[2];
- str[0]=ch;
- str[1]='\0';
- return mFormat.append(str);
- }
- S32 append( const char* str )
- {
- return mFormat.append(str);
- }
- S32 append( const String& str )
- {
- return mFormat.append( str.c_str(), str.length() );
- }
- S32 append( const char* str, U32 length )
- {
- return mFormat.append(str,length);
- }
- S32 format( const char* fmt, ... )
- {
- va_list args;
- va_start(args, fmt);
- return mFormat.formatAppend(fmt, args);
- }
- };
- // For use in hash tables and the like for explicitly requesting case sensitive hashing.
- // Meant to only appear in hash table definition (casting will take care of the rest).
- class StringCase : public String
- {
- public:
- StringCase() : String() {}
- StringCase(const String & s) : String(s) {}
- };
- // For use in hash tables and the like for explicitly requesting case insensitive hashing.
- // Meant to only appear in hash table definition (casting will take care of the rest).
- class StringNoCase : public String
- {
- public:
- StringNoCase() : String() {}
- StringNoCase(const String & s) : String(s) {}
- };
- class FileName : public String
- {
- public:
- FileName() : String() {}
- FileName(const String & s) : String(s) {}
- FileName & operator=(const String & s) { String::operator=(s); return *this; }
- };
- //-----------------------------------------------------------------------------
- extern String operator+(const String &a, StringChar c);
- extern String operator+(StringChar c, const String &a);
- extern String operator+(const String &a, const StringChar *b);
- extern String operator+(const String &a, const String &b);
- extern String operator+(const StringChar *a, const String &b);
- #endif
|