| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298 |
- <!DOCTYPE html PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN"><html><head>
- <meta http-equiv="content-type" content="text/html; charset=ISO-8859-1">
- <title>EAString</title>
- <link type="text/css" rel="stylesheet" href="UTFDoc.css">
- <meta name="author" content="Paul Pedriana">
- </head>
- <body bgcolor="#FFFFFF">
- <h1>EAString</h1>
- <h2>Introduction</h2>
- <p>EAString implements an extensive suite of C string functionality from &lt;string.h&gt; in a portable way. Much of this functionality is the same as what
- is present in the C standard and in common (but non-portable) extensions to the C standard. EAString presents a consistent portable interface to its functionality
- in both 8 bit and 16 bit string form.</p>
- <p>The C language provides various functions which work with non-portable data types, such as long. EAString defines all significant data types in terms of portable
- types such as int32_t and int64_t. Additionally, the EAString versions of functions are usually faster than the C runtime library versions, usually because the EAString versions minimize cache misses
- and branching, whereas typical C runtime libraries optimize for the smallest memory footprint with little or no regard to other performance characteristics. Also, the EAString functions do not implement locale-specific functionality and thus save time and space as a result. Other packages within EA implement localization functionality in a way that is better suited to high performance game development.</p>
- <p>C-style printf functionality is separate from EAString and is found in <a href="EASprintf.html">EASprintf</a>. Memcpy functionality (which comes from the &lt;string.h&gt;
- header file) is present in <a href="EAMemory.html">EAMemory</a>. </p>
- <h2>Extension functions</h2>
- <p> EAString provides extended functionality that isn't found in conventional C libraries, but is useful nevertheless.</p>
- <table width="100%" border="1" cellpadding="3">
- <tr>
- <td><b>Function</b></td>
- <td><b>Description</b></td>
- <td><b>Signature</b></td>
- </tr>
- <tr>
- <td>Strlcat</td>
- <td>Safe variation of strncat</td>
- <td><font size="-1">char_t* Strlcat(char_t* pDestination, const char_t* pSource, size_t n); </font></td>
- </tr>
- <tr>
- <td>Strlcpy</td>
- <td>Safe variation of strcpy</td>
- <td><p><font size="-1">char_t* Strlcpy(char_t* pDestination, const char_t* pSource, size_t n); <br>
- int Strlcpy(char16_t* pDestination, const char8_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);<br>
- int Strlcpy(char32_t* pDestination, const char8_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);<br>
- int Strlcpy(char8_t* pDestination, const char16_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);<br>
- int Strlcpy(char32_t* pDestination, const char16_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);<br>
- int Strlcpy(char8_t* pDestination, const char32_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);<br>
- int Strlcpy(char16_t* pDestination, const char32_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0); <br>
- int Strlcpy(char8_t* pDestination, const wchar_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);<br>
- int Strlcpy(char16_t* pDestination, const wchar_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0); <br>
- int Strlcpy(char32_t* pDestination, const wchar_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);<br>
- int Strlcpy(wchar_t* pDestination, const char8_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);<br>
- int Strlcpy(wchar_t* pDestination, const char16_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0); <br>
- int Strlcpy(wchar_t* pDestination, const char32_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);<br>
- bool Strlcpy(char16_t* pDestination, const char8_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);<br>
- bool Strlcpy(char32_t* pDestination, const char8_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);<br>
- bool Strlcpy(char8_t* pDestination, const char16_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);<br>
- bool Strlcpy(char32_t* pDestination, const char16_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);<br>
- bool Strlcpy(char8_t* pDestination, const char32_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);<br>
- bool Strlcpy(char16_t* pDestination, const char32_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);<br>
- bool Strlcpy(char8_t* pDestination, const wchar_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);<br>
- bool Strlcpy(char16_t* pDestination, const wchar_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);<br>
- bool Strlcpy(char32_t* pDestination, const wchar_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);<br>
- bool Strlcpy(wchar_t* pDestination, const char8_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);<br>
- bool Strlcpy(wchar_t* pDestination, const char16_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);<br>
- bool Strlcpy(wchar_t* pDestination, const char32_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);
- </font></p>
- </td>
- </tr>
- <tr>
- <td>Stristr</td>
- <td>Case insensitive version of strstr (find string within string)</td>
- <td><font size="-1">char_t* Stristr(const char_t* pString, const char_t* pSubString);</font></td>
- </tr>
- <tr>
- <td>FtoaEnglish</td>
- <td>
- <p>Float to ascii; always use English numeric format, regardless of the current locale.</p>
- </td>
- <td><font size="-1">char_t* FtoaEnglish(double dValue, char_t* pResult, int nInputLength, int nPrecision, bool bExponentEnabled); </font></td>
- </tr>
- <tr>
- <td>AtofEnglish</td>
- <td>Ascii to float; always use English numeric format, regardless of the current locale.</td>
- <td><font size="-1">double AtofEnglish(const char_t* pString); </font></td>
- </tr>
- <tr>
- <td> StrtodEnglish</td>
- <td>Same as strtod, but always use English numeric format, regardless of the current locale.</td>
- <td><font size="-1">double StrtodEnglish(const char_t* pString, char_t** ppStringEnd);</font></td>
- </tr>
- <tr>
- <td>Memset16</td>
- <td>Sets 16 bit values in memory (as opposed to memset's 8 bit values)</td>
- <td><font size="-1">uint16_t* Memset16(void* pDestination, uint16_t c, size_t count); </font></td>
- </tr>
- <tr>
- <td>Memset32</td>
- <td>Sets 32 bit values in memory (as opposed to memset's 8 bit values)</td>
- <td><font size="-1"> uint32_t* Memset32(void* pDestination, uint32_t c, size_t count);</font></td>
- </tr>
- <tr>
- <td>Memset64</td>
- <td>Sets 64 bit values in memory (as opposed to memset's 8 bit values)</td>
- <td><font size="-1">uint64_t* Memset64(void* pDestination, uint64_t c, size_t count);</font></td>
- </tr>
- <tr>
- <td>MemsetN</td>
- <td>Sets arbitrarily sized values in memory.</td>
- <td><font size="-1">void* MemsetN (void* pDestination, const void* pSource, size_t sourceBytes, size_t count); </font></td>
- </tr>
- <tr>
- <td>EcvtBuf</td>
- <td>Base function for converting a float to a %e string.</td>
- <td>
- <p><font size="-1">char_t* EcvtBuf(double dValue, int nDigitCount, int* decimalPos, int* sign, char_t* buffer); </font></p>
- </td>
- </tr>
- <tr>
- <td>FcvtBuf</td>
- <td>Base function for converting a float to a %f string.</td>
- <td><font size="-1">char_t* FcvtBuf(double dValue, int nDigitCountAfterDecimal, int* decimalPos, int* sign, char_t* buffer); </font></td>
- </tr>
- </table>
- <h2>Example usage </h2>
- <p>We provide a random smattering of example code here.</p>
- <pre class="code-example">char16_t buffer[32] = L"hello ";
- Strcat(buffer, L"world");
- </pre>
- <p>Strlcpy, Strlcat:</p>
- <pre class="code-example">char8_t buffer[32];
- Strlcpy(buffer, "Hello ", sizeof(buffer));<br>Strlcat(buffer, "world", sizeof(buffer));
- </pre>
- <p>Strlcpy, used to translate UTF8 to UTF16: </p>
- <pre class="code-example">char8_t buffer8[64];
- char16_t buffer16[64];
- int length16 = Strlcpy(buffer16, buffer8, 64);</pre>
- <p>U64toa:</p>
- <pre class="code-example">char buffer[32];
- U64toa(UINT64_C(12345678901234567890), buffer, 16);
- </pre>
- <p>AtoI32:</p>
- <pre class="code-example">int32_t x = AtoI32("1234567890");
- </pre>
- <p>Strtod:</p>
- <pre class="code-example">const char16_t* pString = L"12345.678 123.456 1.23456";
- while(*pString)
- {
- double value = Strtod(pString, &pString);
- printf("Field = %f\n", value);
- }
- </pre>
- <h2>Interface</h2>
- <p>In each of the functions below, there is a char8_t and a char16_t version. So for Strcat there are the following:</p>
- <blockquote>
- <p><span class="code-example-span">char8_t* Strcat(char8_t* pDestination, const char8_t* pSource)<br>
- </span><span class="code-example-span">char16_t* Strcat(char16_t* pDestination, const char16_t* pSource)</span></p>
- </blockquote>
- <p>The list below may be out of date as you read this, so see EAString.h for a definitive list of supported functionality.</p>
- <pre class="code-example">char_t* Strcat(char_t* pDestination, const char_t* pSource);
- char_t* Strncat(char_t* pDestination, const char_t* pSource, size_t n);
- char_t* Strlcat(char_t* pDestination, const char_t* pSource, size_t n);
- char_t* Strcpy(char_t* pDestination, const char_t* pSource);
- char_t* Strncpy(char_t* pDestination, const char_t* pSource, size_t n);
- char_t* Strlcpy(char_t* pDestination, const char_t* pSource, size_t n);
- int Strlcpy(char16_t* pDestination, const char8_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);
- int Strlcpy(char32_t* pDestination, const char8_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);
- int Strlcpy(char8_t* pDestination, const char16_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);
- int Strlcpy(char32_t* pDestination, const char16_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);
- int Strlcpy(char8_t* pDestination, const char32_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);
- int Strlcpy(char16_t* pDestination, const char32_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);
- int Strlcpy(char8_t* pDestination, const wchar_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);
- int Strlcpy(char16_t* pDestination, const wchar_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);
- int Strlcpy(char32_t* pDestination, const wchar_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);
- int Strlcpy(wchar_t* pDestination, const char8_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);
- int Strlcpy(wchar_t* pDestination, const char16_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);
- int Strlcpy(wchar_t* pDestination, const char32_t* pSource, size_t nDestCapacity, size_t nSourceLength = (size_t)~0);
- bool Strlcpy(char16_t* pDestination, const char8_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);
- bool Strlcpy(char32_t* pDestination, const char8_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);
- bool Strlcpy(char8_t* pDestination, const char16_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);
- bool Strlcpy(char32_t* pDestination, const char16_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);
- bool Strlcpy(char8_t* pDestination, const char32_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);
- bool Strlcpy(char16_t* pDestination, const char32_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);
- bool Strlcpy(char8_t* pDestination, const wchar_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);
- bool Strlcpy(char16_t* pDestination, const wchar_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);
- bool Strlcpy(char32_t* pDestination, const wchar_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);
- bool Strlcpy(wchar_t* pDestination, const char8_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);
- bool Strlcpy(wchar_t* pDestination, const char16_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);
- bool Strlcpy(wchar_t* pDestination, const char32_t* pSource, size_t nDestCapacity, size_t nSourceLength, size_t& nDestUsed, size_t& nSourceUsed);
- size_t Strlen(const char_t* pString);
- size_t Strxfrm(char_t* pDest, const char_t* pSource, size_t n);
- char_t* Strdup(const char_t* pString);
- char_t* Strlwr(char_t* pString);
- char_t* Strupr(char_t* pString);
- char_t* Strchr(const char_t* pString, char_t c);
- size_t Strcspn(const char_t* pString1, const char_t* pString2);
- char_t* Strpbrk(const char_t* pString1, const char_t* pString2);
- char_t* Strrchr(const char_t* pString, char_t c);
- size_t Strspn(const char_t* pString, const char_t* pSubString);
- char_t* Strstr(const char_t* pString, const char_t* pSubString);
- char_t* Stristr(const char_t* pString, const char_t* pSubString);
- char_t* Strtok(char_t* pString, const char_t* pTokens, char_t** pContext);
- char_t* Strset(char_t* pString, char_t c);
- char_t* Strnset(char_t* pString, char_t c, size_t n);
- char_t* Strrev(char_t* pString);
- int Strcmp(const char_t* pString1, const char_t* pString2);
- int Strncmp(const char_t* pString1, const char_t* pString2, size_t n);
- int Stricmp(const char_t* pString1, const char_t* pString2);
- int Strnicmp(const char_t* pString1, const char_t* pString2, size_t n);
- int Strcoll(const char_t* pString1, const char_t* pString2);
- int Strncoll(const char_t* pString1, const char_t* pString2, size_t n);
- int Stricoll(const char_t* pString1, const char_t* pString2);
- int Strnicoll(const char_t* pString1, const char_t* pString2, size_t n);
- char_t* EcvtBuf(double dValue, int nDigitCount, int* decimalPos, int* sign, char_t* buffer);
- char_t* FcvtBuf(double dValue, int nDigitCountAfterDecimal, int* decimalPos, int* sign, char_t* buffer);
- char_t* I32toa(int32_t nValue, char_t* pResult, int nBase);
- char_t* U32toa(uint32_t nValue, char_t* pResult, int nBase);
- char_t* I64toa(int64_t nValue, char_t* pBuffer, int nBase);
- char_t* U64toa(uint64_t nValue, char_t* pBuffer, int nBase);
- double Strtod(const char_t* pString, char_t** ppStringEnd);
- double StrtodEnglish(const char_t* pString, char_t** ppStringEnd);
- int64_t StrtoI64(const char_t* pString, char_t** ppStringEnd, int nBase);
- uint64_t StrtoU64(const char_t* pString, char_t** ppStringEnd, int nBase);
- int32_t StrtoI32(const char_t* pString, char_t** ppStringEnd, int nBase);
- uint32_t StrtoU32(const char_t* pString, char_t** ppStringEnd, int nBase);
- int32_t AtoI32(const char_t* pString);
- uint32_t AtoU32(const char_t* pString);
- int64_t AtoI64(const char_t* pString);
- uint64_t AtoU64(const char_t* pString);
- double Atof(const char_t* pString);
- double AtofEnglish(const char_t* pString);
- char_t* Ftoa(double dValue, char_t* pResult, int nInputLength, int nPrecision, bool bExponentEnabled);
- char_t* FtoaEnglish(double dValue, char_t* pResult, int nInputLength, int nPrecision, bool bExponentEnabled);
- </pre>
- <h2>Encoded Strlcpy Issue </h2>
- <p>The Strlcpy function <span class="code-example-comment"> int Strlcpy(char16_t* pDestination, const char8_t* pSource, size_t nDestCapacity, size_t nSourceLength)</span> converts UTF8 text (char8_t) to UCS2 (char16_t). It doesn't work if your pSource string isn't truly UTF8-encoded. Typically this would happen because the source string is using Windows code page 1252 or HTML's ISO 8859-1. All 8 bit strings in EAStdC are assumed to be UTF8 unless specifically documented otherwise. </p>
- <p>Any 8 bit text that's not UTF8 has to be defined within the context of a code page; otherwise any chars above 127 have an arbitrary meaning, and may include multi-byte characters for some code pages. If you need to convert code page 1252 to UCS2, you need to implement a function which uses a table that maps the high byte values into their proper Unicode values. It's not so simple to just cast the byte value to char16_t, as some of the code page 1252 characters don't map directly to their numerical values in Unicode, though ISO 8859-1 characters do map completely to their equivalent Unicode values. </p>
- <p>The following is an implementation of Strcpy and Strlcpy for ISO 8859-1 char8_t text which isn't currently part of EAStdC: </p>
- <p class="code-example">char16_t* StrcpyISO8859_1(char16_t* pDestination, const char8_t* pSource)<br>
- {<br>
- char16_t* pDestSaved = pDestination;<br>
- <br>
- while(*pSource)<br>
- *(pDestination++) = (uint8_t)*pSource++;<br>
- <br>
- *pDestination = 0;<br>
- <br>
- return pDestSaved;<br>
- }</p>
- <p> </p>
- <p class="code-example">size_t StrlcpyISO8859_1(char16_t* pDestination, const char8_t* pSource, size_t nDestCapacity)<br>
- {<br>
- const char8_t* s = pSource;<br>
- size_t n = nDestCapacity;<br>
- <br>
- if(n && --n)<br>
- {<br>
- do{<br>
- if((*pDestination++ = (uint8_t)*s++) == 0)<br>
- break;<br>
- } while(--n);<br>
- }<br>
- <br>
- if(!n)<br>
- {<br>
- if(nDestCapacity)<br>
- *pDestination = 0;<br>
- <br>
- while(*s++) // Step past the terminating 0, as the return expression below expects.<br>
- { }<br>
- }<br>
- <br>
- return (s - pSource - 1);<br>
- }</p>
- <hr>
- <p> </p>
- <p> </p>
- <p> </p>
- <p> </p>
- <p> </p>
- <p> </p>
- <p> </p>
- <p> </p>
- <p> </p>
- <p> </p>
- <p> </p>
- <p> </p>
- <p> </p>
- <p> </p>
- </body>
- </html>
|