BsDataStream.cpp 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473
  1. //********************************** Banshee Engine (www.banshee3d.com) **************************************************//
  2. //**************** Copyright (c) 2016 Marko Pintera ([email protected]). All rights reserved. **********************//
  3. #include "BsDataStream.h"
  4. #include <codecvt>
  5. namespace BansheeEngine
  6. {
/**
 * Definition of the static DataStream::StreamTempSize member, initialized to 128.
 * NOTE(review): presumably the size (in bytes) of a temporary buffer; it is not referenced in the code visible
 * here - confirm against the class declaration.
 */
const UINT32 DataStream::StreamTempSize = 128;
  8. /** Checks does the provided buffer has an UTF32 byte order mark in little endian order. */
  9. bool isUTF32LE(const UINT8* buffer)
  10. {
  11. return buffer[0] == 0xFF && buffer[1] == 0xFE && buffer[2] == 0x00 && buffer[3] == 0x00;
  12. }
  13. /** Checks does the provided buffer has an UTF32 byte order mark in big endian order. */
  14. bool isUTF32BE(const UINT8* buffer)
  15. {
  16. return buffer[0] == 0x00 && buffer[1] == 0x00 && buffer[2] == 0xFE && buffer[3] == 0xFF;
  17. }
  18. /** Checks does the provided buffer has an UTF16 byte order mark in little endian order. */
  19. bool isUTF16LE(const UINT8* buffer)
  20. {
  21. return buffer[0] == 0xFF && buffer[1] == 0xFE;
  22. }
  23. /** Checks does the provided buffer has an UTF16 byte order mark in big endian order. */
  24. bool isUTF16BE(const UINT8* buffer)
  25. {
  26. return buffer[0] == 0xFE && buffer[1] == 0xFF;
  27. }
  28. /** Checks does the provided buffer has an UTF8 byte order mark. */
  29. bool isUTF8(const UINT8* buffer)
  30. {
  31. return (buffer[0] == 0xEF && buffer[1] == 0xBB && buffer[2] == 0xBF);
  32. }
  33. template <typename T> DataStream& DataStream::operator>> (T& val)
  34. {
  35. read(static_cast<void*>(&val), sizeof(T));
  36. return *this;
  37. }
  38. void DataStream::writeString(const String& string, StringEncoding encoding)
  39. {
  40. if (encoding == StringEncoding::UTF16)
  41. {
  42. const std::codecvt_mode convMode = (std::codecvt_mode)(std::generate_header);
  43. typedef std::codecvt_utf8_utf16<char, 1114111, convMode> UTF8ToUTF16Conv;
  44. std::wstring_convert<UTF8ToUTF16Conv, char> conversion("?");
  45. std::string encodedString = conversion.from_bytes(string.c_str());
  46. write(encodedString.data(), encodedString.length());
  47. }
  48. else
  49. {
  50. write(string.data(), string.length());
  51. }
  52. }
  53. void DataStream::writeString(const WString& string, StringEncoding encoding)
  54. {
  55. if (encoding == StringEncoding::UTF16)
  56. {
  57. const std::codecvt_mode convMode = (std::codecvt_mode)(std::generate_header | std::little_endian);
  58. typedef std::codecvt_utf16<wchar_t, 1114111, convMode> WCharToUTF16Conv;
  59. std::wstring_convert<WCharToUTF16Conv, wchar_t> conversion("?");
  60. std::string encodedString = conversion.to_bytes(string.c_str());
  61. write(encodedString.data(), encodedString.length());
  62. }
  63. else
  64. {
  65. const std::codecvt_mode convMode = (std::codecvt_mode)(std::generate_header);
  66. typedef std::codecvt_utf8<wchar_t, 1114111, convMode> WCharToUTF8Conv;
  67. std::wstring_convert<WCharToUTF8Conv, wchar_t> conversion("?");
  68. std::string encodedString = conversion.to_bytes(string.c_str());
  69. write(encodedString.data(), encodedString.length());
  70. }
  71. }
  72. String DataStream::getAsString()
  73. {
  74. // Read the entire buffer - ideally in one read, but if the size of
  75. // the buffer is unknown, do multiple fixed size reads.
  76. size_t bufSize = (mSize > 0 ? mSize : 4096);
  77. std::stringstream::char_type* tempBuffer = (std::stringstream::char_type*)bs_alloc((UINT32)bufSize);
  78. // Ensure read from begin of stream
  79. seek(0);
  80. std::stringstream result;
  81. while (!eof())
  82. {
  83. size_t numReadBytes = read(tempBuffer, bufSize);
  84. result.write(tempBuffer, numReadBytes);
  85. }
  86. free(tempBuffer);
  87. std::string string = result.str();
  88. UINT32 readBytes = (UINT32)string.size();
  89. if (readBytes >= 4)
  90. {
  91. if (isUTF32LE((UINT8*)string.data()))
  92. {
  93. const std::codecvt_mode convMode = (std::codecvt_mode)(std::consume_header | std::little_endian);
  94. typedef std::codecvt_utf8<UINT32, 1114111, convMode> utf8utf32;
  95. std::wstring_convert<utf8utf32, UINT32> conversion("?");
  96. UINT32* start = (UINT32*)string.data();
  97. UINT32* end = (start + (string.size() - 1) / 4);
  98. return conversion.to_bytes(start, end).c_str();
  99. }
  100. else if (isUTF32BE((UINT8*)string.data()))
  101. {
  102. const std::codecvt_mode convMode = (std::codecvt_mode)(std::consume_header);
  103. typedef std::codecvt_utf8<UINT32, 1114111, convMode> utf8utf32;
  104. std::wstring_convert<utf8utf32, UINT32> conversion("?");
  105. UINT32* start = (UINT32*)string.data();
  106. UINT32* end = (start + (string.size() - 1) / 4);
  107. return conversion.to_bytes(start, end).c_str();
  108. }
  109. }
  110. if (readBytes >= 3)
  111. {
  112. if (isUTF8((UINT8*)string.data()))
  113. {
  114. return string.c_str() + 3;
  115. }
  116. }
  117. if (readBytes >= 2)
  118. {
  119. if (isUTF16LE((UINT8*)string.data()))
  120. {
  121. const std::codecvt_mode convMode = (std::codecvt_mode)(std::little_endian);
  122. typedef std::codecvt_utf8_utf16<UINT16, 1114111, convMode> utf8utf16;
  123. std::wstring_convert<utf8utf16, UINT16> conversion("?");
  124. UINT16* start = (UINT16*)(string.c_str() + 2); // Bug?: std::consume_header seems to be ignored so I manually remove the header
  125. return conversion.to_bytes(start).c_str();
  126. }
  127. else if (isUTF16BE((UINT8*)string.data()))
  128. {
  129. const std::codecvt_mode convMode = (std::codecvt_mode)(0);
  130. typedef std::codecvt_utf8_utf16<UINT16, 1114111, convMode> utf8utf16;
  131. // Bug?: Regardless of not providing the std::little_endian flag it seems that is how the data is read
  132. // so I manually flip it
  133. UINT32 numChars = (UINT32)(string.size() - 2) / 2;
  134. for (UINT32 i = 0; i < numChars; i++)
  135. std::swap(string[i * 2 + 0], string[i * 2 + 1]);
  136. std::wstring_convert<utf8utf16, UINT16> conversion("?");
  137. UINT16* start = (UINT16*)(string.c_str() + 2); // Bug?: std::consume_header seems to be ignored so I manually remove the header
  138. return conversion.to_bytes(start).c_str();
  139. }
  140. }
  141. return string.c_str();
  142. }
  143. WString DataStream::getAsWString()
  144. {
  145. // Read the entire buffer - ideally in one read, but if the size of
  146. // the buffer is unknown, do multiple fixed size reads.
  147. size_t bufSize = (mSize > 0 ? mSize : 4096);
  148. std::stringstream::char_type* tempBuffer = (std::stringstream::char_type*)bs_alloc((UINT32)bufSize);
  149. // Ensure read from begin of stream
  150. seek(0);
  151. std::stringstream result;
  152. while (!eof())
  153. {
  154. size_t numReadBytes = read(tempBuffer, bufSize);
  155. result.write(tempBuffer, numReadBytes);
  156. }
  157. free(tempBuffer);
  158. std::string string = result.str();
  159. UINT32 readBytes = (UINT32)string.size();
  160. if (readBytes >= 4)
  161. {
  162. if (isUTF32LE((UINT8*)string.data()))
  163. {
  164. // Not supported
  165. }
  166. else if (isUTF32BE((UINT8*)string.data()))
  167. {
  168. // Not supported
  169. }
  170. }
  171. if (readBytes >= 3)
  172. {
  173. if (isUTF8((UINT8*)string.data()))
  174. {
  175. const std::codecvt_mode convMode = (std::codecvt_mode)(std::consume_header);
  176. typedef std::codecvt_utf8<wchar_t, 1114111, convMode> wcharutf8;
  177. std::wstring_convert<wcharutf8> conversion("?");
  178. return conversion.from_bytes(string).c_str();
  179. }
  180. }
  181. if (readBytes >= 2)
  182. {
  183. if (isUTF16LE((UINT8*)string.data()))
  184. {
  185. const std::codecvt_mode convMode = (std::codecvt_mode)(std::consume_header | std::little_endian);
  186. typedef std::codecvt_utf16<wchar_t, 1114111, convMode> wcharutf16;
  187. std::wstring_convert<wcharutf16> conversion("?");
  188. return conversion.from_bytes(string).c_str();
  189. }
  190. else if (isUTF16BE((UINT8*)string.data()))
  191. {
  192. const std::codecvt_mode convMode = (std::codecvt_mode)(std::consume_header);
  193. typedef std::codecvt_utf16<wchar_t, 1114111, convMode> wcharutf16;
  194. std::wstring_convert<wcharutf16> conversion("?");
  195. return conversion.from_bytes(string).c_str();
  196. }
  197. }
  198. {
  199. const std::codecvt_mode convMode = (std::codecvt_mode)(std::consume_header);
  200. typedef std::codecvt_utf8<wchar_t, 1114111, convMode> wcharutf8;
  201. std::wstring_convert<wcharutf8> conversion("?");
  202. return conversion.from_bytes(string).c_str();
  203. }
  204. }
  205. MemoryDataStream::MemoryDataStream(void* memory, size_t inSize)
  206. : DataStream(READ | WRITE), mData(nullptr)
  207. {
  208. mData = mPos = static_cast<UINT8*>(memory);
  209. mSize = inSize;
  210. mEnd = mData + mSize;
  211. assert(mEnd >= mPos);
  212. }
  213. MemoryDataStream::MemoryDataStream(DataStream& sourceStream)
  214. : DataStream(READ | WRITE), mData(nullptr)
  215. {
  216. // Copy data from incoming stream
  217. mSize = sourceStream.size();
  218. mData = (UINT8*)bs_alloc((UINT32)mSize);
  219. mPos = mData;
  220. mEnd = mData + sourceStream.read(mData, mSize);
  221. assert(mEnd >= mPos);
  222. }
  223. MemoryDataStream::MemoryDataStream(const SPtr<DataStream>& sourceStream)
  224. :DataStream(READ | WRITE), mData(nullptr)
  225. {
  226. // Copy data from incoming stream
  227. mSize = sourceStream->size();
  228. mData = (UINT8*)bs_alloc((UINT32)mSize);
  229. mPos = mData;
  230. mEnd = mData + sourceStream->read(mData, mSize);
  231. assert(mEnd >= mPos);
  232. }
  233. MemoryDataStream::~MemoryDataStream()
  234. {
  235. close();
  236. }
  237. size_t MemoryDataStream::read(void* buf, size_t count)
  238. {
  239. size_t cnt = count;
  240. if (mPos + cnt > mEnd)
  241. cnt = mEnd - mPos;
  242. if (cnt == 0)
  243. return 0;
  244. assert (cnt <= count);
  245. memcpy(buf, mPos, cnt);
  246. mPos += cnt;
  247. return cnt;
  248. }
  249. size_t MemoryDataStream::write(const void* buf, size_t count)
  250. {
  251. size_t written = 0;
  252. if (isWriteable())
  253. {
  254. written = count;
  255. if (mPos + written > mEnd)
  256. written = mEnd - mPos;
  257. if (written == 0)
  258. return 0;
  259. memcpy(mPos, buf, written);
  260. mPos += written;
  261. }
  262. return written;
  263. }
  264. void MemoryDataStream::skip(size_t count)
  265. {
  266. size_t newpos = (size_t)( (mPos - mData) + count );
  267. assert(mData + newpos <= mEnd);
  268. mPos = mData + newpos;
  269. }
  270. void MemoryDataStream::seek(size_t pos)
  271. {
  272. assert(mData + pos <= mEnd);
  273. mPos = mData + pos;
  274. }
  275. size_t MemoryDataStream::tell() const
  276. {
  277. return mPos - mData;
  278. }
  279. bool MemoryDataStream::eof() const
  280. {
  281. return mPos >= mEnd;
  282. }
  283. void MemoryDataStream::close()
  284. {
  285. if (mData != nullptr)
  286. {
  287. bs_free(mData);
  288. mData = nullptr;
  289. }
  290. }
  291. FileDataStream::FileDataStream(SPtr<std::ifstream> s, bool freeOnClose)
  292. : DataStream(READ), mpInStream(s), mpFStreamRO(s), mpFStream(0), mFreeOnClose(freeOnClose)
  293. {
  294. mpInStream->seekg(0, std::ios_base::end);
  295. mSize = (size_t)mpInStream->tellg();
  296. mpInStream->seekg(0, std::ios_base::beg);
  297. determineAccess();
  298. }
  299. FileDataStream::FileDataStream(SPtr<std::ifstream> s, size_t inSize, bool freeOnClose)
  300. : DataStream(READ), mpInStream(s), mpFStreamRO(s), mpFStream(0), mFreeOnClose(freeOnClose)
  301. {
  302. mSize = inSize;
  303. determineAccess();
  304. }
  305. FileDataStream::FileDataStream(SPtr<std::fstream> s, bool freeOnClose)
  306. : DataStream(READ | WRITE), mpInStream(s), mpFStreamRO(0), mpFStream(s), mFreeOnClose(freeOnClose)
  307. {
  308. mpInStream->seekg(0, std::ios_base::end);
  309. mSize = (size_t)mpInStream->tellg();
  310. mpInStream->seekg(0, std::ios_base::beg);
  311. determineAccess();
  312. }
  313. FileDataStream::FileDataStream(SPtr<std::fstream> s, size_t inSize, bool freeOnClose)
  314. : DataStream(READ | WRITE), mpInStream(s), mpFStreamRO(0), mpFStream(s), mFreeOnClose(freeOnClose)
  315. {
  316. mSize = inSize;
  317. determineAccess();
  318. }
  319. void FileDataStream::determineAccess()
  320. {
  321. mAccess = 0;
  322. if (mpInStream)
  323. mAccess |= READ;
  324. if (mpFStream)
  325. mAccess |= WRITE;
  326. }
  327. FileDataStream::~FileDataStream()
  328. {
  329. close();
  330. }
  331. size_t FileDataStream::read(void* buf, size_t count)
  332. {
  333. mpInStream->read(static_cast<char*>(buf), static_cast<std::streamsize>(count));
  334. return (size_t)mpInStream->gcount();
  335. }
  336. size_t FileDataStream::write(const void* buf, size_t count)
  337. {
  338. size_t written = 0;
  339. if (isWriteable() && mpFStream)
  340. {
  341. mpFStream->write(static_cast<const char*>(buf), static_cast<std::streamsize>(count));
  342. written = count;
  343. }
  344. return written;
  345. }
  346. void FileDataStream::skip(size_t count)
  347. {
  348. mpInStream->clear(); // Clear fail status in case eof was set
  349. mpInStream->seekg(static_cast<std::ifstream::pos_type>(count), std::ios::cur);
  350. }
  351. void FileDataStream::seek(size_t pos)
  352. {
  353. mpInStream->clear(); // Clear fail status in case eof was set
  354. mpInStream->seekg(static_cast<std::streamoff>(pos), std::ios::beg);
  355. }
  356. size_t FileDataStream::tell() const
  357. {
  358. mpInStream->clear(); // Clear fail status in case eof was set
  359. return (size_t)mpInStream->tellg();
  360. }
  361. bool FileDataStream::eof() const
  362. {
  363. return mpInStream->eof();
  364. }
  365. void FileDataStream::close()
  366. {
  367. if (mpInStream)
  368. {
  369. if (mpFStreamRO)
  370. mpFStreamRO->close();
  371. if (mpFStream)
  372. {
  373. mpFStream->flush();
  374. mpFStream->close();
  375. }
  376. if (mFreeOnClose)
  377. {
  378. mpInStream = nullptr;
  379. mpFStreamRO = nullptr;
  380. mpFStream = nullptr;
  381. }
  382. }
  383. }
  384. }