| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905 |
- //
- // UTF8EncodingTest.cs - NUnit Test Cases for System.Text.UTF8Encoding
- //
- // Authors:
- // Patrick Kalkman [email protected]
- // Sebastien Pouliot ([email protected])
- //
- // (C) 2003 Patrick Kalkman
- // (C) 2004 Novell (http://www.novell.com)
- //
- using NUnit.Framework;
- using System;
- using System.Text;
- #if NET_2_0
- using DecoderException = System.Text.DecoderFallbackException;
- #else
- using DecoderException = System.ArgumentException;
- #endif
- namespace MonoTests.System.Text {
- [TestFixture]
- public class UTF8EncodingTest : Assertion {
- private UTF8Encoding utf8;
- [SetUp]
- public void Create ()
- {
- utf8 = new UTF8Encoding (true, true);
- }
- [Test]
- public void TestEncodingGetBytes1()
- {
- UTF8Encoding utf8Enc = new UTF8Encoding ();
- string UniCode = "\u0041\u2262\u0391\u002E";
-
- // "A<NOT IDENTICAL TO><ALPHA>." may be encoded as 41 E2 89 A2 CE 91 2E
- // see (RFC 2044)
- byte[] utf8Bytes = utf8Enc.GetBytes (UniCode);
-
- Assertion.AssertEquals ("UTF #1", 0x41, utf8Bytes [0]);
- Assertion.AssertEquals ("UTF #2", 0xE2, utf8Bytes [1]);
- Assertion.AssertEquals ("UTF #3", 0x89, utf8Bytes [2]);
- Assertion.AssertEquals ("UTF #4", 0xA2, utf8Bytes [3]);
- Assertion.AssertEquals ("UTF #5", 0xCE, utf8Bytes [4]);
- Assertion.AssertEquals ("UTF #6", 0x91, utf8Bytes [5]);
- Assertion.AssertEquals ("UTF #7", 0x2E, utf8Bytes [6]);
- }
-
- [Test]
- public void TestEncodingGetBytes2()
- {
- UTF8Encoding utf8Enc = new UTF8Encoding ();
- string UniCode = "\u0048\u0069\u0020\u004D\u006F\u006D\u0020\u263A\u0021";
-
- // "Hi Mom <WHITE SMILING FACE>!" may be encoded as 48 69 20 4D 6F 6D 20 E2 98 BA 21
- // see (RFC 2044)
- byte[] utf8Bytes = new byte [11];
-
- int ByteCnt = utf8Enc.GetBytes (UniCode.ToCharArray(), 0, UniCode.Length, utf8Bytes, 0);
-
- Assertion.AssertEquals ("UTF #1", 11, ByteCnt);
- Assertion.AssertEquals ("UTF #2", 0x48, utf8Bytes [0]);
- Assertion.AssertEquals ("UTF #3", 0x69, utf8Bytes [1]);
- Assertion.AssertEquals ("UTF #4", 0x20, utf8Bytes [2]);
- Assertion.AssertEquals ("UTF #5", 0x4D, utf8Bytes [3]);
- Assertion.AssertEquals ("UTF #6", 0x6F, utf8Bytes [4]);
- Assertion.AssertEquals ("UTF #7", 0x6D, utf8Bytes [5]);
- Assertion.AssertEquals ("UTF #8", 0x20, utf8Bytes [6]);
- Assertion.AssertEquals ("UTF #9", 0xE2, utf8Bytes [7]);
- Assertion.AssertEquals ("UTF #10", 0x98, utf8Bytes [8]);
- Assertion.AssertEquals ("UTF #11", 0xBA, utf8Bytes [9]);
- Assertion.AssertEquals ("UTF #12", 0x21, utf8Bytes [10]);
- }
-
- [Test]
- public void TestDecodingGetChars1()
- {
- UTF8Encoding utf8Enc = new UTF8Encoding ();
- // 41 E2 89 A2 CE 91 2E may be decoded as "A<NOT IDENTICAL TO><ALPHA>."
- // see (RFC 2044)
- byte[] utf8Bytes = new byte [] {0x41, 0xE2, 0x89, 0xA2, 0xCE, 0x91, 0x2E};
- char[] UniCodeChars = utf8Enc.GetChars(utf8Bytes);
-
- Assertion.AssertEquals ("UTF #1", 0x0041, UniCodeChars [0]);
- Assertion.AssertEquals ("UTF #2", 0x2262, UniCodeChars [1]);
- Assertion.AssertEquals ("UTF #3", 0x0391, UniCodeChars [2]);
- Assertion.AssertEquals ("UTF #4", 0x002E, UniCodeChars [3]);
- }
-
- [Test]
- public void TestMaxCharCount()
- {
- UTF8Encoding UTF8enc = new UTF8Encoding ();
- Assertion.AssertEquals ("UTF #1", 50, UTF8enc.GetMaxCharCount(50));
- }
-
- [Test]
- public void TestMaxByteCount()
- {
- UTF8Encoding UTF8enc = new UTF8Encoding ();
- Assertion.AssertEquals ("UTF #1", 200, UTF8enc.GetMaxByteCount(50));
- }
- // regression for bug #59648
- [Test]
- public void TestThrowOnInvalid ()
- {
- UTF8Encoding u = new UTF8Encoding (true, false);
- byte[] data = new byte [] { 0xC0, 0xAF };
- string s = u.GetString (data);
- AssertEquals (0, s.Length);
- data = new byte [] { 0x30, 0x31, 0xC0, 0xAF, 0x30, 0x32 };
- s = u.GetString (data);
- AssertEquals (4, s.Length);
- AssertEquals (0x30, (int) s [0]);
- AssertEquals (0x31, (int) s [1]);
- AssertEquals (0x30, (int) s [2]);
- AssertEquals (0x32, (int) s [3]);
- }
- // UTF8 decoding tests from http://www.cl.cam.ac.uk/~mgk25/
- [Test]
- public void T1_Correct_GreekWord_kosme ()
- {
- byte[] data = { 0xCE, 0xBA, 0xE1, 0xBD, 0xB9, 0xCF, 0x83, 0xCE, 0xBC, 0xCE, 0xB5 };
- string s = utf8.GetString (data);
- // cute but saving source code in unicode can be problematic
- // so we just ensure we can re-encode this
- AssertEquals ("Reconverted", BitConverter.ToString (data), BitConverter.ToString (utf8.GetBytes (s)));
- }
- [Test]
- public void T2_Boundary_1_FirstPossibleSequence_Pass ()
- {
- byte[] data211 = { 0x00 };
- string s = utf8.GetString (data211);
- AssertEquals ("1 byte (U-00000000)", "\0", s);
- AssertEquals ("Reconverted-1", BitConverter.ToString (data211), BitConverter.ToString (utf8.GetBytes (s)));
- byte[] data212 = { 0xC2, 0x80 };
- s = utf8.GetString (data212);
- AssertEquals ("2 bytes (U-00000080)", 128, s [0]);
- AssertEquals ("Reconverted-2", BitConverter.ToString (data212), BitConverter.ToString (utf8.GetBytes (s)));
- byte[] data213 = { 0xE0, 0xA0, 0x80 };
- s = utf8.GetString (data213);
- AssertEquals ("3 bytes (U-00000800)", 2048, s [0]);
- AssertEquals ("Reconverted-3", BitConverter.ToString (data213), BitConverter.ToString (utf8.GetBytes (s)));
- byte[] data214 = { 0xF0, 0x90, 0x80, 0x80 };
- s = utf8.GetString (data214);
- AssertEquals ("4 bytes (U-00010000)-0", 55296, s [0]);
- AssertEquals ("4 bytes (U-00010000)-1", 56320, s [1]);
- AssertEquals ("Reconverted-4", BitConverter.ToString (data214), BitConverter.ToString (utf8.GetBytes (s)));
- }
- [Test]
- // Fail on MS Fx 1.1
- [ExpectedException (typeof (DecoderException))]
- public void T2_Boundary_1_FirstPossibleSequence_Fail_5 ()
- {
- byte[] data215 = { 0xF8, 0x88, 0x80, 0x80, 0x80 };
- string s = utf8.GetString (data215);
- AssertNull ("5 bytes (U-00200000)", s);
- AssertEquals ("Reconverted-5", BitConverter.ToString (data215), BitConverter.ToString (utf8.GetBytes (s)));
- }
- [Test]
- // Fail on MS Fx 1.1
- [ExpectedException (typeof (DecoderException))]
- public void T2_Boundary_1_FirstPossibleSequence_Fail_6 ()
- {
- byte[] data216 = { 0xFC, 0x84, 0x80, 0x80, 0x80, 0x80 };
- string s = utf8.GetString (data216);
- AssertNull ("6 bytes (U-04000000)", s);
- AssertEquals ("Reconverted-6", BitConverter.ToString (data216), BitConverter.ToString (utf8.GetBytes (s)));
- }
- [Test]
- public void T2_Boundary_2_LastPossibleSequence_Pass ()
- {
- byte[] data221 = { 0x7F };
- string s = utf8.GetString (data221);
- AssertEquals ("1 byte (U-0000007F)", 127, s [0]);
- AssertEquals ("Reconverted-1", BitConverter.ToString (data221), BitConverter.ToString (utf8.GetBytes (s)));
- byte[] data222 = { 0xDF, 0xBF };
- s = utf8.GetString (data222);
- AssertEquals ("2 bytes (U-000007FF)", 2047, s [0]);
- AssertEquals ("Reconverted-2", BitConverter.ToString (data222), BitConverter.ToString (utf8.GetBytes (s)));
- byte[] data223 = { 0xEF, 0xBF, 0xBF };
- s = utf8.GetString (data223);
- AssertEquals ("3 bytes (U-0000FFFF)", 65535, s [0]);
- AssertEquals ("Reconverted-3", BitConverter.ToString (data223), BitConverter.ToString (utf8.GetBytes (s)));
- }
- [Test]
- // Fail on MS Fx 1.1
- [ExpectedException (typeof (DecoderException))]
- public void T2_Boundary_2_LastPossibleSequence_Fail_4 ()
- {
- byte[] data224 = { 0x7F, 0xBF, 0xBF, 0xBF };
- string s = utf8.GetString (data224);
- AssertNull ("4 bytes (U-001FFFFF)", s);
- AssertEquals ("Reconverted-4", BitConverter.ToString (data224), BitConverter.ToString (utf8.GetBytes (s)));
- }
- [Test]
- // Fail on MS Fx 1.1
- [ExpectedException (typeof (DecoderException))]
- public void T2_Boundary_2_LastPossibleSequence_Fail_5 ()
- {
- byte[] data225 = { 0xFB, 0xBF, 0xBF, 0xBF, 0xBF };
- string s = utf8.GetString (data225);
- AssertNull ("5 bytes (U-03FFFFFF)", s);
- AssertEquals ("Reconverted-5", BitConverter.ToString (data225), BitConverter.ToString (utf8.GetBytes (s)));
- }
- [Test]
- // Fail on MS Fx 1.1
- [ExpectedException (typeof (DecoderException))]
- public void T2_Boundary_2_LastPossibleSequence_Fail_6 ()
- {
- byte[] data226 = { 0xFD, 0xBF, 0xBF, 0xBF, 0xBF, 0xBF };
- string s = utf8.GetString (data226);
- AssertNull ("6 bytes (U-7FFFFFFF)", s);
- AssertEquals ("Reconverted-6", BitConverter.ToString (data226), BitConverter.ToString (utf8.GetBytes (s)));
- }
- [Test]
- public void T2_Boundary_3_Other_Pass ()
- {
- byte[] data231 = { 0xED, 0x9F, 0xBF };
- string s = utf8.GetString (data231);
- AssertEquals ("U-0000D7FF", 55295, s [0]);
- AssertEquals ("Reconverted-1", BitConverter.ToString (data231), BitConverter.ToString (utf8.GetBytes (s)));
- byte[] data232 = { 0xEE, 0x80, 0x80 };
- s = utf8.GetString (data232);
- AssertEquals ("U-0000E000", 57344, s [0]);
- AssertEquals ("Reconverted-2", BitConverter.ToString (data232), BitConverter.ToString (utf8.GetBytes (s)));
- byte[] data233 = { 0xEF, 0xBF, 0xBD };
- s = utf8.GetString (data233);
- AssertEquals ("U-0000FFFD", 65533, s [0]);
- AssertEquals ("Reconverted-3", BitConverter.ToString (data233), BitConverter.ToString (utf8.GetBytes (s)));
- byte[] data234 = { 0xF4, 0x8F, 0xBF, 0xBF };
- s = utf8.GetString (data234);
- AssertEquals ("U-0010FFFF-0", 56319, s [0]);
- AssertEquals ("U-0010FFFF-1", 57343, s [1]);
- AssertEquals ("Reconverted-4", BitConverter.ToString (data234), BitConverter.ToString (utf8.GetBytes (s)));
- }
- [Test]
- // Fail on MS Fx 1.1
- [ExpectedException (typeof (DecoderException))]
- public void T2_Boundary_3_Other_Fail_5 ()
- {
- byte[] data235 = { 0xF4, 0x90, 0x80, 0x80 };
- string s = utf8.GetString (data235);
- AssertNull ("U-00110000", s);
- AssertEquals ("Reconverted-5", BitConverter.ToString (data235), BitConverter.ToString (utf8.GetBytes (s)));
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_1_UnexpectedContinuation_311 ()
- {
- byte[] data = { 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_1_UnexpectedContinuation_312 ()
- {
- byte[] data = { 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_1_UnexpectedContinuation_313 ()
- {
- byte[] data = { 0x80, 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_1_UnexpectedContinuation_314 ()
- {
- byte[] data = { 0x80, 0xBF, 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_1_UnexpectedContinuation_315 ()
- {
- byte[] data = { 0x80, 0xBF, 0x80, 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_1_UnexpectedContinuation_316 ()
- {
- byte[] data = { 0x80, 0xBF, 0x80, 0xBF, 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_1_UnexpectedContinuation_317 ()
- {
- byte[] data = { 0x80, 0xBF, 0x80, 0xBF, 0x80, 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_1_UnexpectedContinuation_318 ()
- {
- byte[] data = { 0x80, 0xBF, 0x80, 0xBF, 0x80, 0xBF, 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_1_UnexpectedContinuation_319 ()
- {
- // 64 different continuation characters
- byte[] data = {
- 0x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87, 0x88, 0x89, 0x8A, 0x8B, 0x8C, 0x8D, 0x8E, 0x8F,
- 0x90, 0x91, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97, 0x98, 0x99, 0x9A, 0x9B, 0x9C, 0x9D, 0x9E, 0x9F,
- 0xA0, 0xA1, 0xA2, 0xA3, 0xA4, 0xA5, 0xA6, 0xA7, 0xA8, 0xA9, 0xAA, 0xAB, 0xAC, 0xAD, 0xAE, 0xAF,
- 0xB0, 0xB1, 0xB2, 0xB3, 0xB4, 0xB5, 0xB6, 0xB7, 0xB8, 0xB9, 0xBA, 0xBB, 0xBC, 0xBD, 0xBE, 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_2_LonelyStart_321 ()
- {
- byte[] data = {
- 0xC0, 0x20, 0xC1, 0x20, 0xC2, 0x20, 0xC3, 0x20, 0xC4, 0x20, 0xC5, 0x20, 0xC6, 0x20, 0xC7, 0x20,
- 0xC8, 0x20, 0xC9, 0x20, 0xCA, 0x20, 0xCB, 0x20, 0xCC, 0x20, 0xCD, 0x20, 0xCE, 0x20, 0xCF, 0x20,
- 0xD0, 0x20, 0xD1, 0x20, 0xD2, 0x20, 0xD3, 0x20, 0xD4, 0x20, 0xD5, 0x20, 0xD6, 0x20, 0xD7, 0x20,
- 0xD8, 0x20, 0xD9, 0x20, 0xDA, 0x20, 0xDB, 0x20, 0xDC, 0x20, 0xDD, 0x20, 0xDE, 0x20, 0xDF, 0x20 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_2_LonelyStart_322 ()
- {
- byte[] data = {
- 0xE0, 0x20, 0xE1, 0x20, 0xE2, 0x20, 0xE3, 0x20, 0xE4, 0x20, 0xE5, 0x20, 0xE6, 0x20, 0xE7, 0x20,
- 0xE8, 0x20, 0xE9, 0x20, 0xEA, 0x20, 0xEB, 0x20, 0xEC, 0x20, 0xED, 0x20, 0xEE, 0x20, 0xEF, 0x20 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_2_LonelyStart_323 ()
- {
- byte[] data = { 0xF0, 0x20, 0xF1, 0x20, 0xF2, 0x20, 0xF3, 0x20, 0xF4, 0x20, 0xF5, 0x20, 0xF6, 0x20, 0xF7, 0x20 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_2_LonelyStart_324 ()
- {
- byte[] data = { 0xF0, 0x20, 0xF1, 0x20, 0xF2, 0x20, 0xF3, 0x20, 0xF4, 0x20, 0xF5, 0x20, 0xF6, 0x20, 0xF7, 0x20 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_2_LonelyStart_325 ()
- {
- byte[] data = { 0xFC, 0x20, 0xFD, 0x20 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_3_LastContinuationMissing_331 ()
- {
- byte[] data = { 0xC0 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_3_LastContinuationMissing_332 ()
- {
- byte[] data = { 0xE0, 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_3_LastContinuationMissing_333 ()
- {
- byte[] data = { 0xF0, 0x80, 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_3_LastContinuationMissing_334 ()
- {
- byte[] data = { 0xF8, 0x80, 0x80, 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_3_LastContinuationMissing_335 ()
- {
- byte[] data = { 0xFC, 0x80, 0x80, 0x80, 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- // MS Fx 1.1 accept this
- // [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_3_LastContinuationMissing_336 ()
- {
- byte[] data = { 0xDF };
- try {
- string s = utf8.GetString (data);
- // exception is "really" expected here
- AssertEquals ("MS FX 1.1 behaviour", String.Empty, s);
- }
- catch (DecoderException) {
- // but Mono doesn't - better stick to the standard
- }
- }
- [Test]
- // MS Fx 1.1 accept this
- // [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_3_LastContinuationMissing_337 ()
- {
- byte[] data = { 0xEF, 0xBF };
- try {
- string s = utf8.GetString (data);
- // exception is "really" expected here
- AssertEquals ("MS FX 1.1 behaviour", String.Empty, s);
- }
- catch (DecoderException) {
- // but Mono doesn't - better stick to the standard
- }
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_3_LastContinuationMissing_338 ()
- {
- byte[] data = { 0xF7, 0xBF, 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_3_LastContinuationMissing_339 ()
- {
- byte[] data = { 0xF, 0xBF, 0xBF, 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_3_LastContinuationMissing_3310 ()
- {
- byte[] data = { 0xFD, 0xBF, 0xBF, 0xBF, 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_4_ConcatenationImcomplete ()
- {
- byte[] data = {
- 0xC0, 0xE0, 0x80, 0xF0, 0x80, 0x80, 0xF8, 0x80, 0x80, 0x80, 0xFC, 0x80, 0x80, 0x80, 0x80, 0xDF,
- 0xEF, 0xBF, 0xF7, 0xBF, 0xBF, 0xFB, 0xBF, 0xBF, 0xBF, 0xFD, 0xBF, 0xBF, 0xBF, 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_5_ImpossibleBytes_351 ()
- {
- byte[] data = { 0xFE };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_5_ImpossibleBytes_352 ()
- {
- byte[] data = { 0xFF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T3_Malformed_5_ImpossibleBytes_353 ()
- {
- byte[] data = { 0xFE, 0xFE, 0xFF, 0xFF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- // Overlong == dangereous -> "safe" decoder should reject them
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T4_Overlong_1_ASCII_Slash_411 ()
- {
- byte[] data = { 0xC0, 0xAF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T4_Overlong_1_ASCII_Slash_412 ()
- {
- byte[] data = { 0xE0, 0x80, 0xAF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T4_Overlong_1_ASCII_Slash_413 ()
- {
- byte[] data = { 0xF0, 0x80, 0x80, 0xAF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T4_Overlong_1_ASCII_Slash_414 ()
- {
- byte[] data = { 0xF8, 0x80, 0x80, 0x80, 0xAF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T4_Overlong_1_ASCII_Slash_415 ()
- {
- byte[] data = { 0xFC, 0x80, 0x80, 0x80, 0x80, 0xAF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T4_Overlong_2_MaximumBoundary_421 ()
- {
- byte[] data = { 0xC1, 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T4_Overlong_2_MaximumBoundary_422 ()
- {
- byte[] data = { 0xE0, 0x9F, 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T4_Overlong_2_MaximumBoundary_423 ()
- {
- byte[] data = { 0xF0, 0x8F, 0xBF, 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T4_Overlong_2_MaximumBoundary_424 ()
- {
- byte[] data = { 0xF8, 0x87, 0xBF, 0xBF, 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T4_Overlong_2_MaximumBoundary_425 ()
- {
- byte[] data = { 0xFC, 0x83, 0xBF, 0xBF, 0xBF, 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T4_Overlong_3_NUL_431 ()
- {
- byte[] data = { 0xC0, 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T4_Overlong_3_NUL_432 ()
- {
- byte[] data = { 0xE0, 0x80, 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T4_Overlong_3_NUL_433 ()
- {
- byte[] data = { 0xF0, 0x80, 0x80, 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T4_Overlong_3_NUL_434 ()
- {
- byte[] data = { 0xF8, 0x80, 0x80, 0x80, 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- [ExpectedException (typeof (DecoderException))]
- public void T4_Overlong_3_NUL_435 ()
- {
- byte[] data = { 0xFC, 0x80, 0x80, 0x80, 0x80, 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- }
- [Test]
- // MS Fx 1.1 accept this
- // [ExpectedException (typeof (DecoderException))]
- public void T5_IllegalCodePosition_1_UTF16Surrogates_511 ()
- {
- byte[] data = { 0xED, 0xA0, 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- AssertEquals ("MS FX 1.1 behaviour", 55296, s [0]);
- }
- [Test]
- // MS Fx 1.1 accept this
- // [ExpectedException (typeof (DecoderException))]
- public void T5_IllegalCodePosition_1_UTF16Surrogates_512 ()
- {
- byte[] data = { 0xED, 0xAD, 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- AssertEquals ("MS FX 1.1 behaviour", 56191, s [0]);
- }
- [Test]
- // MS Fx 1.1 accept this
- // [ExpectedException (typeof (DecoderException))]
- public void T5_IllegalCodePosition_1_UTF16Surrogates_513 ()
- {
- byte[] data = { 0xED, 0xAE, 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- AssertEquals ("MS FX 1.1 behaviour", 56192, s [0]);
- }
- [Test]
- // MS Fx 1.1 accept this
- // [ExpectedException (typeof (DecoderException))]
- public void T5_IllegalCodePosition_1_UTF16Surrogates_514 ()
- {
- byte[] data = { 0xED, 0xAF, 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- AssertEquals ("MS FX 1.1 behaviour", 56319, s [0]);
- }
- [Test]
- // MS Fx 1.1 accept this
- // [ExpectedException (typeof (DecoderException))]
- public void T5_IllegalCodePosition_1_UTF16Surrogates_515 ()
- {
- byte[] data = { 0xED, 0xB0, 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- AssertEquals ("MS FX 1.1 behaviour", 56320, s [0]);
- }
- [Test]
- // MS Fx 1.1 accept this
- // [ExpectedException (typeof (DecoderException))]
- public void T5_IllegalCodePosition_1_UTF16Surrogates_516 ()
- {
- byte[] data = { 0xED, 0xBE, 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- AssertEquals ("MS FX 1.1 behaviour", 57216, s [0]);
- }
- [Test]
- // MS Fx 1.1 accept this
- // [ExpectedException (typeof (DecoderException))]
- public void T5_IllegalCodePosition_1_UTF16Surrogates_517 ()
- {
- byte[] data = { 0xED, 0xBF, 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- AssertEquals ("MS FX 1.1 behaviour", 57343, s [0]);
- }
- [Test]
- // MS Fx 1.1 accept this
- // [ExpectedException (typeof (DecoderException))]
- public void T5_IllegalCodePosition_2_PairedUTF16Surrogates_521 ()
- {
- byte[] data = { 0xED, 0xA0, 0x80, 0xED, 0xB0, 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- AssertEquals ("MS FX 1.1 behaviour", 55296, s [0]);
- AssertEquals ("MS FX 1.1 behaviour", 56320, s [1]);
- }
- [Test]
- // MS Fx 1.1 accept this
- // [ExpectedException (typeof (DecoderException))]
- public void T5_IllegalCodePosition_2_PairedUTF16Surrogates_522 ()
- {
- byte[] data = { 0xED, 0xA0, 0x80, 0xED, 0xBF, 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- AssertEquals ("MS FX 1.1 behaviour", 55296, s [0]);
- AssertEquals ("MS FX 1.1 behaviour", 57343, s [1]);
- }
- [Test]
- // MS Fx 1.1 accept this
- // [ExpectedException (typeof (DecoderException))]
- public void T5_IllegalCodePosition_2_PairedUTF16Surrogates_523 ()
- {
- byte[] data = { 0xED, 0xAD, 0xBF, 0xED, 0xB0, 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- AssertEquals ("MS FX 1.1 behaviour", 56191, s [0]);
- AssertEquals ("MS FX 1.1 behaviour", 56320, s [1]);
- }
- [Test]
- // MS Fx 1.1 accept this
- // [ExpectedException (typeof (DecoderException))]
- public void T5_IllegalCodePosition_2_PairedUTF16Surrogates_524 ()
- {
- byte[] data = { 0xED, 0xAD, 0xBF, 0xED, 0xBF, 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- AssertEquals ("MS FX 1.1 behaviour", 56191, s [0]);
- AssertEquals ("MS FX 1.1 behaviour", 57343, s [1]);
- }
- [Test]
- // MS Fx 1.1 accept this
- // [ExpectedException (typeof (DecoderException))]
- public void T5_IllegalCodePosition_2_PairedUTF16Surrogates_525 ()
- {
- byte[] data = { 0xED, 0xAE, 0x80, 0xED, 0xB0, 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- AssertEquals ("MS FX 1.1 behaviour", 56192, s [0]);
- AssertEquals ("MS FX 1.1 behaviour", 56320, s [1]);
- }
- [Test]
- // MS Fx 1.1 accept this
- // [ExpectedException (typeof (DecoderException))]
- public void T5_IllegalCodePosition_2_PairedUTF16Surrogates_526 ()
- {
- byte[] data = { 0xED, 0xAE, 0x80, 0xED, 0xBF, 0x8F };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- AssertEquals ("MS FX 1.1 behaviour", 56192, s [0]);
- AssertEquals ("MS FX 1.1 behaviour", 57295, s [1]);
- }
- [Test]
- // MS Fx 1.1 accept this
- // [ExpectedException (typeof (DecoderException))]
- public void T5_IllegalCodePosition_2_PairedUTF16Surrogates_527 ()
- {
- byte[] data = { 0xED, 0xAF, 0xBF, 0xED, 0xB0, 0x80 };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- AssertEquals ("MS FX 1.1 behaviour", 56319, s [0]);
- AssertEquals ("MS FX 1.1 behaviour", 56320, s [1]);
- }
- [Test]
- // MS Fx 1.1 accept this
- // [ExpectedException (typeof (DecoderException))]
- public void T5_IllegalCodePosition_2_PairedUTF16Surrogates_528 ()
- {
- byte[] data = { 0xED, 0xAF, 0xBF, 0xED, 0xBF, 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- AssertEquals ("MS FX 1.1 behaviour", 56319, s [0]);
- AssertEquals ("MS FX 1.1 behaviour", 57343, s [1]);
- }
- [Test]
- // MS Fx 1.1 accept this
- // [ExpectedException (typeof (DecoderException))]
- public void T5_IllegalCodePosition_3_Other_531 ()
- {
- byte[] data = { 0xEF, 0xBF, 0xBE };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- AssertEquals ("MS FX 1.1 behaviour", 65534, s [0]);
- }
- [Test]
- // MS Fx 1.1 accept this
- // [ExpectedException (typeof (DecoderException))]
- public void T5_IllegalCodePosition_3_Other_532 ()
- {
- byte[] data = { 0xEF, 0xBF, 0xBF };
- string s = utf8.GetString (data);
- // exception is "really" expected here
- AssertEquals ("MS FX 1.1 behaviour", 65535, s [0]);
- }
- [Test]
- // bug #75065 and #73086.
- public void GetCharsFEFF ()
- {
- byte [] data = new byte [] {0xEF, 0xBB, 0xBF};
- Encoding enc = new UTF8Encoding (false, true);
- string s = enc.GetString (data);
- AssertEquals ("\uFEFF", s);
- Encoding utf = Encoding.UTF8;
- char[] testChars = {'\uFEFF','A'};
- byte[] bytes = utf.GetBytes(testChars);
- char[] chars = utf.GetChars(bytes);
- AssertEquals ("#1", '\uFEFF', chars [0]);
- AssertEquals ("#2", 'A', chars [1]);
- }
- }
- }
|