12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046 |
- using System;
- using System.Collections.Generic;
- using System.Globalization;
- using System.Runtime.CompilerServices;
- using System.Security;
- using System.Text;
- using System.Text.RegularExpressions;
namespace Godot
{
    /// <summary>
    /// Godot-style string helpers exposed as extension methods on <see cref="string"/>
    /// (plus one helper on <see cref="StringBuilder"/>).
    /// </summary>
    /// <remarks>
    /// Several helpers share a name and signature with an instance method of <see cref="string"/>
    /// (for example <c>Replace</c>, <c>Insert</c>, <c>EndsWith</c>, <c>ToLower</c>, <c>ToUpper</c>).
    /// C# overload resolution prefers the instance method, so those helpers are only reached when
    /// invoked statically, and the calls inside them bind to the framework method rather than recursing.
    /// </remarks>
    public static class StringExtensions
    {
        // Directory separators recognised by the path helpers.
        private static readonly char[] _pathSeparators = { '/', '\\' };

        // Characters removed by StripEdges: every code point from 0 to 32 (controls and space).
        private static readonly char[] _nonPrintable =
        {
            (char)00, (char)01, (char)02, (char)03, (char)04, (char)05,
            (char)06, (char)07, (char)08, (char)09, (char)10, (char)11,
            (char)12, (char)13, (char)14, (char)15, (char)16, (char)17,
            (char)18, (char)19, (char)20, (char)21, (char)22, (char)23,
            (char)24, (char)25, (char)26, (char)27, (char)28, (char)29,
            (char)30, (char)31, (char)32
        };

        /// <summary>
        /// Count the slices obtained by cutting the string at every occurrence of <paramref name="splitter"/>.
        /// </summary>
        /// <returns>0 when either string is null or empty; otherwise the number of occurrences plus one.</returns>
        private static int GetSliceCount(this string instance, string splitter)
        {
            if (instance.Empty() || splitter.Empty())
                return 0;

            int slices = 1;
            int pos = instance.Find(splitter, 0, caseSensitive: true);
            while (pos >= 0)
            {
                slices++;
                // Resume after the match so occurrences never overlap.
                pos = instance.Find(splitter, pos + splitter.Length, caseSensitive: true);
            }

            return slices;
        }

        /// <summary>
        /// Return the slice with index <paramref name="slice"/> when the string is cut at every
        /// <paramref name="splitter"/> character.
        /// </summary>
        /// <returns>The slice, or an empty string when the index is negative or past the last slice.</returns>
        private static string GetSliceCharacter(this string instance, char splitter, int slice)
        {
            if (instance.Empty() || slice < 0)
                return string.Empty;

            int start = 0;
            for (int count = 0; ; count++)
            {
                int end = instance.IndexOf(splitter, start);
                if (end < 0)
                    end = instance.Length; // the last slice runs to the end of the string

                if (count == slice)
                    return instance.Substring(start, end - start);
                if (end == instance.Length)
                    return string.Empty;

                start = end + 1;
            }
        }

        /// <summary>
        /// If the string is a path to a file, return the path to the file without the extension.
        /// </summary>
        /// <returns>
        /// The text before the last '.', or the unchanged string when there is no '.', when the '.'
        /// is the first character, or when the last '.' belongs to a directory name.
        /// </returns>
        public static string BaseName(this string instance)
        {
            int index = instance.LastIndexOf('.');
            if (index <= 0)
                return instance;

            // A dot that precedes the last separator ("dir.d/file") is part of a directory name.
            if (index < instance.LastIndexOfAny(_pathSeparators))
                return instance;

            return instance.Substring(0, index);
        }

        /// <summary>
        /// Return true if the string begins with the given string (ordinal comparison).
        /// </summary>
        public static bool BeginsWith(this string instance, string text)
        {
            return instance.StartsWith(text, StringComparison.Ordinal);
        }

        /// <summary>
        /// Return the bigrams (pairs of consecutive characters) of this string.
        /// </summary>
        /// <returns>An array of Length - 1 two-character strings; empty when the string has fewer than two characters.</returns>
        public static string[] Bigrams(this string instance)
        {
            if (instance.Length < 2)
                return new string[0];

            var bigrams = new string[instance.Length - 1];
            for (int i = 0; i < bigrams.Length; i++)
            {
                bigrams[i] = instance.Substring(i, 2);
            }

            return bigrams;
        }

        /// <summary>
        /// Count the non-overlapping occurrences of <paramref name="what"/> in the string.
        /// </summary>
        /// <param name="instance">The string to search.</param>
        /// <param name="what">The substring to look for; an empty value yields 0.</param>
        /// <param name="caseSensitive">Use ordinal comparison when true, ordinal ignoring case otherwise.</param>
        /// <param name="from">Inclusive start of the searched range.</param>
        /// <param name="to">Exclusive end of the searched range; 0 means "end of string". Values past the end are clamped.</param>
        /// <returns>The number of occurrences, or 0 when the range is empty or either bound is negative.</returns>
        public static int Count(this string instance, string what, bool caseSensitive = true, int from = 0, int to = 0)
        {
            if (what.Length == 0 || from < 0 || to < 0)
                return 0;

            int len = instance.Length;
            if (to == 0 || to > len)
                to = len;
            if (from >= to)
                return 0;

            StringComparison comparison = caseSensitive ? StringComparison.Ordinal : StringComparison.OrdinalIgnoreCase;
            int occurrences = 0;
            int pos = from;

            // Search in place inside [pos, to) instead of re-allocating substrings after each hit.
            while (pos + what.Length <= to)
            {
                int idx = instance.IndexOf(what, pos, to - pos, comparison);
                if (idx < 0)
                    break;

                occurrences++;
                pos = idx + what.Length;
            }

            return occurrences;
        }

        /// <summary>
        /// Return a copy of the string with special characters escaped using the C language standard.
        /// </summary>
        public static string CEscape(this string instance)
        {
            var sb = new StringBuilder(instance);

            // The backslash must be escaped first so the backslashes added below are not doubled.
            sb.Replace("\\", "\\\\");
            sb.Replace("\a", "\\a");
            sb.Replace("\b", "\\b");
            sb.Replace("\f", "\\f");
            sb.Replace("\n", "\\n");
            sb.Replace("\r", "\\r");
            sb.Replace("\t", "\\t");
            sb.Replace("\v", "\\v");
            sb.Replace("\'", "\\'");
            sb.Replace("\"", "\\\"");
            sb.Replace("?", "\\?");

            return sb.ToString();
        }

        /// <summary>
        /// Return a copy of the string with escaped characters replaced by their meanings according to the C language standard.
        /// </summary>
        /// <remarks>
        /// The string is decoded in a single left-to-right pass so that an escaped backslash followed
        /// by a letter (backslash, backslash, 'n') yields a backslash and 'n' rather than a newline.
        /// Unrecognised escape sequences are copied unchanged.
        /// </remarks>
        public static string CUnescape(this string instance)
        {
            var sb = new StringBuilder(instance.Length);

            for (int i = 0; i < instance.Length; i++)
            {
                char c = instance[i];
                if (c != '\\' || i + 1 >= instance.Length)
                {
                    sb.Append(c);
                    continue;
                }

                char decoded;
                switch (instance[i + 1])
                {
                    case 'a': decoded = '\a'; break;
                    case 'b': decoded = '\b'; break;
                    case 'f': decoded = '\f'; break;
                    case 'n': decoded = '\n'; break;
                    case 'r': decoded = '\r'; break;
                    case 't': decoded = '\t'; break;
                    case 'v': decoded = '\v'; break;
                    case '\'': decoded = '\''; break;
                    case '"': decoded = '"'; break;
                    case '?': decoded = '?'; break;
                    case '\\': decoded = '\\'; break;
                    default:
                        // Unknown escape: keep the backslash; the next character is copied by the next iteration.
                        sb.Append(c);
                        continue;
                }

                sb.Append(decoded);
                i++; // the escaped character has been consumed
            }

            return sb.ToString();
        }

        /// <summary>
        /// Replace underscores with spaces, convert all letters to lowercase, then capitalize the first
        /// letter of every word. For <c>capitalize camelCase mixed_with_underscores</c> it returns
        /// <c>Capitalize Camelcase Mixed With Underscores</c>.
        /// </summary>
        /// <remarks>Empty words (from repeated, leading or trailing separators) are dropped.</remarks>
        public static string Capitalize(this string instance)
        {
            string aux = instance.Replace("_", " ").ToLowerInvariant();
            int sliceCount = aux.GetSliceCount(" "); // computed once instead of on every iteration
            var cap = new StringBuilder(aux.Length);

            for (int i = 0; i < sliceCount; i++)
            {
                string slice = aux.GetSliceCharacter(' ', i);
                if (slice.Length == 0)
                    continue;

                // Separate words only once something has been emitted, so no leading space appears.
                if (cap.Length > 0)
                    cap.Append(' ');

                cap.Append(char.ToUpperInvariant(slice[0]));
                cap.Append(slice, 1, slice.Length - 1);
            }

            return cap.ToString();
        }

        /// <summary>
        /// Perform a case-sensitive comparison to another string, return -1 if less, 0 if equal and +1 if greater.
        /// </summary>
        public static int CasecmpTo(this string instance, string to)
        {
            return instance.CompareTo(to, caseSensitive: true);
        }

        /// <summary>
        /// Perform an ordinal comparison to another string, return -1 if less, 0 if equal and +1 if greater.
        /// </summary>
        /// <param name="instance">The left-hand string.</param>
        /// <param name="to">The right-hand string.</param>
        /// <param name="caseSensitive">When false, case differences are ignored.</param>
        /// <remarks>Null and empty strings compare equal to each other and less than any non-empty string.</remarks>
        public static int CompareTo(this string instance, string to, bool caseSensitive = true)
        {
            if (instance.Empty())
                return to.Empty() ? 0 : -1;
            if (to.Empty())
                return 1;

            StringComparison comparison = caseSensitive ? StringComparison.Ordinal : StringComparison.OrdinalIgnoreCase;

            // string.Compare may return any negative or positive value; normalise it to -1/0/+1.
            return Math.Sign(string.Compare(instance, to, comparison));
        }

        /// <summary>
        /// Return true if the string is null or empty.
        /// </summary>
        public static bool Empty(this string instance)
        {
            return string.IsNullOrEmpty(instance);
        }

        /// <summary>
        /// Return true if the string ends with the given string (ordinal comparison).
        /// </summary>
        public static bool EndsWith(this string instance, string text)
        {
            return instance.EndsWith(text, StringComparison.Ordinal);
        }

        /// <summary>
        /// Erase <paramref name="chars"/> characters from the builder starting from <paramref name="pos"/>.
        /// </summary>
        public static void Erase(this StringBuilder instance, int pos, int chars)
        {
            instance.Remove(pos, chars);
        }

        /// <summary>
        /// If the string is a path to a file, return the extension (without the leading dot).
        /// </summary>
        /// <returns>
        /// The text after the last '.', or an empty string when there is no '.' or the last '.'
        /// belongs to a directory name.
        /// </returns>
        public static string Extension(this string instance)
        {
            int pos = instance.LastIndexOf('.');
            if (pos < 0 || pos < instance.LastIndexOfAny(_pathSeparators))
                return string.Empty;

            return instance.Substring(pos + 1);
        }

        /// <summary>Find the first occurrence of a substring. Optionally, the search starting position can be passed.</summary>
        /// <returns>The starting position of the substring, or -1 if not found.</returns>
        public static int Find(this string instance, string what, int from = 0, bool caseSensitive = true)
        {
            return instance.IndexOf(what, from, caseSensitive ? StringComparison.Ordinal : StringComparison.OrdinalIgnoreCase);
        }

        /// <summary>Find the last occurrence of a substring.</summary>
        /// <returns>The starting position of the substring, or -1 if not found.</returns>
        public static int FindLast(this string instance, string what, bool caseSensitive = true)
        {
            return instance.FindLast(what, instance.Length - 1, caseSensitive);
        }

        /// <summary>Find the last occurrence of a substring specifying the search starting position.</summary>
        /// <returns>The starting position of the substring, or -1 if not found.</returns>
        public static int FindLast(this string instance, string what, int from, bool caseSensitive = true)
        {
            return instance.LastIndexOf(what, from, caseSensitive ? StringComparison.Ordinal : StringComparison.OrdinalIgnoreCase);
        }

        /// <summary>Find the first occurrence of a substring but search as case-insensitive. Optionally, the search starting position can be passed.</summary>
        /// <returns>The starting position of the substring, or -1 if not found.</returns>
        public static int FindN(this string instance, string what, int from = 0)
        {
            return instance.IndexOf(what, from, StringComparison.OrdinalIgnoreCase);
        }

        /// <summary>
        /// If the string is a path to a file, return the base directory.
        /// </summary>
        /// <remarks>
        /// A leading <c>scheme://</c> prefix, or a single leading '/', is kept as the root of the result;
        /// the directory part is everything up to the last '/' or '\' of the remainder.
        /// </remarks>
        public static string GetBaseDir(this string instance)
        {
            string root = string.Empty;
            string rest = instance;

            int schemePos = instance.Find("://");
            if (schemePos != -1)
            {
                int end = schemePos + 3;
                root = instance.Substring(0, end);
                rest = instance.Substring(end);
            }
            else if (instance.BeginsWith("/"))
            {
                root = "/";
                rest = instance.Substring(1);
            }

            int sep = Math.Max(rest.FindLast("/"), rest.FindLast("\\"));
            if (sep == -1)
                return root;

            return root + rest.Substr(0, sep);
        }

        /// <summary>
        /// If the string is a path to a file, return the file and ignore the base directory.
        /// </summary>
        public static string GetFile(this string instance)
        {
            int sep = Math.Max(instance.FindLast("/"), instance.FindLast("\\"));
            if (sep == -1)
                return instance;

            return instance.Substring(sep + 1);
        }

        /// <summary>
        /// Hash the string and return a 32 bits integer.
        /// </summary>
        /// <remarks>
        /// Starts from 5381 and folds each character in as <c>hash * 33 + c</c>. Hashing stops at the
        /// first NUL character, if any. Overflow wraps around.
        /// </remarks>
        public static int Hash(this string instance)
        {
            int hashv = 5381;

            unchecked
            {
                foreach (char c in instance)
                {
                    if (c == '\0')
                        break;

                    hashv = (hashv << 5) + hashv + c; // hash * 33 + c
                }
            }

            return hashv;
        }

        /// <summary>
        /// Convert a string containing an hexadecimal number into an int.
        /// </summary>
        /// <returns>
        /// The parsed value (negated when the string starts with '-'), or 0 when the string is empty
        /// or lacks the <c>0x</c> prefix.
        /// </returns>
        /// <exception cref="FormatException">The text after <c>0x</c> is not a hexadecimal number.</exception>
        public static int HexToInt(this string instance)
        {
            if (instance.Length == 0)
                return 0;

            int sign = 1;
            if (instance[0] == '-')
            {
                sign = -1;
                instance = instance.Substring(1);
            }

            if (!instance.StartsWith("0x", StringComparison.Ordinal))
                return 0;

            return sign * int.Parse(instance.Substring(2), NumberStyles.HexNumber, CultureInfo.InvariantCulture);
        }

        /// <summary>
        /// Insert a substring at a given position.
        /// </summary>
        public static string Insert(this string instance, int pos, string what)
        {
            return instance.Insert(pos, what);
        }

        /// <summary>
        /// If the string is a path to a file or directory, return true if the path is absolute,
        /// as decided by <see cref="System.IO.Path.IsPathRooted(string)"/>.
        /// </summary>
        public static bool IsAbsPath(this string instance)
        {
            return System.IO.Path.IsPathRooted(instance);
        }

        /// <summary>
        /// If the string is a path to a file or directory, return true if the path is relative,
        /// i.e. <see cref="System.IO.Path.IsPathRooted(string)"/> is false.
        /// </summary>
        public static bool IsRelPath(this string instance)
        {
            return !System.IO.Path.IsPathRooted(instance);
        }

        /// <summary>
        /// Check whether this string is a subsequence of the given string, i.e. whether its characters
        /// appear in <paramref name="text"/> in the same order, not necessarily contiguously.
        /// </summary>
        public static bool IsSubsequenceOf(this string instance, string text, bool caseSensitive = true)
        {
            int len = instance.Length;
            if (len == 0)
                return true; // Technically an empty string is subsequence of any string
            if (len > text.Length)
                return false;

            int matched = 0;
            foreach (char candidate in text)
            {
                char wanted = instance[matched];
                bool match = caseSensitive
                    ? wanted == candidate
                    : char.ToLowerInvariant(wanted) == char.ToLowerInvariant(candidate);

                if (match && ++matched == len)
                    return true;
            }

            return false;
        }

        /// <summary>
        /// Check whether this string is a subsequence of the given string, ignoring case differences.
        /// </summary>
        public static bool IsSubsequenceOfI(this string instance, string text)
        {
            return instance.IsSubsequenceOf(text, caseSensitive: false);
        }

        /// <summary>
        /// Check whether the string contains a valid float (invariant culture, '.' as decimal separator).
        /// </summary>
        public static bool IsValidFloat(this string instance)
        {
            float parsed;
            return float.TryParse(instance, NumberStyles.Float | NumberStyles.AllowThousands, CultureInfo.InvariantCulture, out parsed);
        }

        /// <summary>
        /// Check whether the string contains a valid color in HTML notation.
        /// </summary>
        public static bool IsValidHtmlColor(this string instance)
        {
            return Color.HtmlIsValid(instance);
        }

        /// <summary>
        /// Check whether the string is a valid identifier: only ASCII letters, digits and underscores,
        /// and the first character may not be a digit.
        /// </summary>
        public static bool IsValidIdentifier(this string instance)
        {
            if (instance.Length == 0)
                return false;
            if (instance[0] >= '0' && instance[0] <= '9')
                return false; // must not start with a digit

            foreach (char c in instance)
            {
                bool validChar = (c >= '0' && c <= '9') ||
                                 (c >= 'a' && c <= 'z') ||
                                 (c >= 'A' && c <= 'Z') ||
                                 c == '_';
                if (!validChar)
                    return false;
            }

            return true;
        }

        /// <summary>
        /// Check whether the string contains a valid integer (invariant culture).
        /// </summary>
        public static bool IsValidInteger(this string instance)
        {
            int parsed;
            return int.TryParse(instance, NumberStyles.Integer, CultureInfo.InvariantCulture, out parsed);
        }

        /// <summary>
        /// Check whether the string contains a valid dotted-decimal IPv4 address.
        /// </summary>
        /// <remarks>
        /// Exactly four parts are required, each made only of digits and not greater than 255.
        /// IPv6 addresses are not supported.
        /// </remarks>
        public static bool IsValidIPAddress(this string instance)
        {
            // TODO: Support IPv6 addresses
            // Splitting on the character keeps empty parts, so "1..2.3.4" is rejected below.
            string[] octets = instance.Split('.');
            if (octets.Length != 4)
                return false;

            foreach (string octet in octets)
            {
                int value;
                // NumberStyles.None accepts digits only: no sign, no surrounding white space.
                if (!int.TryParse(octet, NumberStyles.None, CultureInfo.InvariantCulture, out value))
                    return false;
                if (value > 255)
                    return false;
            }

            return true;
        }

        /// <summary>
        /// Return a copy of the string with special characters escaped using the JSON standard.
        /// </summary>
        public static string JSONEscape(this string instance)
        {
            var sb = new StringBuilder(instance);

            // The backslash must be escaped first so the backslashes added below are not doubled.
            sb.Replace("\\", "\\\\");
            sb.Replace("\b", "\\b");
            sb.Replace("\f", "\\f");
            sb.Replace("\n", "\\n");
            sb.Replace("\r", "\\r");
            sb.Replace("\t", "\\t");
            sb.Replace("\v", "\\v");
            sb.Replace("\"", "\\\"");

            return sb.ToString();
        }

        /// <summary>
        /// Return an amount of characters from the left of the string.
        /// </summary>
        /// <returns>
        /// The first <paramref name="pos"/> characters; an empty string when <paramref name="pos"/> is
        /// zero or negative; the whole string when it is at least the string length.
        /// </returns>
        public static string Left(this string instance, int pos)
        {
            if (pos <= 0)
                return string.Empty;
            if (pos >= instance.Length)
                return instance;

            return instance.Substring(0, pos);
        }

        /// <summary>
        /// Return the length of the string in characters.
        /// </summary>
        public static int Length(this string instance)
        {
            return instance.Length;
        }

        /// <summary>
        /// Do a simple expression match, where '*' matches zero or more arbitrary characters and '?'
        /// matches any single character except '.'.
        /// </summary>
        /// <param name="instance">The text to test.</param>
        /// <param name="expr">The wildcard expression.</param>
        /// <param name="caseSensitive">When false, literal characters are compared ignoring case.</param>
        /// <returns>True when the whole text matches the expression; false when either string is empty.</returns>
        public static bool ExprMatch(this string instance, string expr, bool caseSensitive)
        {
            if (expr.Length == 0 || instance.Length == 0)
                return false;

            int text = 0;
            int pattern = 0;
            int starPattern = -1; // index in expr of the most recent '*', or -1 when none was seen
            int starText = 0;     // text index up to which that '*' is currently assumed to extend

            while (text < instance.Length)
            {
                if (pattern < expr.Length && expr[pattern] == '*')
                {
                    // Start by letting '*' match nothing; remember where to retry from.
                    starPattern = pattern++;
                    starText = text;
                }
                else if (pattern < expr.Length && WildcardCharMatches(expr[pattern], instance[text], caseSensitive))
                {
                    pattern++;
                    text++;
                }
                else if (starPattern >= 0)
                {
                    // Mismatch after a '*': let the '*' swallow one more character and retry.
                    pattern = starPattern + 1;
                    text = ++starText;
                }
                else
                {
                    return false;
                }
            }

            // Trailing '*' characters can match the empty remainder.
            while (pattern < expr.Length && expr[pattern] == '*')
                pattern++;

            return pattern == expr.Length;
        }

        // Tell whether one non-'*' expression character accepts one text character.
        private static bool WildcardCharMatches(char patternChar, char textChar, bool caseSensitive)
        {
            if (patternChar == '?')
                return textChar != '.';
            if (caseSensitive)
                return patternChar == textChar;

            return char.ToUpperInvariant(patternChar) == char.ToUpperInvariant(textChar);
        }

        /// <summary>
        /// Do a simple expression match using ? and * wildcards (see <c>ExprMatch</c>); case-sensitive by default.
        /// </summary>
        public static bool Match(this string instance, string expr, bool caseSensitive = true)
        {
            return instance.ExprMatch(expr, caseSensitive);
        }

        /// <summary>
        /// Do a simple case insensitive expression match, using ? and * wildcards (see <c>ExprMatch</c>).
        /// </summary>
        public static bool MatchN(this string instance, string expr)
        {
            return instance.ExprMatch(expr, caseSensitive: false);
        }

        /// <summary>
        /// Return the MD5 hash of the string as an array of bytes.
        /// </summary>
        public static byte[] MD5Buffer(this string instance)
        {
            return godot_icall_String_md5_buffer(instance);
        }

        // Implemented by the runtime as an internal call.
        [MethodImpl(MethodImplOptions.InternalCall)]
        internal static extern byte[] godot_icall_String_md5_buffer(string str);

        /// <summary>
        /// Return the MD5 hash of the string as a string.
        /// </summary>
        public static string MD5Text(this string instance)
        {
            return godot_icall_String_md5_text(instance);
        }

        // Implemented by the runtime as an internal call.
        [MethodImpl(MethodImplOptions.InternalCall)]
        internal static extern string godot_icall_String_md5_text(string str);

        /// <summary>
        /// Perform a case-insensitive comparison to another string, return -1 if less, 0 if equal and +1 if greater.
        /// </summary>
        public static int NocasecmpTo(this string instance, string to)
        {
            return instance.CompareTo(to, caseSensitive: false);
        }

        /// <summary>
        /// Return the character code at position <paramref name="at"/>.
        /// </summary>
        public static int OrdAt(this string instance, int at)
        {
            return instance[at];
        }

        /// <summary>
        /// Format a number to have an exact number of <paramref name="digits"/> after the decimal point.
        /// </summary>
        /// <remarks>
        /// Extra digits are cut off (not rounded) and missing ones are filled with '0'. With
        /// <paramref name="digits"/> zero or negative the decimal point and everything after it are removed.
        /// </remarks>
        public static string PadDecimals(this string instance, int digits)
        {
            int point = instance.IndexOf('.');
            if (point == -1)
            {
                if (digits <= 0)
                    return instance;

                instance += ".";
                point = instance.Length - 1;
            }
            else if (digits <= 0)
            {
                return instance.Substring(0, point);
            }

            int wantedLength = point + 1 + digits;
            if (instance.Length > wantedLength)
                return instance.Substring(0, wantedLength);

            return instance.PadRight(wantedLength, '0');
        }

        /// <summary>
        /// Format a number to have at least <paramref name="digits"/> digits before the decimal point.
        /// </summary>
        /// <remarks>
        /// Zeros are inserted in front of the first digit, so a leading sign stays in place. Strings
        /// with no digit before the decimal point are returned unchanged.
        /// </remarks>
        public static string PadZeros(this string instance, int digits)
        {
            int end = instance.IndexOf('.');
            if (end == -1)
                end = instance.Length;
            if (end == 0)
                return instance;

            // Skip a sign or any other non-digit prefix.
            int begin = 0;
            while (begin < end && (instance[begin] < '0' || instance[begin] > '9'))
            {
                begin++;
            }

            if (begin >= end)
                return instance;

            int missing = digits - (end - begin);
            if (missing <= 0)
                return instance;

            return instance.Insert(begin, new string('0', missing));
        }

        /// <summary>
        /// Decode a percent-encoded string. See <c>PercentEncode</c>.
        /// </summary>
        public static string PercentDecode(this string instance)
        {
            return Uri.UnescapeDataString(instance);
        }

        /// <summary>
        /// Percent-encode a string. This is meant to encode parameters in a URL when sending a HTTP GET
        /// request and bodies of form-urlencoded POST request.
        /// </summary>
        public static string PercentEncode(this string instance)
        {
            return Uri.EscapeDataString(instance);
        }

        /// <summary>
        /// If the string is a path, this concatenates <paramref name="file"/> at the end of the string
        /// as a subpath. E.g. <c>"this/is".PlusFile("path") == "this/is/path"</c>.
        /// </summary>
        public static string PlusFile(this string instance, string file)
        {
            // Avoid doubling the separator when the directory already ends with one.
            if (instance.Length > 0 && instance[instance.Length - 1] == '/')
                return instance + file;

            return instance + "/" + file;
        }

        /// <summary>
        /// Replace occurrences of a substring for different ones inside the string.
        /// </summary>
        public static string Replace(this string instance, string what, string forwhat)
        {
            return instance.Replace(what, forwhat);
        }

        /// <summary>
        /// Replace occurrences of a substring for different ones inside the string, but search case-insensitive.
        /// </summary>
        /// <remarks>
        /// Both <paramref name="what"/> and <paramref name="forwhat"/> are taken literally: regular
        /// expression metacharacters and '$' substitutions are not interpreted. An empty
        /// <paramref name="what"/> leaves the string unchanged.
        /// </remarks>
        public static string ReplaceN(this string instance, string what, string forwhat)
        {
            if (what != null && what.Length == 0)
                return instance;

            // Escape the search text and use an evaluator so neither argument is parsed as a pattern.
            return Regex.Replace(
                instance,
                Regex.Escape(what),
                match => forwhat,
                RegexOptions.IgnoreCase | RegexOptions.CultureInvariant);
        }

        /// <summary>
        /// Perform a search for a substring, but start from the end of the string instead of the beginning.
        /// The search is forwarded to the runtime's internal implementation.
        /// </summary>
        public static int RFind(this string instance, string what, int from = -1)
        {
            return godot_icall_String_rfind(instance, what, from);
        }

        // Implemented by the runtime as an internal call.
        [MethodImpl(MethodImplOptions.InternalCall)]
        internal static extern int godot_icall_String_rfind(string str, string what, int from);

        /// <summary>
        /// Perform a search for a substring, but start from the end of the string instead of the beginning.
        /// Also search case-insensitive. The search is forwarded to the runtime's internal implementation.
        /// </summary>
        public static int RFindN(this string instance, string what, int from = -1)
        {
            return godot_icall_String_rfindn(instance, what, from);
        }

        // Implemented by the runtime as an internal call.
        [MethodImpl(MethodImplOptions.InternalCall)]
        internal static extern int godot_icall_String_rfindn(string str, string what, int from);

        /// <summary>
        /// Return the right side of the string from a given position.
        /// </summary>
        /// <returns>
        /// The characters from <paramref name="pos"/> to the end; an empty string when
        /// <paramref name="pos"/> is at or past the end; the whole string when it is zero or negative.
        /// </returns>
        public static string Right(this string instance, int pos)
        {
            if (pos >= instance.Length)
                return string.Empty;
            if (pos <= 0)
                return instance;

            return instance.Substring(pos);
        }

        /// <summary>
        /// Return the SHA-256 hash of the string as an array of bytes.
        /// </summary>
        public static byte[] SHA256Buffer(this string instance)
        {
            return godot_icall_String_sha256_buffer(instance);
        }

        // Implemented by the runtime as an internal call.
        [MethodImpl(MethodImplOptions.InternalCall)]
        internal static extern byte[] godot_icall_String_sha256_buffer(string str);

        /// <summary>
        /// Return the SHA-256 hash of the string as a string.
        /// </summary>
        public static string SHA256Text(this string instance)
        {
            return godot_icall_String_sha256_text(instance);
        }

        // Implemented by the runtime as an internal call.
        [MethodImpl(MethodImplOptions.InternalCall)]
        internal static extern string godot_icall_String_sha256_text(string str);

        /// <summary>
        /// Return the similarity index of the text compared to this string. 1 means totally similar
        /// and 0 means totally dissimilar.
        /// </summary>
        /// <remarks>
        /// The index is twice the number of this string's bigrams that also occur in
        /// <paramref name="text"/>, divided by the total number of bigrams of both strings.
        /// </remarks>
        public static float Similarity(this string instance, string text)
        {
            if (instance == text)
            {
                // Equal strings are totally similar
                return 1.0f;
            }

            if (instance.Length < 2 || text.Length < 2)
            {
                // No way to calculate similarity without a single bigram
                return 0.0f;
            }

            string[] sourceBigrams = instance.Bigrams();
            string[] targetBigrams = text.Bigrams();

            float sum = sourceBigrams.Length + targetBigrams.Length;
            float inter = 0;

            foreach (string sourceBigram in sourceBigrams)
            {
                foreach (string targetBigram in targetBigrams)
                {
                    if (sourceBigram == targetBigram)
                    {
                        inter++;
                        break; // each source bigram is counted at most once
                    }
                }
            }

            return 2.0f * inter / sum;
        }

        /// <summary>
        /// Split the string by a divisor string, return an array of the substrings.
        /// Example "One,Two,Three" will return ["One","Two","Three"] if split by ",".
        /// </summary>
        /// <param name="instance">The string to split.</param>
        /// <param name="divisor">The separator text.</param>
        /// <param name="allowEmpty">When false, empty substrings are left out of the result.</param>
        public static string[] Split(this string instance, string divisor, bool allowEmpty = true)
        {
            StringSplitOptions options = allowEmpty ? StringSplitOptions.None : StringSplitOptions.RemoveEmptyEntries;
            return instance.Split(new[] { divisor }, options);
        }

        /// <summary>
        /// Split the string in floats by using a divisor string, return an array of the values.
        /// Example "1,2.5,3" will return [1,2.5,3] if split by ",".
        /// </summary>
        /// <param name="instance">The string to split.</param>
        /// <param name="divisor">The separator text; when empty the whole string is a single slice.</param>
        /// <param name="allowEmpty">When true, an empty slice contributes 0; when false it is skipped.</param>
        /// <exception cref="FormatException">A non-empty slice is not a number in invariant-culture format.</exception>
        public static float[] SplitFloats(this string instance, string divisor, bool allowEmpty = true)
        {
            var ret = new List<float>();
            int from = 0;
            int len = instance.Length;

            while (true)
            {
                // An empty divisor would match at every position and never advance.
                int end = divisor.Length == 0 ? -1 : instance.Find(divisor, from, caseSensitive: true);
                if (end < 0)
                    end = len;

                if (end > from)
                    ret.Add(float.Parse(instance.Substring(from, end - from), CultureInfo.InvariantCulture));
                else if (allowEmpty)
                    ret.Add(0f);

                if (end == len)
                    break;

                from = end + divisor.Length;
            }

            return ret.ToArray();
        }

        /// <summary>
        /// Return a copy of the string stripped of any non-printable character (code 0 to 32) at the
        /// beginning and the end. The optional arguments toggle stripping on the left and right edges.
        /// </summary>
        public static string StripEdges(this string instance, bool left = true, bool right = true)
        {
            if (left && right)
                return instance.Trim(_nonPrintable);
            if (left)
                return instance.TrimStart(_nonPrintable);
            if (right)
                return instance.TrimEnd(_nonPrintable);

            return instance; // nothing requested
        }

        /// <summary>
        /// Return part of the string from the position <paramref name="from"/>, with length
        /// <paramref name="len"/>. The length is clamped to the characters available after
        /// <paramref name="from"/>.
        /// </summary>
        public static string Substr(this string instance, int from, int len)
        {
            int max = instance.Length - from;
            return instance.Substring(from, len > max ? max : len);
        }

        /// <summary>
        /// Convert the string to an array of bytes using the ASCII encoding.
        /// </summary>
        public static byte[] ToAscii(this string instance)
        {
            return Encoding.ASCII.GetBytes(instance);
        }

        /// <summary>
        /// Convert a string, containing a decimal number, into a <c>float</c> (invariant culture).
        /// </summary>
        public static float ToFloat(this string instance)
        {
            return float.Parse(instance, CultureInfo.InvariantCulture);
        }

        /// <summary>
        /// Convert a string, containing an integer number, into an <c>int</c> (invariant culture).
        /// </summary>
        public static int ToInt(this string instance)
        {
            return int.Parse(instance, CultureInfo.InvariantCulture);
        }

        /// <summary>
        /// Return the string converted to lowercase.
        /// </summary>
        public static string ToLower(this string instance)
        {
            return instance.ToLower();
        }

        /// <summary>
        /// Return the string converted to uppercase.
        /// </summary>
        public static string ToUpper(this string instance)
        {
            return instance.ToUpper();
        }

        /// <summary>
        /// Convert the string to an array of bytes using the UTF-8 encoding.
        /// </summary>
        public static byte[] ToUTF8(this string instance)
        {
            return Encoding.UTF8.GetBytes(instance);
        }

        /// <summary>
        /// Return a copy of the string with special characters escaped using the XML standard.
        /// </summary>
        public static string XMLEscape(this string instance)
        {
            return SecurityElement.Escape(instance);
        }

        /// <summary>
        /// Return a copy of the string with the XML entities <c>&amp;lt;</c>, <c>&amp;gt;</c>,
        /// <c>&amp;quot;</c>, <c>&amp;apos;</c> and <c>&amp;amp;</c> replaced by the characters they stand for.
        /// </summary>
        public static string XMLUnescape(this string instance)
        {
            var sb = new StringBuilder(instance);

            sb.Replace("&lt;", "<");
            sb.Replace("&gt;", ">");
            sb.Replace("&quot;", "\"");
            sb.Replace("&apos;", "'");
            // The ampersand goes last so that "&amp;lt;" decodes to "&lt;" and not to "<".
            sb.Replace("&amp;", "&");

            return sb.ToString();
        }
    }
}
|