using System.Collections.Generic;
namespace StringBuilderToUTF8
public static class StringExtensions
private static readonly Encoding Utf8Encoder = UTF8Encoding.GetEncoding("UTF-8", new EncoderReplacementFallback(string.Empty), new DecoderExceptionFallback());
private static readonly Encoding Utf16Encoder = UTF8Encoding.GetEncoding("UTF-16", new EncoderReplacementFallback(string.Empty), new DecoderExceptionFallback());
private static readonly Encoding ISO88591Encoder = UTF8Encoding.GetEncoding("ISO-8859-1", new EncoderReplacementFallback(string.Empty), new DecoderExceptionFallback());
public static string toUTF8String(this StringBuilder sb)
byte[] bytesUTF16 = Utf16Encoder.GetBytes(sb.ToString());
char[] charsUTF16 = Utf16Encoder.GetChars(bytesUTF16);
byte[] bytesUTF8 = Utf8Encoder.GetBytes(sb.ToString());
char[] charsUTF8 = Utf8Encoder.GetChars(bytesUTF8);
byte[] bytesISO88591 = ISO88591Encoder.GetBytes(sb.ToString());
char[] charsISO88591 = ISO88591Encoder.GetChars(bytesUTF16);
byte[] bytes = Encoding.Default.GetBytes(sb.ToString());
char[] chars = Encoding.Default.GetChars(bytes);
return Utf8Encoder.GetString(bytesUTF8, 0, bytesUTF8.Length);
public static string toISO88591String(this StringBuilder sb)
byte[] bytesISO88591 = ISO88591Encoder.GetBytes(sb.ToString());
return ISO88591Encoder.GetString(bytesISO88591, 0, bytesISO88591.Length);
public static string toUTF8StringFastCopy(this StringBuilder sb)
char[] bytes = new char[sb.Length];
sb.CopyTo(0, bytes, 0, sb.Length);
return Utf8Encoder.GetString(Utf8Encoder.GetBytes(bytes));
public static string UnicodeToANSI(this string s)
var newStringBuilder = new StringBuilder();
newStringBuilder.Append(s.Normalize(NormalizationForm.FormKD)
.Where(x => (x > 30 && x <= 255))
return newStringBuilder.ToString();
public static void Main(string[] args)
string utf16 = "Menü \uD852\uDF62 a\u0304\u0308 你好";
StringBuilder sb = new StringBuilder(utf16);
Console.WriteLine("Clean UTF8 only = " + utf16);
Console.WriteLine("Clean ISO-8859-1 only = " + sb.toISO88591String());
Console.WriteLine("Clean UTF8 only = " + sb.toUTF8String());
Console.WriteLine("Clean UTF8 fast copy = " + sb.toUTF8StringFastCopy());