{"id":8235,"date":"2024-01-31T11:29:46","date_gmt":"2024-01-31T10:29:46","guid":{"rendered":"https:\/\/solidt.eu\/site\/?p=8235"},"modified":"2024-01-31T11:43:47","modified_gmt":"2024-01-31T10:43:47","slug":"c-detect-latin1-encoding","status":"publish","type":"post","link":"https:\/\/solidt.eu\/site\/c-detect-latin1-encoding\/","title":{"rendered":"C# Detect Latin1 encoding"},"content":{"rendered":"\n<div style=\"height: 250px; position:relative; margin-bottom: 50px;\" class=\"wp-block-simple-code-block-ace\"><pre class=\"wp-block-simple-code-block-ace\" style=\"position:absolute;top:0;right:0;bottom:0;left:0\" data-mode=\"csharp\" data-theme=\"monokai\" data-fontsize=\"14\" data-lines=\"Infinity\" data-showlines=\"true\" data-copy=\"false\">public class EncodingHelper\r\n{\r\n    private static Encoding Latin1 = Encoding.GetEncoding(\"ISO-8859-1\");\r\n\r\n    static List&lt;string> wrongCharacters = GetWrongCharacters();\r\n\r\n    \/\/public static void Test()\r\n    \/\/{\r\n    \/\/    Console.OutputEncoding = Encoding.UTF8;\r\n    \/\/    Console.WriteLine(ToUTF8(\"Acci\u00c3\u00b3n\"));\r\n    \/\/    Console.WriteLine(ToUTF8(\"Acci\u00f3n\"));\r\n    \/\/}\r\n\r\n    private static List&lt;string> GetWrongCharacters()\r\n    {\r\n        var replacements = new List&lt;string>();\r\n        for (int i = 128; i &lt; 256; i++)\r\n        {\r\n            var b = GetConvertedByte((byte)i);\r\n            replacements.Add(b);\r\n        }\r\n        return replacements;\r\n    }\r\n\r\n    public static string GetConvertedByte(byte b)\r\n    {\r\n        return Latin1.GetString(Encoding.UTF8.GetBytes(Latin1.GetString(new byte[] { b })));\r\n    }\r\n\r\n    public static bool IsLikelyConvertedLatin1(string text)\r\n    {\r\n        foreach (var r in wrongCharacters)\r\n        {\r\n            if (text.Contains(r))\r\n                return true;\r\n        }\r\n        return false;\r\n    }\r\n\r\n    public static string ToUTF8(string text)\r\n    {\r\n        if (IsLikelyConvertedLatin1(text))\r\n            return Latin1ToUtf8(text);\r\n        return text;\r\n    }\r\n\r\n    public static string Latin1ToUtf8(string s) => Encoding.UTF8.GetString(Latin1.GetBytes(s));\r\n}<\/pre><\/div>\n","protected":false},"excerpt":{"rendered":"","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"closed","sticky":false,"template":"","format":"standard","meta":{"inline_featured_image":false,"footnotes":""},"categories":[1],"tags":[],"class_list":["post-8235","post","type-post","status-publish","format-standard","hentry","category-uncategorized"],"_links":{"self":[{"href":"https:\/\/solidt.eu\/site\/wp-json\/wp\/v2\/posts\/8235","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/solidt.eu\/site\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/solidt.eu\/site\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/solidt.eu\/site\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/solidt.eu\/site\/wp-json\/wp\/v2\/comments?post=8235"}],"version-history":[{"count":1,"href":"https:\/\/solidt.eu\/site\/wp-json\/wp\/v2\/posts\/8235\/revisions"}],"predecessor-version":[{"id":8236,"href":"https:\/\/solidt.eu\/site\/wp-json\/wp\/v2\/posts\/8235\/revisions\/8236"}],"wp:attachment":[{"href":"https:\/\/solidt.eu\/site\/wp-json\/wp\/v2\/media?parent=8235"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/solidt.eu\/site\/wp-json\/wp\/v2\/categories?post=8235"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/solidt.eu\/site\/wp-json\/wp\/v2\/tags?post=8235"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}