Monday, October 31, 2016

HTML Special Characters in your web application

HTMLEncode and HTMLDecode are common methods which can be in HttpUtility or WebUtility to encode and decode html tags or templates in your web application. Usually, HTML templates are updated by the Admin which uses the same system with admin rights. 
But what if the application you develop is accessing different databases that are updated from various admin portals or platforms. Hence the templates may contain many tags or characters and the above HTMLDecode will not work for them. 
Following method represents the conversion of those special characters to the HTML Encoded values so that it can be understood by the browser to show the correct symbol.
To do so, you will need to first get the ASCII of each of the character and if the values falls in to a special character, replace it with a properly formatted string. Simply it looks like below;

 public static string GetSpecialCharactersEncoded(string text)  
     {  
       if (text == null)  
         return text;  
       string returnString = text;  
       Dictionary<int, string> dicList = new Dictionary<int, string>();  
       StringBuilder sb = new StringBuilder();  
       foreach (var c in text.ToCharArray())  
       {  
         sb.Append(GetEncodedValue(c.ToString()));  
       }  
       return sb.ToString();  
     }  

     private static string GetEncodedValue(string text)  
     {  
       string encTxt = text;  
       int iAscii = (int)Convert.ToChar(text);  
       if (iAscii == 8230)  
         encTxt = "&hellip;";  
       else if (iAscii == 8211)  
         encTxt = "&ndash;";  
       else if (iAscii == 8212)  
         encTxt = "&mdash;";  
       else if (iAscii == 8216)  
         encTxt = "&lsquo; ";  
       else if (iAscii == 8217)  
         encTxt = "&rsquo;";  
       else if (iAscii == 8218)  
         encTxt = "&lsquor;";  
       else if (iAscii == 8220)  
         encTxt = "&ldquo; ";  
       else if (iAscii == 8221)  
         encTxt = "&rdquo;";  
       else if (iAscii == 8222)  
         encTxt = "&ldquor;";  
       else if (iAscii == 8224)  
         encTxt = "&dagger;";  
       else if (iAscii == 8225)  
         encTxt = "&Dagger;";  
       else if (iAscii == 8226)  
         encTxt = "&bull;";  
       else if (iAscii == 8240)  
         encTxt = "&permil;";  
       else if (iAscii == 8364)  
         encTxt = "&euro;";  
       else if (iAscii == 8482)  
         encTxt = "&trade;";  
       else if (iAscii == 402)  
         encTxt = "&fnof;";  
       else if (iAscii == 376)  
         encTxt = "&yuml;";  
       else if (iAscii == 353)  
         encTxt = "&scaron;";  
       else if (iAscii == 352)  
         encTxt = "&Scaron;";  
       else if (iAscii == 339)  
         encTxt = "&oelig;";  
       else if (iAscii == 338)  
         encTxt = "&OElig;";  
       else if (iAscii == 255)  
         encTxt = "&yuml;";  
       else if (iAscii == 254)  
         encTxt = "&thorn;";  
       else if (iAscii == 253)  
         encTxt = "&yacute;";  
       else if (iAscii == 252)  
         encTxt = "&uuml;";  
       else if (iAscii == 251)  
         encTxt = "&ucirc;";  
       else if (iAscii == 250)  
         encTxt = "&uacute;";  
       else if (iAscii == 249)  
         encTxt = "&ugrave;";  
       else if (iAscii == 248)  
         encTxt = "&oslash;";  
       else if (iAscii == 247)  
         encTxt = "&divide;";  
       else if (iAscii == 246)  
         encTxt = "&ouml;";  
       else if (iAscii == 245)  
         encTxt = "&otilde;";  
       else if (iAscii == 244)  
         encTxt = "&ocirc;";  
       else if (iAscii == 243)  
         encTxt = "&oacute;";  
       else if (iAscii == 242)  
         encTxt = "&ograve;";  
       else if (iAscii == 241)  
         encTxt = "&ntilde;";  
       else if (iAscii == 240)  
         encTxt = "&eth;";  
       else if (iAscii == 239)  
         encTxt = "&iuml;";  
       else if (iAscii == 238)  
         encTxt = "&icirc;";  
       else if (iAscii == 237)  
         encTxt = "&iacute;";  
       else if (iAscii == 236)  
         encTxt = "&igrave;";  
       else if (iAscii == 235)  
         encTxt = "&euml;";  
       else if (iAscii == 234)  
         encTxt = "&ecirc;";  
       else if (iAscii == 233)  
         encTxt = "&eacute;";  
       else if (iAscii == 232)  
         encTxt = "&egrave;";  
       else if (iAscii == 231)  
         encTxt = "&ccedil;";  
       else if (iAscii == 230)  
         encTxt = "&aelig;";  
       else if (iAscii == 229)  
         encTxt = "&aring;";  
       else if (iAscii == 228)  
         encTxt = "&auml;";  
       else if (iAscii == 227)  
         encTxt = "&atilde;";  
       else if (iAscii == 226)  
         encTxt = "&acirc;";  
       else if (iAscii == 225)  
         encTxt = "&aacute;";  
       else if (iAscii == 224)  
         encTxt = "&agrave;";  
       else if (iAscii == 223)  
         encTxt = "&szlig;";  
       else if (iAscii == 222)  
         encTxt = "&THORN;";  
       else if (iAscii == 221)  
         encTxt = "&Yacute;";  
       else if (iAscii == 220)  
         encTxt = "&Uuml;";  
       else if (iAscii == 219)  
         encTxt = "&Ucirc;";  
       else if (iAscii == 218)  
         encTxt = "&Uacute;";  
       else if (iAscii == 217)  
         encTxt = "&Ugrave;";  
       else if (iAscii == 216)  
         encTxt = "&Oslash;";  
       else if (iAscii == 215)  
         encTxt = "&times;";  
       else if (iAscii == 214)  
         encTxt = "&Ouml;";  
       else if (iAscii == 213)  
         encTxt = "&Otilde;";  
       else if (iAscii == 212)  
         encTxt = "&Ocirc;";  
       else if (iAscii == 211)  
         encTxt = "&Oacute;";  
       else if (iAscii == 210)  
         encTxt = "&Ograve;";  
       else if (iAscii == 209)  
         encTxt = "&Ntilde;";  
       else if (iAscii == 208)  
         encTxt = "&ETH;";  
       else if (iAscii == 207)  
         encTxt = "&Iuml;";  
       else if (iAscii == 206)  
         encTxt = "&Icirc;";  
       else if (iAscii == 205)  
         encTxt = "&Iacute;";  
       else if (iAscii == 204)  
         encTxt = "&Igrave;";  
       else if (iAscii == 203)  
         encTxt = "&Euml;";  
       else if (iAscii == 202)  
         encTxt = "&Ecirc;";  
       else if (iAscii == 201)  
         encTxt = "&Eacute;";  
       else if (iAscii == 200)  
         encTxt = "&Egrave;";  
       else if (iAscii == 199)  
         encTxt = "&Ccedil;";  
       else if (iAscii == 198)  
         encTxt = "&AElig;";  
       else if (iAscii == 197)  
         encTxt = "&#197;";  
       else if (iAscii == 196)  
         encTxt = "&Auml;";  
       else if (iAscii == 195)  
         encTxt = "&Atilde;";  
       else if (iAscii == 194)  
         encTxt = "&Acirc;";  
       else if (iAscii == 193)  
         encTxt = "&Aacute;";  
       else if (iAscii == 192)  
         encTxt = "&Agrave;";  
       else if (iAscii == 191)  
         encTxt = "&iquest;";  
       else if (iAscii == 190)  
         encTxt = "&frac34;";  
       else if (iAscii == 189)  
         encTxt = "&frac12;";  
       else if (iAscii == 188)  
         encTxt = "&frac14;";  
       else if (iAscii == 187)  
         encTxt = "&raquo;";  
       else if (iAscii == 186)  
         encTxt = "&ordm;";  
       else if (iAscii == 185)  
         encTxt = "&sup1;";  
       else if (iAscii == 184)  
         encTxt = "&cedil;";  
       else if (iAscii == 183)  
         encTxt = "&middot;";  
       else if (iAscii == 182)  
         encTxt = "&para;";  
       else if (iAscii == 181)  
         encTxt = "&micro;";  
       else if (iAscii == 180)  
         encTxt = "&acute;";  
       else if (iAscii == 179)  
         encTxt = "&sup3;";  
       else if (iAscii == 178)  
         encTxt = "&sup2;";  
       else if (iAscii == 177)  
         encTxt = "&plusmn;";  
       else if (iAscii == 176)  
         encTxt = "&deg;";  
       else if (iAscii == 175)  
         encTxt = "&macr;";  
       else if (iAscii == 174)  
         encTxt = "&reg;";  
       else if (iAscii == 173)  
         encTxt = "&shy;";  
       else if (iAscii == 172)  
         encTxt = "&not;";  
       else if (iAscii == 171)  
         encTxt = "&laquo;";  
       else if (iAscii == 170)  
         encTxt = "&ordf;";  
       else if (iAscii == 169)  
         encTxt = "&copy;";  
       else if (iAscii == 168)  
         encTxt = "&uml;";  
       else if (iAscii == 167)  
         encTxt = "&sect;";  
       else if (iAscii == 166)  
         encTxt = "&brvbar;";  
       else if (iAscii == 165)  
         encTxt = "&yen;";  
       else if (iAscii == 164)  
         encTxt = "&curren;";  
       else if (iAscii == 163)  
         encTxt = "&pound;";  
       else if (iAscii == 162)  
         encTxt = "&cent;";  
       else if (iAscii == 161)  
         encTxt = "&iexcl;";  
       else if (iAscii == 160)  
         encTxt = "&nbsp;";  
       else if (iAscii == 34)  
         encTxt = "&quot;";  
       return encTxt;  
     }  

To call this method;

string res = GetSpecialCharactersEncoded(str);

For further reading, visit here (http://www.ascii.cl/htmlcodes.htm)

The character entity reference chart is here. (https://dev.w3.org/html5/html-author/charref)

Using this method will show the special characters without any issues.

Happy coding... :)


No comments:

Post a Comment