Homepage > html encode and decode

html encode and decode

20/03/2012 18:39

/// <summary>
/// Page load handler that walks through the HTML encode/decode helpers:
/// encoding a string, decoding it again, reaching the Server utility through
/// HttpContext, and letting an HtmlTextWriter encode text while rendering.
/// </summary>
/// <param name="sender">Event source (unused).</param>
/// <param name="e">Event data (unused).</param>
protected void Page_Load(object sender, EventArgs e)
{
    // 1. Raw text containing characters ('&' and '>') that are special in HTML.
    string rawText = "you & me > them";

    // 2. Encoding swaps the special characters for entities ('>' becomes "&gt;").
    string encoded = Server.HtmlEncode(rawText);

    // 3. Decoding the encoded text brings the literal '>' back.
    string decoded = Server.HtmlDecode(encoded);

    // 4. From any class, the Server utility is reachable through HttpContext.Current.
    string encodedViaContext = HttpContext.Current.Server.HtmlEncode(rawText);

    // 5. Render a DIV and let the writer encode the text it writes.
    StringWriter buffer = new StringWriter();
    using (HtmlTextWriter htmlWriter = new HtmlTextWriter(buffer))
    {
        htmlWriter.RenderBeginTag(HtmlTextWriterTag.Div);
        htmlWriter.WriteEncodedText(rawText);
        htmlWriter.RenderEndTag();
    }
    string renderedHtml = buffer.ToString();
}

// Put this in the web.config file, within the <system.web> tag: <pages validateRequest="false" />

Alternatively, set ValidateRequest="false" in the @ Page directive at the top of the .aspx page, like this:

<%@ Page Language="C#" AutoEventWireup="true" CodeBehind="Question.aspx.cs" EnableEventValidation="false"

ValidateRequest="false" Inherits="EmpRecuit.Question" %>

// Then call this function to strip the HTML markup and convert the content to plain text.

/// <summary>
/// Converts HTML markup to plain text: drops the head, script and style
/// sections, turns table cells into tabs and block-level tags into line
/// breaks ('\r'), removes every remaining tag, decodes a handful of common
/// character entities and finally collapses redundant breaks and tabs.
/// </summary>
/// <param name="source">
/// Object whose <c>ToString()</c> value is the HTML to convert. May be null.
/// </param>
/// <returns>
/// The plain-text rendering of the markup, or an empty string when
/// <paramref name="source"/> is null or converts to a null/empty string.
/// </returns>
public string StripHTML(object source)
{
    if (source == null)
    {
        return string.Empty;
    }

    string result = source.ToString();
    if (string.IsNullOrEmpty(result))
    {
        return string.Empty;
    }

    // No try/catch here: every pattern below is a constant, valid expression,
    // so there is no expected failure to swallow once null input is handled.

    // Source-level line breaks are rendered as a space by browsers and tabs
    // are pure formatting, so normalise them before looking at any tags.
    result = result.Replace("\r", " ");
    result = result.Replace("\n", " ");
    result = result.Replace("\t", string.Empty);

    // Browsers ignore repeated spaces.
    result = StripHtmlReplace(result, @"( )+", " ");

    // Remove the header. The opening/closing tags are first normalised
    // (attributes and inner spaces cleared) so the section can be matched
    // with a simple literal pattern. All line breaks were replaced above,
    // so '.' can span the whole section. The match is lazy so it stops at
    // the first closing tag.
    result = StripHtmlReplace(result, @"<( )*head([^>])*>", "<head>");
    result = StripHtmlReplace(result, @"(<( )*(/)( )*head( )*>)", "</head>");
    result = StripHtmlReplace(result, "(<head>).*?(</head>)", string.Empty);

    // Remove all scripts. A greedy match would also delete the visible
    // content between the first and the last script block.
    result = StripHtmlReplace(result, @"<( )*script([^>])*>", "<script>");
    result = StripHtmlReplace(result, @"(<( )*(/)( )*script( )*>)", "</script>");
    result = StripHtmlReplace(result, @"(<script>).*?(</script>)", string.Empty);

    // Remove all styles, same approach.
    result = StripHtmlReplace(result, @"<( )*style([^>])*>", "<style>");
    result = StripHtmlReplace(result, @"(<( )*(/)( )*style( )*>)", "</style>");
    result = StripHtmlReplace(result, "(<style>).*?(</style>)", string.Empty);

    // Insert a tab in place of each <td> tag.
    result = StripHtmlReplace(result, @"<( )*td([^>])*>", "\t");

    // Insert a line break in place of <br> (including the self-closing
    // forms <br/> and <br />) and <li> tags.
    result = StripHtmlReplace(result, @"<( )*br( )*(/)?( )*>", "\r");
    result = StripHtmlReplace(result, @"<( )*li( )*>", "\r");

    // Insert a paragraph break (double line break) in place of
    // <div>, <tr> and <p> tags.
    result = StripHtmlReplace(result, @"<( )*div([^>])*>", "\r\r");
    result = StripHtmlReplace(result, @"<( )*tr([^>])*>", "\r\r");
    result = StripHtmlReplace(result, @"<( )*p([^>])*>", "\r\r");

    // Remove remaining tags (links, images, comments, ...): anything
    // that is enclosed inside < >.
    result = StripHtmlReplace(result, @"<[^>]*>", string.Empty);

    // Decode common character entities. This happens after tag removal so
    // that a decoded '<' or '>' is not mistaken for markup.
    result = StripHtmlReplace(result, @"&nbsp;", " ");
    result = StripHtmlReplace(result, @"&bull;", " * ");
    result = StripHtmlReplace(result, @"&lsaquo;", "<");
    result = StripHtmlReplace(result, @"&rsaquo;", ">");
    result = StripHtmlReplace(result, @"&trade;", "(tm)");
    result = StripHtmlReplace(result, @"&frasl;", "/");
    result = StripHtmlReplace(result, @"&lt;", "<");
    result = StripHtmlReplace(result, @"&gt;", ">");
    result = StripHtmlReplace(result, @"&copy;", "(c)");
    result = StripHtmlReplace(result, @"&reg;", "(r)");

    // Remove all other entities. More explicit mappings can be added above.
    result = StripHtmlReplace(result, @"&(.{2,6});", string.Empty);

    // Remove spaces caught between line breaks and/or tabs.
    result = StripHtmlReplace(result, "(\r)( )+(\r)", "\r\r");
    result = StripHtmlReplace(result, "(\t)( )+(\t)", "\t\t");
    result = StripHtmlReplace(result, "(\t)( )+(\r)", "\t\r");
    result = StripHtmlReplace(result, "(\r)( )+(\t)", "\r\t");

    // Remove tabs that sit alone between two line breaks.
    result = StripHtmlReplace(result, "(\r)(\t)+(\r)", "\r\r");

    // Replace multiple tabs following a line break with just one tab.
    result = StripHtmlReplace(result, "(\r)(\t)+", "\r\t");

    // Cap runs of line breaks at 2 and runs of tabs at 4. A quantifier does
    // this in one pass and handles every run length.
    result = StripHtmlReplace(result, @"\r{3,}", "\r\r");
    result = StripHtmlReplace(result, @"\t{5,}", "\t\t\t\t");

    return result;
}

// Case-insensitive Regex.Replace shorthand used by StripHTML.
private static string StripHtmlReplace(string input, string pattern, string replacement)
{
    return System.Text.RegularExpressions.Regex.Replace(
        input,
        pattern,
        replacement,
        System.Text.RegularExpressions.RegexOptions.IgnoreCase);
}

Tags:

html encode and decode

Back

html encode and decode

Tags:

Contact