Utils.cs - MarkdownDeep - http://www.toptensoftware.com/mar…

/src/ServiceStack/Support/MarkdownDeep/Utils.cs

http://github.com/ServiceStack/ServiceStack · C# · 487 lines · 341 code · 70 blank · 76 comment · 101 complexity · a5a04203606186c360fa3992da4fa1f5 MD5 · raw file

// 

//   MarkdownDeep - http://www.toptensoftware.com/markdowndeep

//	 Copyright (C) 2010-2011 Topten Software

// 

//   Licensed under the Apache License, Version 2.0 (the "License"); you may not use this product except in 

//   compliance with the License. You may obtain a copy of the License at

//

//   http://www.apache.org/licenses/LICENSE-2.0

//

//   Unless required by applicable law or agreed to in writing, software distributed under the License is 

//   distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 

//   See the License for the specific language governing permissions and limitations under the License.

//



using System;

using System.Collections.Generic;

using System.Linq;

using System.Text;

using System.Text.RegularExpressions;

using ServiceStack.Text;



namespace MarkdownDeep

{

	/*

	 * Various utility and extension methods

	 */

	static class Utils

	{

		// Extension method. Returns the final element of the list, or default(T)
		// (null for reference types, zero for numeric types) when the list is empty.
		public static T Last<T>(this List<T> list)
		{
			int lastIndex = list.Count - 1;
			if (lastIndex < 0)
				return default(T);

			return list[lastIndex];
		}



	    // Extension method. Returns the element at index 0, or default(T)
		// (null for reference types, zero for numeric types) when the list is empty.
		public static T First<T>(this List<T> list)
		{
			if (list.Count <= 0)
				return default(T);

			return list[0];
		}



	    // Extension method.  Lets a list be used as a stack: the pushed value is
		// placed after the current last element, so the end of the list is the top.
		public static void Push<T>(this List<T> list, T value)
		{
			// Inserting at index == Count is the same as appending
			list.Insert(list.Count, value);
		}



		// Extension method.  Removes the last item from the list and returns it.
		// An empty list is left untouched and default(T) is returned instead.
		public static T Pop<T>(this List<T> list)
		{
			int top = list.Count - 1;
			if (top < 0)
				return default(T);

			T popped = list[top];
			list.RemoveAt(top);
			return popped;
		}





		// Try to read an identifier from `str` beginning at index `pos`.
		// The first character must be a letter or '_'; following characters may be
		// letters, digits or '_'.
		// On success returns true, stores the matched text in `identifer` and moves
		// `pos` to the first character after the identifier.
		// On failure returns false and leaves both `pos` and `identifer` unchanged.
		public static bool ParseIdentifier(string str, ref int pos, ref string identifer)
		{
			// Nothing left to scan
			if (pos >= str.Length)
				return false;

			// Validate the leading character
			char first = str[pos];
			if (first != '_' && !char.IsLetter(first))
				return false;

			// Advance over the remaining identifier characters
			int scan = pos + 1;
			for (; scan < str.Length; scan++)
			{
				char c = str[scan];
				bool isIdentifierChar = c == '_' || char.IsLetter(c) || char.IsDigit(c);
				if (!isIdentifierChar)
					break;
			}

			// Publish the result
			identifer = str.Substring(pos, scan - pos);
			pos = scan;
			return true;
		}



		// Skip over anything that looks like a valid html entity terminated by ';'
		// (eg: &amp; &#123; &#x1F;).
		//
		//   str    - the text being scanned
		//   pos    - index of the candidate '&'; on success it is advanced to the
		//            character after the terminating ';', otherwise it is unchanged
		//   entity - on success receives the full entity text including '&' and ';',
		//            otherwise it is unchanged
		//
		// Returns true only if a complete entity was found at `pos`.  A null string
		// or a `pos` outside the string yields false instead of throwing.
		public static bool SkipHtmlEntity(string str, ref int pos, ref string entity)
		{
			// Guard against null input and positions outside the string
			if (str == null || pos < 0 || pos >= str.Length)
				return false;

			if (str[pos] != '&')
				return false;

			int savepos = pos;
			int len = str.Length;
			int i = pos + 1;

			// Number entity?
			bool bNumber = false;
			bool bHex = false;
			if (i < len && str[i] == '#')
			{
				bNumber = true;
				i++;

				// Hex entity?
				if (i < len && (str[i] == 'x' || str[i] == 'X'))
				{
					bHex = true;
					i++;
				}
			}

			// Parse the content.  Only ASCII digits/letters are accepted: char.IsDigit
			// and char.IsLetterOrDigit also match non-ASCII characters, which can
			// never be part of a real character reference.
			int contentpos = i;
			while (i < len)
			{
				char ch = str[i];
				bool isDigit = ch >= '0' && ch <= '9';

				bool accepted;
				if (bHex)
					accepted = isDigit || (ch >= 'a' && ch <= 'f') || (ch >= 'A' && ch <= 'F');
				else if (bNumber)
					accepted = isDigit;
				else
					accepted = isDigit || (ch >= 'a' && ch <= 'z') || (ch >= 'A' && ch <= 'Z');

				if (!accepted)
					break;

				i++;
			}

			// Quit if ran out of string
			if (i == len)
				return false;

			// Quit if nothing in the content
			if (i == contentpos)
				return false;

			// Quit if didn't find a semicolon
			if (str[i] != ';')
				return false;

			// Looks good...
			pos = i + 1;
			entity = str.Substring(savepos, pos - savepos);
			return true;
		}



		// Obfuscate `str` by appending each of its characters to `dest` either
		// literally, as a decimal entity (&#NNN;) or as a hex entity (&#xHH;).
		// The choice per character is pseudo-random, but the generator is seeded
		// from the sum of the character codes, so the same input always produces
		// the same output.  '@' is never written literally.
		public static void HtmlRandomize(StringBuilder dest, string str)
		{
			// Derive a deterministic seed from the input
			int seed = 0;
			for (int i = 0; i < str.Length; i++)
			{
				seed = unchecked(seed + str[i]);
			}
			Random rng = new Random(seed);

			// Pick one representation per character
			for (int i = 0; i < str.Length; i++)
			{
				char c = str[i];
				int roll = rng.Next() % 100;

				// Roughly one in ten characters stays literal (never '@')
				if (roll > 90 && c != '@')
				{
					dest.Append(c);
					continue;
				}

				int code = c;
				if (roll > 45)
				{
					// Decimal entity
					dest.Append("&#").Append(code.ToString()).Append(";");
				}
				else
				{
					// Hexadecimal entity
					dest.Append("&#x").Append(code.ToString("x")).Append(";");
				}
			}
		}



		// Append `str` to `dest`, escaping '<', '>' and '"' and also escaping every
		// '&' that does not begin something SkipHtmlEntity accepts as an entity.
		// Accepted entities are copied through unchanged.  A null `str` appends nothing.
		public static void SmartHtmlEncodeAmpsAndAngles(StringBuilder dest, string str)
		{
			if (str == null)
				return;

			int i = 0;
			while (i < str.Length)
			{
				char c = str[i];

				if (c == '&')
				{
					int next = i;
					string ignored = null;
					if (SkipHtmlEntity(str, ref next, ref ignored))
					{
						// Copy the whole entity verbatim and resume right after it
						dest.Append(str, i, next - i);
						i = next;
						continue;
					}

					// A bare ampersand
					dest.Append("&amp;");
				}
				else if (c == '<')
				{
					dest.Append("&lt;");
				}
				else if (c == '>')
				{
					dest.Append("&gt;");
				}
				else if (c == '\"')
				{
					dest.Append("&quot;");
				}
				else
				{
					dest.Append(c);
				}

				i++;
			}
		}





		// Append the range [startOffset, startOffset + len) of `str` to `dest`,
		// escaping only those '&' characters that do not begin an html entity.
		// Entities recognised by SkipHtmlEntity are copied through unchanged.
		//
		// SkipHtmlEntity scans the whole string, not just the requested range, so an
		// entity that starts inside the range but ends beyond it is not treated as
		// an entity here: its '&' is escaped and only the in-range characters are
		// emitted.  This guarantees nothing outside the range is ever appended.
		public static void SmartHtmlEncodeAmps(StringBuilder dest, string str, int startOffset, int len)
		{
			int end = startOffset + len;
			for (int i = startOffset; i < end; i++)
			{
				char ch = str[i];
				if (ch != '&')
				{
					dest.Append(ch);
					continue;
				}

				int next = i;
				string unused = null;
				if (SkipHtmlEntity(str, ref next, ref unused) && next <= end)
				{
					// Complete entity inside the range - copy it verbatim
					dest.Append(str, i, next - i);

					// Resume after the entity (the loop increment adds the final +1)
					i = next - 1;
				}
				else
				{
					// Bare ampersand, or an entity cut off by the end of the range
					dest.Append("&amp;");
				}
			}
		}



		// Check if a string is in an array of strings.
		//
		// The match is an exact, case-sensitive ordinal comparison.  A culture-
		// sensitive comparison must not be used here because it treats some distinct
		// strings as equal (for example it ignores soft hyphens), which is wrong for
		// a membership test against a fixed list.
		//
		// Returns false when `list` is null or empty.  A null `str` matches only a
		// null entry in the list.
		public static bool IsInList(string str, string[] list)
		{
			if (list == null)
				return false;

			foreach (var t in list)
			{
				if (string.Equals(t, str, StringComparison.Ordinal))
					return true;
			}
			return false;
		}



		// Check if a url is "safe": it must begin with exactly "http://", "https://"
		// or "ftp://".  Everything else, including "javascript:" in any encoding,
		// is rejected, as is a null url.
		//
		// The prefix test is ordinal.  A culture-sensitive StartsWith skips ignorable
		// characters (e.g. a leading soft hyphen), which would let a string that does
		// not literally start with an allowed protocol through this check.
		public static bool IsSafeUrl(string url)
		{
			if (url == null)
				return false;

			return url.StartsWith("http://", StringComparison.Ordinal)
				|| url.StartsWith("https://", StringComparison.Ordinal)
				|| url.StartsWith("ftp://", StringComparison.Ordinal);
		}



		// Check if a character is escapable in markdown (i.e. may follow a backslash).
		//   ch        - the character to test
		//   ExtraMode - when true, the additional characters ':' '|' '=' '<' are
		//               escapable as well
		public static bool IsEscapableChar(char ch, bool ExtraMode)
		{
			// Always escapable.  '>' is not in the markdown documentation, but is
			// in markdown.pl.
			const string always = "\\`*_{}[]()>#+-.!";

			// Escapable only in extra mode.  '=' was added for escaping Setext H1.
			const string extraOnly = ":|=<";

			if (always.IndexOf(ch) >= 0)
				return true;

			if (extraOnly.IndexOf(ch) >= 0)
				return ExtraMode;

			return false;
		}



		// Extension method.  Advance the scanner past one logical character:
		// two positions when it sits on a backslash followed by an escapable
		// character (per IsEscapableChar), otherwise one position.
		public static void SkipEscapableChar(this StringScanner p, bool ExtraMode)
		{
			bool onEscapeSequence = p.current == '\\' && IsEscapableChar(p.CharAtOffset(1), ExtraMode);
			int step = onEscapeSequence ? 2 : 1;
			p.SkipForward(step);
		}





		// Remove the markdown escapes from a string: every backslash that is
		// directly followed by an escapable character (per IsEscapableChar) is
		// dropped and the following character kept.  Other backslashes are kept.
		// A null string, or one containing no backslash, is returned as-is.
		public static string UnescapeString(string str, bool ExtraMode)
		{
			if (str == null)
				return str;

			// Fast path - nothing to unescape
			if (str.IndexOf('\\') < 0)
				return str;

			var buffer = StringBuilderCacheAlt.Allocate();

			int i = 0;
			while (i < str.Length)
			{
				bool isEscape = str[i] == '\\'
					&& i + 1 < str.Length
					&& IsEscapableChar(str[i + 1], ExtraMode);

				// Step over the backslash so only the escaped character is emitted
				if (isEscape)
					i++;

				buffer.Append(str[i]);
				i++;
			}

			return StringBuilderCacheAlt.ReturnAndFree(buffer);
		}



		// Normalize the line ends in a string to just '\n'.
		// A string containing neither '\r' nor '\n' is returned unchanged without
		// building a copy.  Otherwise the text is walked with a StringScanner and
		// each line end it reports is replaced by a single '\n'.
		// NOTE(review): the original note lists '\r\n', '\n\r', '\n' and '\r' as
		// handled; how pairs are consumed is decided by StringScanner.SkipEol,
		// which is not defined in this file - confirm there.
		static char[] lineends = new char[] { '\r', '\n' };
		public static string NormalizeLineEnds(string str)
		{
			// Fast path - no line end characters at all
			if (str.IndexOfAny(lineends) < 0)
				return str;

			var normalized = StringBuilderCacheAlt.Allocate();
			StringScanner scanner = new StringScanner(str);

			while (!scanner.eof)
			{
				if (!scanner.eol)
				{
					// Ordinary character - copy it through
					normalized.Append(scanner.current);
					scanner.SkipForward(1);
					continue;
				}

				// Line end - emit one '\n' and let the scanner consume it
				normalized.Append('\n');
				scanner.SkipEol();
			}

			return StringBuilderCacheAlt.ReturnAndFree(normalized);
		}



		/*

		 * These two functions IsEmailAddress and IsWebAddress

		 * are intended as a quick and dirty way to tell if a 

		 * <autolink> url is email, web address or neither.

		 * 

		 * They are not intended as validating checks.

		 * 

		 * (use of Regex for more correct test unnecessarily

		 *  slowed down some test documents by up to 300%.)

		 */



		// Check if a string looks like an email address: it must contain an '@'
		// and its last '.' must come after the first '@'.
		// This is a quick heuristic, not a validating check.
		public static bool IsEmailAddress(string str)
		{
			int atIndex = str.IndexOf('@');
			bool hasAt = atIndex >= 0;

			// The last dot has to sit somewhere after the '@'
			return hasAt && str.LastIndexOf('.') >= atIndex;
		}



		// Check if a string looks like a url, i.e. begins with exactly "http://",
		// "https://", "ftp://" or "file://".  A null string is not a url.
		//
		// The prefix test is ordinal: a culture-sensitive StartsWith ignores certain
		// characters (e.g. soft hyphens) and would accept strings that do not
		// literally start with one of these protocols.
		public static bool IsWebAddress(string str)
		{
			if (str == null)
				return false;

			return str.StartsWith("http://", StringComparison.Ordinal) ||
					str.StartsWith("https://", StringComparison.Ordinal) ||
					str.StartsWith("ftp://", StringComparison.Ordinal) ||
					str.StartsWith("file://", StringComparison.Ordinal);
		}



		// Check if a string is a valid HTML ID identifier: non-empty, starting
		// with a letter, and made up only of letters, digits, '_', '-', ':' and '.'.
		internal static bool IsValidHtmlID(string str)
		{
			if (String.IsNullOrEmpty(str))
				return false;

			// The leading character has the stricter rule: letters only
			if (!Char.IsLetter(str[0]))
				return false;

			// Every character must come from the permitted set
			foreach (char ch in str)
			{
				switch (ch)
				{
					case '_':
					case '-':
					case ':':
					case '.':
						continue;
				}

				if (!Char.IsLetterOrDigit(ch))
					return false;
			}

			return true;
		}



		// Strip the trailing HTML ID from a header string
		// ie:      ## header text ##			{#<idhere>}
		//			^start           ^out end              ^end
		//
		//   str   - the text containing the header
		//   start - index of the first character of the header
		//   end   - in: index just past the header; out (only when an ID is found):
		//           index just past the header text, with the "{#id}" suffix and the
		//           whitespace in front of it removed
		//
		// Returns the ID text (without "{#" and "}"), or null if there is no valid
		// header ID, in which case `end` is left unchanged.
		public static string StripHtmlID(string str, int start, ref int end)
		{
			// Walk back over trailing whitespace to the last significant character
			int cursor = end - 1;
			for (; cursor >= start; cursor--)
			{
				if (!Char.IsWhiteSpace(str[cursor]))
					break;
			}

			// That character must be the closing '}'
			if (cursor < start)
				return null;
			if (str[cursor] != '}')
				return null;

			int closeBrace = cursor;

			// Search backwards for the opening '{'
			for (cursor--; cursor >= start; cursor--)
			{
				if (str[cursor] == '{')
					break;
			}

			// There must be a '{' inside the range, directly followed by '#'
			if (cursor < start)
				return null;
			if (str[cursor + 1] != '#')
				return null;

			// Extract and check the ID between "{#" and "}"
			int idStart = cursor + 2;
			string id = str.Substring(idStart, closeBrace - idStart);
			if (!IsValidHtmlID(id))
				return null;

			// Skip any whitespace preceding the '{', never moving before `start`
			while (cursor > start && Char.IsWhiteSpace(str[cursor - 1]))
				cursor--;

			// Done!
			end = cursor;
			return id;
		}



		// Check if a url is fully qualified, i.e. it contains "://" anywhere or
		// begins with exactly "mailto:".  A null url is not fully qualified.
		//
		// Both tests are ordinal.  A culture-sensitive StartsWith ignores certain
		// characters (e.g. soft hyphens) and would accept strings that do not
		// literally start with "mailto:".
		public static bool IsUrlFullyQualified(string url)
		{
			if (url == null)
				return false;

			return url.Contains("://") || url.StartsWith("mailto:", StringComparison.Ordinal);
		}



	}

}
Tech Fingerprint

.NET Base Class Library
Alerts (22)

'static' Mutable static field detected; use readonly or const to prevent race conditions
27 30 36 42 48 62 86 154 189 283 316 330 354 355 391 405 414 442 481
'switch (' Switch statement detected; include a default case for robustness
196 285
Complexity hotspot; line 427 (total complexity: 9)
427