Utility.cs - This C# code provides a set of utility methods…

/Watcher/Utility.cs

# · C# · 677 lines · 421 code · 93 blank · 163 comment · 78 complexity · ede8bd409245bfe302aeea4fb959c0fd MD5 · raw file

// WATCHER

//

// Utility.cs

// Main implementation of Watcher Utility functions.

//

// Copyright (c) 2010 Casaba Security, LLC

// All Rights Reserved.

//



using System;

using System.IO;

using System.Diagnostics;

using System.Collections.Specialized;

using System.Collections.Generic;

using System.Globalization;

using System.Text;

using System.Text.RegularExpressions;

using System.Web;

using Fiddler;



namespace CasabaSecurity.Web.Watcher

{

    public static class Utility

    {

        #region Public Method(s)



        /// <summary>
        /// Encode the specified string to its Base-64 representation, using the UTF-8
        /// bytes of the string as the input to the encoder.
        /// </summary>
        /// <param name="data">The string to encode.</param>
        /// <returns>
        /// The Base-64 form of <paramref name="data"/>, or an empty string when
        /// <paramref name="data"/> is null or could not be encoded.
        /// </returns>
        public static string Base64Encode(String data)
        {
            Debug.Assert(data != null, "Cannot encode a null parameter.");
            if (data == null)
            {
                Trace.TraceWarning("Warning: Base64Encode: Not attempting to encode null parameter.");
                return String.Empty;
            }

            try
            {
                byte[] encodedBytes = System.Text.Encoding.UTF8.GetBytes(data);
                return Convert.ToBase64String(encodedBytes);
            }
            catch (ArgumentNullException e)
            {
                // Thrown if the argument to GetBytes or ToBase64String is null
                Trace.TraceError("Error: ArgumentNullException: {0}", e.Message);
            }
            catch (EncoderFallbackException e)
            {
                // Thrown if the string fails to be converted to UTF-8 bytes.
                // The message now names the exception actually caught (it used to say "Decoder...").
                Trace.TraceError("Error: EncoderFallbackException: {0}", e.Message);
            }

            // Best effort: failures are logged above and reported as an empty result.
            return String.Empty;
        }



        /// <summary>
        /// Decode the specified Base-64 string and interpret the resulting bytes as UTF-8 text.
        /// </summary>
        /// <param name="data">The encoded Base-64 string.</param>
        /// <returns>
        /// The decoded text, or an empty string when <paramref name="data"/> is null,
        /// is not valid Base-64, or could not be decoded.
        /// </returns>
        public static string Base64Decode(String data)
        {
            Debug.Assert(data != null, "Cannot decode a null parameter.");
            if (data == null)
            {
                Trace.TraceWarning("Warning: Base64Decode: Not attempting to decode null parameter.");
                return String.Empty;
            }

            try
            {
                byte[] decodedBytes = Convert.FromBase64String(data);
                return System.Text.Encoding.UTF8.GetString(decodedBytes);
            }
            catch (ArgumentNullException e)
            {
                // Thrown if the argument to FromBase64String or GetString is null
                Trace.TraceError("Error: ArgumentNullException: {0}", e.Message);
            }
            catch (FormatException e)
            {
                // Thrown if the string to convert is not valid Base-64
                Trace.TraceError("Error: FormatException: {0}", e.Message);
            }
            catch (DecoderFallbackException e)
            {
                // Thrown if the bytes fail to be converted from UTF-8
                Trace.TraceError("Error: DecoderFallbackException: {0}", e.Message);
            }

            // Best effort: failures are logged above and reported as an empty result.
            return String.Empty;
        }



        /// <summary>
        /// Copy the contents of <paramref name="readStream"/> into
        /// <paramref name="writeStream"/> and then close both streams.
        /// </summary>
        /// <remarks>
        /// A seekable source is rewound to its beginning before copying; a source that
        /// cannot seek is copied from its current position instead of throwing.
        /// Both streams are closed even when the copy fails part-way.
        /// </remarks>
        /// <param name="readStream">The stream to read from.</param>
        /// <param name="writeStream">The stream to write to.</param>
        public static void ReadWriteStream(Stream readStream, Stream writeStream)
        {
            const int BufferLength = 256;
            Byte[] buffer = new Byte[BufferLength];

            try
            {
                // Setting Position on a non-seekable stream throws NotSupportedException.
                if (readStream.CanSeek)
                {
                    readStream.Position = 0;
                }

                int bytesRead;
                while ((bytesRead = readStream.Read(buffer, 0, BufferLength)) > 0)
                {
                    // Write only the bytes actually read in this pass
                    writeStream.Write(buffer, 0, bytesRead);
                }
            }
            finally
            {
                // Close the destination even if closing the source throws.
                try
                {
                    if (readStream != null)
                    {
                        readStream.Close();
                    }
                }
                finally
                {
                    if (writeStream != null)
                    {
                        writeStream.Close();
                    }
                }
            }
        }



        /// <summary>
        /// Get the lower-cased value of the response's Content-Type header.
        /// </summary>
        /// <param name="session">The Fiddler HTTP session to examine.</param>
        /// <returns>
        /// The header value lower-cased with the invariant culture, or null when the
        /// response has no Content-Type header.
        /// </returns>
        public static String GetResponseContentType(Session session)
        {
            if (!session.oResponse.headers.Exists("content-type"))
            {
                return null;
            }

            // Invariant lower-casing: under some cultures (e.g. Turkish) a culture-sensitive
            // ToLower() maps 'I' to a dotless 'ı', which would break comparisons such as
            // "APPLICATION/..." against "application/...".
            return session.oResponse.headers["content-type"].ToLower(CultureInfo.InvariantCulture);
        }



        /// <summary>
        /// Determine whether the specified string contains something that looks like an
        /// email address.  The string is URL-decoded first, so "user%40example.com" matches.
        /// </summary>
        /// <param name="s">The text to search; may be null.</param>
        /// <returns>True if an email-like token is found; false otherwise, including for null or empty input.</returns>
        public static bool IsEmailAddress(String s)
        {
            // Regex.IsMatch throws on null input; there is nothing to find in it anyway.
            if (String.IsNullOrEmpty(s))
            {
                return false;
            }

            // Doesn't hurt to UrlDecode the string since we're looking for an email address
            String decoded = HttpUtility.UrlDecode(s);

            return Regex.IsMatch(decoded, "\\b[A-Z0-9._%+-]+@[A-Z0-9.-]+\\.[A-Z]{2,4}\\b", RegexOptions.IgnoreCase);
        }



        /// <summary>
        /// Determine whether the specified string contains a token shaped like a
        /// credit card number.
        /// </summary>
        /// <param name="s">The text to search.</param>
        /// <returns>
        /// True if the card pattern matches and the input contains no "." character;
        /// false otherwise.
        /// </returns>
        public static bool IsCreditCard(String s)
        {
            // Alternation of digit-count/prefix patterns for the major card families.
            const String CardPattern = "\\b(?:4[0-9]{12}(?:[0-9]{3})?|5[1-5][0-9]{14}|6(?:011|5[0-9][0-9])[0-9]{12}|3[47][0-9]{13}|3(?:0[0-5]|[68][0-9])[0-9]{11}|(?:2131|1800|35\\d{3})\\d{11})\\b";

            bool looksLikeCard = Regex.IsMatch(s, CardPattern, RegexOptions.IgnoreCase);

            // FALSE POSITIVE REDUCTION
            // Session ids of the form 0.1234123412341234 match the pattern above, so any
            // input containing a "." is rejected.
            return looksLikeCard && !s.Contains(".");
        }



        /// <summary>
        /// Determine whether the specified string contains a dash-separated US Social
        /// Security Number (three digits, two digits, four digits).
        /// </summary>
        /// <param name="s">The text to search.</param>
        /// <returns>True if a token of the form ###-##-#### is found.</returns>
        public static bool IsUsSSN(String s)
        {
            // Only the dashed form is recognised; undashed nine-digit runs are ignored.
            const String SsnPattern = "\\b[0-9]{3}-[0-9]{2}-[0-9]{4}\\b";

            return Regex.IsMatch(s, SsnPattern, RegexOptions.IgnoreCase);
        }



        /// <summary>
        /// Determine whether the response's Content-Type header value begins with the
        /// specified content type.
        /// </summary>
        /// <param name="session">The Fiddler HTTP session to examine.</param>
        /// <param name="contentType">
        /// The content type prefix to look for.  The header value it is compared with
        /// has been lower-cased by GetResponseContentType.
        /// </param>
        /// <returns>True if the header exists and starts with <paramref name="contentType"/>.</returns>
        public static bool IsResponseContentType(Session session, String contentType)
        {
            String headerValue = GetResponseContentType(session);
            if (headerValue == null)
            {
                return false;
            }

            // Index 0 means the header value starts with the requested type.
            return headerValue.IndexOf(contentType) == 0;
        }



        /// <summary>
        /// Determine whether the response's Content-Type header value contains the
        /// specified character set name anywhere within it.
        /// </summary>
        /// <param name="session">The Fiddler HTTP session to examine.</param>
        /// <param name="charset">
        /// The character set text to look for.  The header value it is compared with
        /// has been lower-cased by GetResponseContentType.
        /// </param>
        /// <returns>True if the header exists and contains <paramref name="charset"/>.</returns>
        public static bool IsResponseCharset(Session session, String charset)
        {
            String headerValue = GetResponseContentType(session);
            if (headerValue == null)
            {
                return false;
            }

            return headerValue.IndexOf(charset) >= 0;
        }



        /// <summary>
        /// Determine whether the response has a body and declares an HTML or XHTML
        /// content type.
        /// TODO: Fix up to support other variations of text/html.
        /// FIX: This will match Atom and RSS feeds now, which set text/html but use &lt;?xml&gt; in content
        /// </summary>
        /// <param name="session">The Fiddler HTTP session to examine.</param>
        /// <returns>
        /// False when the response body byte array is null; otherwise true if the
        /// content type starts with "text/html" or IsResponseXhtml reports true.
        /// </returns>
        public static bool IsResponseHtml(Session session)
        {
            // No body, nothing to classify.
            if (session.responseBodyBytes == null)
            {
                return false;
            }

            return IsResponseContentType(session, "text/html") || IsResponseXhtml(session);
        }



        /// <summary>
        /// Determine whether the response has a body and declares an XHTML content type.
        /// </summary>
        /// <param name="session">The Fiddler HTTP session to examine.</param>
        /// <returns>
        /// False when the response body byte array is null; otherwise true if the
        /// content type starts with "application/xhtml+xml" or "application/xhtml".
        /// </returns>
        public static bool IsResponseXhtml(Session session)
        {
            // No body, nothing to classify.
            if (session.responseBodyBytes == null)
            {
                return false;
            }

            bool isXhtmlXml = IsResponseContentType(session, "application/xhtml+xml");
            return isXhtmlXml || IsResponseContentType(session, "application/xhtml");
        }



        /// <summary>
        /// Determine whether the response declares a CSS content type.
        /// TODO: Fix up to support other variations of text/css
        /// </summary>
        /// <param name="session">The Fiddler HTTP session to examine.</param>
        /// <returns>True if the response content type starts with "text/css".</returns>
        public static bool IsResponseCss(Session session)
        {
            const String CssContentType = "text/css";

            return IsResponseContentType(session, CssContentType);
        }



        /// <summary>
        /// Determine whether the response declares a JavaScript content type.
        /// TODO: Fix up to support other variations of javascript
        /// </summary>
        /// <param name="session">The Fiddler HTTP session to examine.</param>
        /// <returns>
        /// True if the response content type starts with "application/javascript",
        /// "application/x-javascript" or "text/javascript".
        /// </returns>
        public static bool IsResponseJavascript(Session session)
        {
            // "text/javascript" is the registered media type for scripts and is widely
            // served, so it must be recognised alongside the application/* aliases.
            return IsResponseContentType(session, "application/javascript")
                || IsResponseContentType(session, "application/x-javascript")
                || IsResponseContentType(session, "text/javascript");
        }



        /// <summary>
        /// Determine whether the response declares an XML content type.
        /// TODO: Fix up to support other variations of text/xml
        /// </summary>
        /// <param name="session">The Fiddler HTTP session to examine.</param>
        /// <returns>True if the response content type starts with "text/xml" or "application/xml".</returns>
        public static bool IsResponseXml(Session session)
        {
            if (IsResponseContentType(session, "text/xml"))
            {
                return true;
            }

            return IsResponseContentType(session, "application/xml");
        }



        /// <summary>
        /// Determine whether the response declares a plain-text content type.
        /// </summary>
        /// <param name="session">The Fiddler HTTP session to examine.</param>
        /// <returns>True if the response content type starts with "text/plain".</returns>
        public static bool IsResponsePlain(Session session)
        {
            const String PlainContentType = "text/plain";

            return IsResponseContentType(session, PlainContentType);
        }



        /// <summary>
        /// Attempt to determine the character set used by the response document.  If the character
        /// set cannot be determined, return UTF-8 (a reasonable guess).
        /// </summary>
        /// <remarks>
        /// The charset token of the HTTP Content-Type header wins when present.  Otherwise the
        /// body is scanned for &lt;meta http-equiv="content-type" content="...; charset=X"&gt; tags
        /// and the charset of the last such tag is used.
        /// TODO: Extract XML/XHtml character sets?
        /// </remarks>
        /// <param name="session">The Fiddler HTTP session to examine.</param>
        /// <returns>The lower-cased character set specified by the session content, or "utf-8" if unsure.</returns>
        public static String GetHtmlCharset(Session session)
        {
            const String DefaultEncoding = "utf-8";     // Return UTF-8 if unsure, ASCII is preserved.

            // Favor the character set from the HTTP Content-Type header if it exists.
            String CharacterSet = session.oResponse.headers.GetTokenValue("Content-Type", "charset");
            if (!String.IsNullOrEmpty(CharacterSet))
            {
                // Found the character set in the header: normalize and return.
                return CharacterSet.Trim().ToLower(CultureInfo.InvariantCulture);
            }

            // If there is no content, return the default character set.
            // (This must test the RESPONSE body; the request body is irrelevant here and may be null.)
            if (session.responseBodyBytes == null || session.responseBodyBytes.Length == 0)
            {
                Trace.TraceWarning("Warning: Response body byte-array is null or empty, assuming default character set.");
                return DefaultEncoding;
            }

            // Otherwise, parse the document returned for character set hints.
            String ResponseBody;

            try
            {
                // TODO: Pretty hokey here, defaulting to 7-bit ASCII Encoding
                ResponseBody = Encoding.ASCII.GetString(session.responseBodyBytes);
            }
            catch (DecoderFallbackException e)
            {
                // Thrown if a character cannot be decoded
                Trace.TraceError("Error: DecoderFallbackException: {0}", e.Message);
                Trace.TraceWarning("Warning: Assuming default characterencoding due to previous error.");
                return DefaultEncoding;
            }

            // Find Meta tags specifying the content type, e.g.
            // <meta http-equiv="content-type" content="text/html; charset=utf-8"/>.
            String BodyCharacterSet = null;

            foreach (Match m in Utility.GetHtmlTags(ResponseBody, "meta"))
            {
                String Tag = m.ToString();

                String HttpEquiv = Utility.GetHtmlTagAttribute(Tag, "http-equiv");
                if (String.IsNullOrEmpty(HttpEquiv) ||
                    !String.Equals(HttpEquiv.Trim(), "content-type", StringComparison.OrdinalIgnoreCase))
                {
                    continue;
                }

                String Content = Utility.GetHtmlTagAttribute(Tag, "content");
                if (String.IsNullOrEmpty(Content))
                {
                    continue;
                }

                // Pull just the charset token out of the content value.  Returning the whole
                // value ("text/html; charset=utf-8") would not be a usable encoding name.
                Match CharsetMatch = Regex.Match(Content, "charset\\s*=\\s*[\"']?([^\\s\"';,>]+)", RegexOptions.IgnoreCase);
                if (CharsetMatch.Success)
                {
                    // Later tags override earlier ones: the last declaration wins.
                    BodyCharacterSet = CharsetMatch.Groups[1].Value;
                }
            }

            if (!String.IsNullOrEmpty(BodyCharacterSet))
            {
                // Found the character set in the response body: normalize and return.
                return BodyCharacterSet.Trim().ToLower(CultureInfo.InvariantCulture);
            }

            // Return the default character set if unsure
            return DefaultEncoding;
        }



        /// <summary>
        /// Decode the HTTP response body bytes to text, using the character set reported by
        /// GetHtmlCharset and falling back to UTF-8 when that yields nothing.
        /// </summary>
        /// <remarks>
        /// NOTE(review): this method only converts bytes to a string; it performs no
        /// decompression or dechunking itself - presumably the session has already been
        /// decoded by the caller; confirm.
        /// </remarks>
        /// <param name="session">The Fiddler HTTP session to examine.</param>
        /// <returns>
        /// The decoded response body, or an empty string when the body is null, empty,
        /// or could not be decoded.
        /// </returns>
        public static String GetResponseText(Session session)
        {
            // Ensure the response body is available
            bool bodyMissing = session.responseBodyBytes == null || session.responseBodyBytes.Length == 0;
            if (bodyMissing)
            {
                Trace.TraceWarning("Warning: Response body is empty.");
                return String.Empty;
            }

            // Attempt to determine the character set used by the response document
            String charsetName = Utility.GetHtmlCharset(session);
            String decodedBody = String.Empty;

            try
            {
                // First choice: the encoding the document declares for itself.
                Encoding declaredEncoding = Encoding.GetEncoding(charsetName);
                decodedBody = declaredEncoding.GetString(session.responseBodyBytes);
            }
            catch (DecoderFallbackException e)
            {
                // Thrown if a character cannot be decoded
                Trace.TraceError("Error: DecoderFallbackException: {0}", e.Message);
            }
            catch (ArgumentException e)
            {
                // Thrown if the GetEncoding argument is invalid
                Trace.TraceError("Error: ArgumentException: {0}", e.Message);
            }

            // A non-empty result means the declared encoding worked.
            if (decodedBody != String.Empty)
            {
                return decodedBody;
            }

            try
            {
                // Second choice: UTF-8, used when the declared character set name was unusable.
                Trace.TraceInformation("Falling back to UTF-8 encoding.");
                decodedBody = Encoding.UTF8.GetString(session.responseBodyBytes);
            }
            catch (DecoderFallbackException e)
            {
                // Thrown if a character cannot be decoded
                Trace.TraceError("Error: DecoderFallbackException: {0}", e.Message);
            }

            return decodedBody;
        }



        /// <summary>
        /// Find every opening tag with the given name in the supplied markup,
        /// matching the tag name case-insensitively.
        /// TODO: Update with balanced group constructs
        /// </summary>
        /// <param name="body">The markup to search.</param>
        /// <param name="tagName">The tag name to look for; it is inserted into the regular expression as-is.</param>
        /// <returns>The matches, one per opening tag found (from the "&lt;" through the next "&gt;").</returns>
        public static MatchCollection GetHtmlTags(String body, String tagName)
        {
            // "<", optional whitespace, the tag name, then either nothing or
            // whitespace-separated attribute text, up to the closing ">".
            String tagPattern = "<\\s*?" + tagName + "((\\s*?)|(\\s+?\\w.*?))>";

            return Regex.Matches(body, tagPattern, RegexOptions.IgnoreCase);
        }



        /// <summary>
        /// Trim surrounding whitespace from a value and then remove its enclosing quote
        /// characters.
        /// </summary>
        /// <remarks>
        /// At each end, every consecutive double quote is removed when that end has a
        /// double quote; otherwise every consecutive single quote is removed.
        /// </remarks>
        /// <param name="val">The value to strip.</param>
        /// <returns>The value without surrounding whitespace and quotes.</returns>
        public static String StripQuotes(String val)
        {
            String stripped = val.Trim();

            // Leading side: prefer double quotes, fall back to single quotes.
            char leadingQuote = stripped.StartsWith("\"") ? '\"' : '\'';
            stripped = stripped.TrimStart(leadingQuote);

            // Trailing side, decided on what is left after the leading trim.
            char trailingQuote = stripped.EndsWith("\"") ? '\"' : '\'';
            stripped = stripped.TrimEnd(trailingQuote);

            return stripped;
        }



        /// <summary>
        /// Test two strings for equality using invariant-culture comparison rules.
        /// </summary>
        /// <param name="x">The first string.</param>
        /// <param name="y">The second string.</param>
        /// <param name="ignoreCase">True to compare case-insensitively.</param>
        /// <returns>
        /// True when both strings are non-null and compare as equal; false otherwise
        /// (two nulls are NOT considered equal).
        /// </returns>
        public static bool CompareStrings(String x, String y, bool ignoreCase)
        {
            // A null on either side never counts as a match.
            if (x == null || y == null)
            {
                return false;
            }

            StringComparer comparer = ignoreCase
                ? StringComparer.InvariantCultureIgnoreCase
                : StringComparer.InvariantCulture;

            return comparer.Compare(x, y) == 0;
        }



        /// <summary>
        /// Lower-case a string with the invariant culture, tolerating null input.
        /// </summary>
        /// <param name="s">The string to convert; may be null.</param>
        /// <returns>The lower-cased string, or null when <paramref name="s"/> is null.</returns>
        public static string ToSafeLower(string s)
        {
            if (s == null)
            {
                return s;
            }

            return s.ToLower(CultureInfo.InvariantCulture);
        }





        /// <summary>
        /// Find single-line and multi-line HTML comments in the supplied markup, e.g.
        /// &lt;!-- this is a comment --&gt;
        /// &lt;!-- this-is-a comment --&gt;
        /// </summary>
        /// <param name="body">The markup to search.</param>
        /// <returns>The matches, one per comment, each spanning from "&lt;!--" to the nearest "--&gt;".</returns>
        public static MatchCollection GetHtmlComment(String body)
        {
            const RegexOptions CommentOptions =
                RegexOptions.IgnoreCase | RegexOptions.Multiline | RegexOptions.Singleline | RegexOptions.CultureInvariant;

            // The lazy ".*?" stops at the first terminator, which avoids catastrophic backtracking.
            return Regex.Matches(body, "<!--.*?-->", CommentOptions);
        }



        /// <summary>
        /// Find block comments in JavaScript source, whether they sit on one line or
        /// span several, e.g.
        /// /* this is a comment */
        /// /* this is a
        /// * comment
        /// ****/
        /// </summary>
        /// <param name="body">The script text to search.</param>
        /// <returns>The matches, one per block comment, each spanning from the opening marker to the nearest closing marker.</returns>
        public static MatchCollection GetJavascriptMultiLineComment(String body)
        {
            // Singleline lets "." cross line breaks so multi-line comments are captured whole.
            const RegexOptions BlockCommentOptions = RegexOptions.Singleline | RegexOptions.Compiled;

            return Regex.Matches(body, @"(/\*.*?\*/)", BlockCommentOptions);
        }



        /// <summary>
        /// Find line comments in JavaScript source: each match runs from a "//" to the
        /// end of that line.
        /// </summary>
        /// <remarks>
        /// Any "//" starts a match, so text such as the "//" in a URL literal is matched too.
        /// </remarks>
        /// <param name="body">The script text to search.</param>
        /// <returns>The matches, one per "//" run found.</returns>
        public static MatchCollection GetJavascriptSingleLineComment(String body)
        {
            const String LineCommentPattern = @"(//.*)";

            return Regex.Matches(body, LineCommentPattern, RegexOptions.Compiled);
        }



        /// <summary>
        /// Extract the value of the named attribute from the text of a single HTML tag.
        /// </summary>
        /// <remarks>
        /// A quoted value (single or double quotes) anywhere in the tag is preferred; the
        /// closing quote must be the same character as the opening one, so a value such as
        /// "it's" is returned whole.  Otherwise an unquoted value is read up to the next
        /// whitespace or "&gt;", neither of which is included in the result.
        /// The value is returned as written: it is NOT URL-decoded, since decoding would turn
        /// "+" into a space; callers that want decoded values must decode them themselves.
        /// </remarks>
        /// <param name="tag">The tag text, e.g. &lt;a href="x"&gt;.</param>
        /// <param name="attributeName">
        /// The attribute name, matched case-insensitively.  It is inserted into the regular
        /// expression as-is.
        /// </param>
        /// <returns>The attribute value without its quotes, or null when the attribute is not found.</returns>
        public static String GetHtmlTagAttribute(String tag, String attributeName)
        {
            if (String.IsNullOrEmpty(tag) || String.IsNullOrEmpty(attributeName))
            {
                return null;
            }

            // The lookbehind stops "href" from matching inside "data-href" or "xhref".
            String namePrefix = "(?<![\\w-])" + attributeName + "\\s*=\\s*";

            // Quoted value: the backreference forces the closing quote to match the opening one.
            Match quoted = Regex.Match(tag, namePrefix + "(?<quote>['\"])(?<value>.*?)\\k<quote>", RegexOptions.IgnoreCase);
            if (quoted.Success)
            {
                return quoted.Groups["value"].Value;
            }

            // Unquoted value: runs to the next whitespace or the end of the tag, exclusive.
            // The second pattern is only evaluated when no quoted value exists.
            Match unquoted = Regex.Match(tag, namePrefix + "(?<value>[^\\s>]*)", RegexOptions.IgnoreCase);
            if (unquoted.Success)
            {
                return unquoted.Groups["value"].Value;
            }

            return null;
        }



        /// <summary>
        /// Find every element with the given tag name in the supplied markup and return the
        /// text of each, from its opening tag to the nearest matching closing tag.
        /// TODO: Update with balanced group constructs
        /// </summary>
        /// <remarks>
        /// Tag names are matched case-insensitively, consistent with GetHtmlTags.  Nested
        /// elements of the same name are not handled: each match ends at the first closing tag.
        /// </remarks>
        /// <param name="body">The markup to search; null or empty yields an empty array.</param>
        /// <param name="tagName">The tag name to look for; it is inserted into the regular expression as-is.</param>
        /// <param name="stripEnclosingTags">
        /// True to remove the opening and closing tags of this name from each result;
        /// false to return each match including its tags.
        /// </param>
        /// <returns>One string per element found; never null.</returns>
        public static String[] GetHtmlTagBodies(String body, String tagName, bool stripEnclosingTags)
        {
            if (String.IsNullOrEmpty(body))
            {
                return new String[] { };
            }

            // The same option set must be used for matching and stripping; otherwise a tag
            // that was matched (e.g. with attributes spread over several lines, or in upper
            // case) would not be stripped afterwards.
            const RegexOptions TagOptions = RegexOptions.Singleline | RegexOptions.IgnoreCase;

            String openTagPattern = @"<\s*?" + tagName + @"((\s*?)|(\s+?\w.*?))>";
            String closeTagPattern = @"<\s*?\/\s*?" + tagName + @"\s*?>";

            // Match opening->closing tag, nested tags not handled
            MatchCollection mc = Regex.Matches(body, openTagPattern + ".*?" + closeTagPattern, TagOptions | RegexOptions.Compiled);

            // An empty collection produces an empty array rather than null.
            String[] bodies = new String[mc.Count];
            int x = 0;

            foreach (Match m in mc)
            {
                String tmp = m.ToString();

                if (stripEnclosingTags)
                {
                    tmp = Regex.Replace(tmp, openTagPattern, "", TagOptions);
                    tmp = Regex.Replace(tmp, closeTagPattern, "", TagOptions);
                }

                bodies[x++] = tmp;
            }

            return bodies;
        }



        /// <summary>
        /// Find every element with the given tag name in the supplied markup and return the
        /// text of each with its enclosing tags removed.
        /// </summary>
        /// <param name="body">The markup to search.</param>
        /// <param name="tagName">The tag name to look for.</param>
        /// <returns>The result of the three-argument overload called with stripEnclosingTags set to true.</returns>
        public static String[] GetHtmlTagBodies(String body, String tagName)
        {
            const bool StripEnclosingTags = true;

            return GetHtmlTagBodies(body, tagName, StripEnclosingTags);
        }



        /// <summary>
        /// Extract the authority part (everything between "://" and the start of the path,
        /// query or fragment) from an http or https URI.
        /// </summary>
        /// <remarks>
        /// The scheme is matched case-insensitively.  The result is returned as written in
        /// the URI: it is not lower-cased, and a port or user-info component, if present,
        /// is kept.
        /// </remarks>
        /// <param name="src">The URI to examine; may be null.</param>
        /// <returns>
        /// The authority text, or null when <paramref name="src"/> is null or does not begin
        /// with "http://" or "https://".
        /// </returns>
        public static String GetUriDomainName(String src)
        {
            if (src == null)
            {
                return null;
            }

            // Ordinal comparison: URI schemes are protocol text, not linguistic text.
            bool isHttp = src.StartsWith("http://", StringComparison.OrdinalIgnoreCase);
            bool isHttps = src.StartsWith("https://", StringComparison.OrdinalIgnoreCase);
            if (!isHttp && !isHttps)
            {
                return null;
            }

            // get text past ://
            String dom = src.Substring(src.IndexOf("://", StringComparison.Ordinal) + 3);

            // The authority ends at the first path, query or fragment delimiter.  Checking only
            // "/" would leave "example.com?x=1" intact for URIs that have a query but no path.
            int end = dom.IndexOfAny(new char[] { '/', '?', '#' });
            if (end >= 0)
            {
                dom = dom.Substring(0, end);
            }

            return dom;
        }



        /// <summary>
        /// Check whether a URL is absent from a running list of URLs and, if it is absent,
        /// add it to the list.
        /// </summary>
        /// <remarks>
        /// The URL is normalized through <see cref="Uri"/> before comparison, and the list is
        /// locked for the duration of the check-and-add.  The list is expected to be reset
        /// elsewhere when the user clicks the Clear() button (via that button's event handler).
        /// </remarks>
        /// <param name="url">A full URI, must include the scheme as in http://www.nottrusted.org.  Provided by session.fullUrl.</param>
        /// <param name="urls">The List&lt;&gt; of URLs to maintain.</param>
        /// <returns>True if the URL was not yet in the list (and has now been added); false if it was already there.</returns>
        public static bool UrlNotInList(String url, List<string> urls)
        {
            lock (urls)
            {
                // Compare normalized forms so equivalent spellings of a URL collapse together.
                String normalized = new Uri(url).ToString();     // String.Concat(uri.Host, uri.AbsolutePath);

                bool alreadyChecked = urls.Contains(normalized);
                if (!alreadyChecked)
                {
                    // First sighting: remember it for next time.
                    urls.Add(normalized);
                }

                return !alreadyChecked;
            }
        }



        /// <summary>
        /// Collect the request parameters of a session: the query string of a GET request,
        /// or the body of a POST request whose content type is URL-encoded form data.
        /// </summary>
        /// <remarks>
        /// The POST content type is matched by prefix and case-insensitively, so a header such
        /// as "application/x-www-form-urlencoded; charset=UTF-8" is recognised.  The request
        /// body is read as UTF-8 text.  A null key produced by an ill-formed query string is
        /// removed from the result.
        /// </remarks>
        /// <param name="session">The Fiddler HTTP session to examine.</param>
        /// <returns>
        /// The parsed name/value pairs, or null when the request carries no parameters this
        /// method understands.
        /// </returns>
        public static NameValueCollection GetRequestParameters(Session session)
        {
            const String FormContentType = "application/x-www-form-urlencoded";
            String qs = null;

            // If this is GET request with a query string, take everything after the "?"
            if (session.HTTPMethodIs("GET"))
            {
                int queryStart = session.PathAndQuery.IndexOf('?');
                if (queryStart > 0)
                {
                    qs = session.PathAndQuery.Substring(queryStart + 1);
                }
            }

            // If is a POST request with a content-type...
            if (session.HTTPMethodIs("POST") && session.oRequest.headers.Exists("content-type"))
            {
                String contentType = session.oRequest.headers["content-type"];

                // ... and is urlencoded form data.  An exact equality test would miss headers
                // carrying parameters (e.g. "; charset=UTF-8") or different letter case.
                bool isFormData = contentType != null
                    && contentType.Trim().StartsWith(FormContentType, StringComparison.OrdinalIgnoreCase);

                // A missing body has no parameters; GetString(null) would throw.
                if (isFormData && session.requestBodyBytes != null)
                {
                    // TODO: is a decode needed?
                    //session.utilDecodeRequest();

                    // Get the request body as a string
                    qs = System.Text.Encoding.UTF8.GetString(session.requestBodyBytes);
                }
            }

            if (qs == null)
            {
                return null;
            }

            NameValueCollection nvc = null;

            try
            {
                nvc = HttpUtility.ParseQueryString(qs);

                // Remove any nulls from ill-formed query strings
                bool hasNullKey = false;
                foreach (String param in nvc.Keys)
                {
                    if (param == null)
                    {
                        hasNullKey = true;
                        break;
                    }
                }

                if (hasNullKey)
                {
                    nvc.Remove(null);
                }
            }
            // TODO: Could we be missing things here?  False negatives?
            catch (ArgumentNullException ane)
            {
                ExceptionLogger.HandleException(ane);// discard
            }

            return nvc;
        }



        #endregion

    }

}
Summary ✨

This C# code provides static utility methods for Watcher, a Fiddler extension: Base64 encoding and decoding, copying between streams, detecting the content type and character set of an HTTP response, regex-based detection of email addresses, credit card numbers and US Social Security numbers, extracting HTML tags, attributes and comments as well as JavaScript comments, tracking URLs in a list, and parsing request parameters from GET query strings and URL-encoded POST bodies, removing null keys from ill-formed query strings.
Tech Fingerprint

.NET Base Class Library
Alerts (29)

'static' Mutable static field detected; use readonly or const to prevent race conditions
23 32 67 103 119 127 134 153 159 165 177 189 206 216 226 231 243 312 368 373 459 514 549 554 581 606
All Visa card numbers start with a 4. New cards have 16 digits. Old cards have 13.
141
Complexity hotspot; line 405 (total complexity: 6)
405
Complexity hotspot; line 559 (total complexity: 6)
559