//------------------------------------------------------------------------------ // // Copyright (c) Microsoft Corporation. All rights reserved. // //------------------------------------------------------------------------------ // The Regex class represents a single compiled instance of a regular // expression. namespace System.Text.RegularExpressions { using System; using System.Threading; using System.Collections; using System.Reflection; #if !FULL_AOT_RUNTIME using System.Reflection.Emit; #endif using System.Globalization; using System.Security.Permissions; using System.Runtime.CompilerServices; using System.Collections.Generic; using System.Diagnostics.CodeAnalysis; #if !SILVERLIGHT using System.Runtime.Serialization; using System.Runtime.Versioning; #endif /// /// /// Represents an immutable, compiled regular expression. Also /// contains static methods that allow use of regular expressions without instantiating /// a Regex explicitly. /// /// #if !SILVERLIGHT [ Serializable() ] #endif public class Regex #if !SILVERLIGHT : ISerializable #endif { // Fields used by precompiled regexes protected internal string pattern; #if !SILVERLIGHT protected internal RegexRunnerFactory factory; // if compiled, this is the RegexRunner subclass #else internal RegexRunnerFactory factory; // if compiled, this is the RegexRunner subclass #endif protected internal RegexOptions roptions; // the top-level options from the options string // *********** Match timeout fields { *********** // We need this because time is queried using Environment.TickCount for performance reasons // (Environment.TickCount returns millisecs as an int and cycles): #if !SILVERLIGHT [NonSerialized()] #endif private static readonly TimeSpan MaximumMatchTimeout = TimeSpan.FromMilliseconds(Int32.MaxValue - 1); // InfiniteMatchTimeout specifies that match timeout is switched OFF. It allows for faster code paths // compared to simply having a very large timeout. // We do not want to ask users to use System.Threading.Timeout.InfiniteTimeSpan as a parameter because: // (1) We do not want to imply any relation between having using a RegEx timeout and using multi-threading. // (2) We do not want to require users to take ref to a contract assembly for threading just to use RegEx. // There may in theory be a SKU that has RegEx, but no multithreading. // We create a public Regex.InfiniteMatchTimeout constant, which for consistency uses the save underlying // value as Timeout.InfiniteTimeSpan creating an implementation detail dependency only. #if !SILVERLIGHT || FEATURE_NETCORE #if !FEATURE_NETCORE [NonSerialized()] #endif public static readonly TimeSpan InfiniteMatchTimeout = #if BOOTSTRAP_BASIC new TimeSpan (0, 0, 0, 0, Timeout.Infinite); #else Timeout.InfiniteTimeSpan; #endif #else internal static readonly TimeSpan InfiniteMatchTimeout = new TimeSpan(0, 0, 0, 0, Timeout.Infinite); #endif // All these protected internal fields in this class really should not be protected. The historic reason // for this is that classes extending Regex that are generated via CompileToAssembly rely on the fact that // these are accessible as protected in order to initialise them in the generated constructor of the // extending class. We should update this initialisation logic to using a protected constructor, but until // that is done we stick to the existing pattern however ugly it may be. #if !SILVERLIGHT [OptionalField(VersionAdded = 2)] protected internal #else internal #endif TimeSpan internalMatchTimeout; // timeout for the execution of this regex // During static initialisation of Regex we check private const String DefaultMatchTimeout_ConfigKeyName = "REGEX_DEFAULT_MATCH_TIMEOUT"; // FallbackDefaultMatchTimeout specifies the match timeout to use if no other timeout was specified // by one means or another. For now it is set to InfiniteMatchTimeout, meaning timeouts are OFF by // default (for Dev12 we plan to set a positive value). // Having this field is helpful to read the code as it makes it clear when we mean // "default that is currently no-timeouts" and when we mean "actually no-timeouts". // In Silverlight, DefaultMatchTimeout is always set to FallbackDefaultMatchTimeout, // on desktop, DefaultMatchTimeout can be configured via AppDomain and falls back to // FallbackDefaultMatchTimeout, if no AppDomain setting is present (see InitDefaultMatchTimeout()). #if !SILVERLIGHT [NonSerialized()] #endif internal static readonly TimeSpan FallbackDefaultMatchTimeout = InfiniteMatchTimeout; // DefaultMatchTimeout specifies the match timeout to use if no other timeout was specified // by one means or another. Typically, it is set to InfiniteMatchTimeout in Dev 11 // (we plan to set a positive timeout in Dev12). // Hosts (e.g.) ASP may set an AppDomain property via SetData to change the default value. #if !SILVERLIGHT [NonSerialized()] internal static readonly TimeSpan DefaultMatchTimeout = InitDefaultMatchTimeout(); #else internal static readonly TimeSpan DefaultMatchTimeout = FallbackDefaultMatchTimeout; #endif // *********** } match timeout fields *********** #if SILVERLIGHT internal Dictionary caps; // if captures are sparse, this is the hashtable capnum->index internal Dictionary capnames; // if named captures are used, this maps names->index #else // desktop build still uses non-generic collections for AppCompat with .NET Framework 3.5 pre-compiled assemblies protected internal Hashtable caps; protected internal Hashtable capnames; #endif protected internal String[] capslist; // if captures are sparse or named captures are used, this is the sorted list of names protected internal int capsize; // the size of the capture array internal ExclusiveReference runnerref; // cached runner internal SharedReference replref; // cached parsed replacement pattern internal RegexCode code; // if interpreted, this is the code for RegexIntepreter internal bool refsInitialized = false; internal static LinkedList livecode = new LinkedList();// the cached of code and factories that are currently loaded internal static int cacheSize = 15; internal const int MaxOptionShift = 10; protected Regex() { // If a compiled-to-assembly RegEx was generated using an earlier version, then internalMatchTimeout will be uninitialised. // Let's do it here. // In distant future, when RegEx generated using pre Dev11 are not supported any more, we can remove this to aid performance: this.internalMatchTimeout = DefaultMatchTimeout; } /* * Compiles and returns a Regex object corresponding to the given pattern */ /// /// /// Creates and compiles a regular expression object for the specified regular /// expression. /// /// public Regex(String pattern) : this(pattern, RegexOptions.None, DefaultMatchTimeout, false) { } /* * Returns a Regex object corresponding to the given pattern, compiled with * the specified options. */ /// /// /// Creates and compiles a regular expression object for the /// specified regular expression /// with options that modify the pattern. /// /// public Regex(String pattern, RegexOptions options) : this(pattern, options, DefaultMatchTimeout, false) { } #if !SILVERLIGHT || FEATURE_NETCORE public #else private #endif Regex(String pattern, RegexOptions options, TimeSpan matchTimeout) : this(pattern, options, matchTimeout, false) { } private Regex(String pattern, RegexOptions options, TimeSpan matchTimeout, bool useCache) { RegexTree tree; CachedCodeEntry cached = null; string cultureKey = null; if (pattern == null) throw new ArgumentNullException("pattern"); if (options < RegexOptions.None || ( ((int) options) >> MaxOptionShift) != 0) throw new ArgumentOutOfRangeException("options"); if ((options & RegexOptions.ECMAScript) != 0 && (options & ~(RegexOptions.ECMAScript | RegexOptions.IgnoreCase | RegexOptions.Multiline | #if !(SILVERLIGHT) || FEATURE_LEGACYNETCF RegexOptions.Compiled | #endif RegexOptions.CultureInvariant #if DBG | RegexOptions.Debug #endif )) != 0) throw new ArgumentOutOfRangeException("options"); ValidateMatchTimeout(matchTimeout); // Try to look up this regex in the cache. We do this regardless of whether useCache is true since there's // really no reason not to. if ((options & RegexOptions.CultureInvariant) != 0) cultureKey = CultureInfo.InvariantCulture.ToString(); // "English (United States)" else cultureKey = CultureInfo.CurrentCulture.ToString(); String key = ((int) options).ToString(NumberFormatInfo.InvariantInfo) + ":" + cultureKey + ":" + pattern; cached = LookupCachedAndUpdate(key); this.pattern = pattern; this.roptions = options; this.internalMatchTimeout = matchTimeout; if (cached == null) { // Parse the input tree = RegexParser.Parse(pattern, roptions); // Extract the relevant information capnames = tree._capnames; capslist = tree._capslist; code = RegexWriter.Write(tree); caps = code._caps; capsize = code._capsize; InitializeReferences(); tree = null; if (useCache) cached = CacheCode(key); } else { caps = cached._caps; capnames = cached._capnames; capslist = cached._capslist; capsize = cached._capsize; code = cached._code; factory = cached._factory; runnerref = cached._runnerref; replref = cached._replref; refsInitialized = true; } #if !(SILVERLIGHT || FULL_AOT_RUNTIME) // if the compile option is set, then compile the code if it's not already if (UseOptionC() && factory == null) { factory = Compile(code, roptions); if (useCache && cached != null) cached.AddCompiled(factory); code = null; } #endif } #if !SILVERLIGHT /* * ISerializable constructor */ protected Regex(SerializationInfo info, StreamingContext context) : this(info.GetString("pattern"), (RegexOptions) info.GetInt32("options")) { try { Int64 timeoutTicks = info.GetInt64("matchTimeout"); TimeSpan timeout = new TimeSpan(timeoutTicks); ValidateMatchTimeout(timeout); this.internalMatchTimeout = timeout; } catch (SerializationException) { // If this occurs, then assume that this object was serialised using a version // before timeout was added. In that case just do not set a timeout // (keep default value) } } /* * ISerializable method */ /// void ISerializable.GetObjectData(SerializationInfo si, StreamingContext context) { si.AddValue("pattern", this.ToString()); si.AddValue("options", this.Options); si.AddValue("matchTimeout", this.MatchTimeout.Ticks); } #endif // !SILVERLIGHT //* Note: "<" is the XML entity for smaller ("<"). /// /// Validates that the specified match timeout value is valid. /// The valid range is TimeSpan.Zero < matchTimeout <= Regex.MaximumMatchTimeout. /// /// The timeout value to validate. /// If the specified timeout is not within a valid range. /// #if !SILVERLIGHT protected internal #else internal #endif static void ValidateMatchTimeout(TimeSpan matchTimeout) { if (InfiniteMatchTimeout == matchTimeout) return; // Change this to make sure timeout is not longer then Environment.Ticks cycle length: if (TimeSpan.Zero < matchTimeout && matchTimeout <= MaximumMatchTimeout) return; throw new ArgumentOutOfRangeException("matchTimeout"); } #if !SILVERLIGHT /// /// Specifies the default RegEx matching timeout value (i.e. the timeout that will be used if no /// explicit timeout is specified). /// The default is queried from the current AppDomain through GetData using /// the key specified in Regex.DefaultMatchTimeout_ConfigKeyName. For that key, the /// current AppDomain is expected to either return null or a TimeSpan /// value specifying the default timeout within a valid range. /// If the AddDomain's data value for that key is not a TimeSpan value or if it is outside the /// valid range, an exception is thrown which will result in a TypeInitializationException for RegEx. /// If the AddDomain's data value for that key is null, a fallback value is returned /// (see FallbackDefaultMatchTimeout in code). /// /// The default RegEx matching timeout for this AppDomain private static TimeSpan InitDefaultMatchTimeout() { // Query AppDomain: AppDomain ad = AppDomain.CurrentDomain; Object defTmOut = ad.GetData(DefaultMatchTimeout_ConfigKeyName); // If no default is specified, use fallback: if (defTmOut == null) return FallbackDefaultMatchTimeout; // If default has invalid type, throw. It will result in a TypeInitializationException: if (!(defTmOut is TimeSpan)) { #if DBG String errMsg = "AppDomain.CurrentDomain.GetData(\"" + DefaultMatchTimeout_ConfigKeyName + "\")" + " is expected to return null or a value of type System.TimeSpan only; but it returned a value of type" + " '" + defTmOut.GetType().FullName + "'."; System.Diagnostics.Debug.WriteLine(errMsg); #endif throw new InvalidCastException(SR.GetString(SR.IllegalDefaultRegexMatchTimeoutInAppDomain, DefaultMatchTimeout_ConfigKeyName)); } // Convert default value: TimeSpan defaultTimeout = (TimeSpan) defTmOut; // If default timeout is outside the valid range, throw. It will result in a TypeInitializationException: try { ValidateMatchTimeout(defaultTimeout); } catch (ArgumentOutOfRangeException) { #if DBG String errMsg = "AppDomain.CurrentDomain.GetData(\"" + DefaultMatchTimeout_ConfigKeyName + "\")" + " returned a TimeSpan value outside the valid range" + " ("+ defaultTimeout.ToString() + ")."; System.Diagnostics.Debug.WriteLine(errMsg); #endif throw new ArgumentOutOfRangeException(SR.GetString(SR.IllegalDefaultRegexMatchTimeoutInAppDomain, DefaultMatchTimeout_ConfigKeyName)); } // We are good: return defaultTimeout; } // private static TimeSpan InitDefaultMatchTimeout #endif // !SILVERLIGHT #if !SILVERLIGHT && !FULL_AOT_RUNTIME /* * This method is here for perf reasons: if the call to RegexCompiler is NOT in the * Regex constructor, we don't load RegexCompiler and its reflection classes when * instantiating a non-compiled regex * This method is internal virtual so the jit does not inline it. */ [ #if MONO_FEATURE_CAS HostProtection(MayLeakOnAbort=true), #endif MethodImplAttribute(MethodImplOptions.NoInlining) ] internal RegexRunnerFactory Compile(RegexCode code, RegexOptions roptions) { return RegexCompiler.Compile(code, roptions); } #endif // !SILVERLIGHT /* * Escape metacharacters within the string */ /// /// /// Escapes /// a minimal set of metacharacters (\, *, +, ?, |, {, [, (, ), ^, $, ., #, and /// whitespace) by replacing them with their \ codes. This converts a string so that /// it can be used as a constant within a regular expression safely. (Note that the /// reason # and whitespace must be escaped is so the string can be used safely /// within an expression parsed with x mode. If future Regex features add /// additional metacharacters, developers should depend on Escape to escape those /// characters as well.) /// /// public static String Escape(String str) { if (str==null) throw new ArgumentNullException("str"); return RegexParser.Escape(str); } /* * Unescape character codes within the string */ /// /// /// Unescapes any escaped characters in the input string. /// /// [SuppressMessage("Microsoft.Naming","CA1704:IdentifiersShouldBeSpelledCorrectly", MessageId="Unescape", Justification="[....]: already shipped since v1 - can't fix without causing a breaking change")] public static String Unescape(String str) { if (str==null) throw new ArgumentNullException("str"); return RegexParser.Unescape(str); } [SuppressMessage("Microsoft.Concurrency", "CA8001", Justification = "Reviewed for thread-safety")] public static int CacheSize { get { return cacheSize; } set { if (value < 0) throw new ArgumentOutOfRangeException("value"); cacheSize = value; if (livecode.Count > cacheSize) { lock (livecode) { while (livecode.Count > cacheSize) livecode.RemoveLast(); } } } } #if NETSTANDARD [CLSCompliant (false)] protected IDictionary Caps { get { var dict = new Dictionary(); foreach (int key in caps.Keys) { dict.Add (key, (int)caps[key]); } return dict; } set { if (value == null) throw new ArgumentNullException("value"); caps = new Hashtable (value.Count); foreach (DictionaryEntry entry in value) { caps[(int)entry.Key] = (int)entry.Value; } } } [CLSCompliant (false)] protected IDictionary CapNames { get { var dict = new Dictionary(); foreach (string key in capnames.Keys) { dict.Add (key, (int)capnames[key]); } return dict; } set { if (value == null) throw new ArgumentNullException("value"); capnames = new Hashtable (value.Count); foreach (DictionaryEntry entry in value) { capnames[(string)entry.Key] = (int)entry.Value; } } } #endif /// /// /// Returns the options passed into the constructor /// /// public RegexOptions Options { get { return roptions;} } /// /// The match timeout used by this Regex instance. /// #if !SILVERLIGHT || FEATURE_NETCORE public #else internal #endif TimeSpan MatchTimeout { get { return internalMatchTimeout; } } /* * True if the regex is leftward */ /// /// /// Indicates whether the regular expression matches from right to /// left. /// /// public bool RightToLeft { get { return UseOptionR(); } } /// /// /// Returns the regular expression pattern passed into the constructor /// /// public override string ToString() { return pattern; } /* * Returns an array of the group names that are used to capture groups * in the regular expression. Only needed if the regex is not known until * runtime, and one wants to extract captured groups. (Probably unusual, * but supplied for completeness.) */ /// /// Returns /// the GroupNameCollection for the regular expression. This collection contains the /// set of strings used to name capturing groups in the expression. /// public String[] GetGroupNames() { String[] result; if (capslist == null) { int max = capsize; result = new String[max]; for (int i = 0; i < max; i++) { result[i] = Convert.ToString(i, CultureInfo.InvariantCulture); } } else { result = new String[capslist.Length]; System.Array.Copy(capslist, 0, result, 0, capslist.Length); } return result; } /* * Returns an array of the group numbers that are used to capture groups * in the regular expression. Only needed if the regex is not known until * runtime, and one wants to extract captured groups. (Probably unusual, * but supplied for completeness.) */ /// /// returns /// the integer group number corresponding to a group name. /// public int[] GetGroupNumbers() { int[] result; if (caps == null) { int max = capsize; result = new int[max]; for (int i = 0; i < max; i++) { result[i] = i; } } else { result = new int[caps.Count]; IDictionaryEnumerator de = caps.GetEnumerator(); while (de.MoveNext()) { result[(int)de.Value] = (int)de.Key; } } return result; } /* * Given a group number, maps it to a group name. Note that nubmered * groups automatically get a group name that is the decimal string * equivalent of its number. * * Returns null if the number is not a recognized group number. */ /// /// /// Retrieves a group name that corresponds to a group number. /// /// public String GroupNameFromNumber(int i) { if (capslist == null) { if (i >= 0 && i < capsize) return i.ToString(CultureInfo.InvariantCulture); return String.Empty; } else { if (caps != null) { #if SILVERLIGHT if (!caps.ContainsKey(i)) #else Object obj = caps[i]; if (obj == null) #endif return String.Empty; #if SILVERLIGHT i = caps[i]; #else i = (int)obj; #endif } if (i >= 0 && i < capslist.Length) return capslist[i]; return String.Empty; } } /* * Given a group name, maps it to a group number. Note that nubmered * groups automatically get a group name that is the decimal string * equivalent of its number. * * Returns -1 if the name is not a recognized group name. */ /// /// /// Returns a group number that corresponds to a group name. /// /// public int GroupNumberFromName(String name) { int result = -1; if (name == null) throw new ArgumentNullException("name"); // look up name if we have a hashtable of names if (capnames != null) { #if SILVERLIGHT if (!capnames.ContainsKey(name)) #else Object ret = capnames[name]; if (ret == null) #endif return -1; #if SILVERLIGHT return capnames[name]; #else return(int)ret; #endif } // convert to an int if it looks like a number result = 0; for (int i = 0; i < name.Length; i++) { char ch = name[i]; if (ch > '9' || ch < '0') return -1; result *= 10; result += (ch - '0'); } // return int if it's in range if (result >= 0 && result < capsize) return result; return -1; } /* * Static version of simple IsMatch call */ /// /// /// Searches the input /// string for one or more occurrences of the text supplied in the pattern /// parameter. /// /// public static bool IsMatch(String input, String pattern) { return IsMatch(input, pattern, RegexOptions.None, DefaultMatchTimeout); } /* * Static version of simple IsMatch call */ /// /// /// Searches the input string for one or more occurrences of the text /// supplied in the pattern parameter with matching options supplied in the options /// parameter. /// /// public static bool IsMatch(String input, String pattern, RegexOptions options) { return IsMatch(input, pattern, options, DefaultMatchTimeout); } #if !SILVERLIGHT || FEATURE_NETCORE public #else private #endif static bool IsMatch(String input, String pattern, RegexOptions options, TimeSpan matchTimeout) { return new Regex(pattern, options, matchTimeout, true).IsMatch(input); } /* * Returns true if the regex finds a match within the specified string */ /// /// /// Searches the input string for one or /// more matches using the previous pattern, options, and starting /// position. /// /// public bool IsMatch(String input) { if (input == null) throw new ArgumentNullException("input"); return IsMatch(input, UseOptionR() ? input.Length : 0); } /* * Returns true if the regex finds a match after the specified position * (proceeding leftward if the regex is leftward and rightward otherwise) */ /// /// /// Searches the input /// string for one or more matches using the previous pattern and options, with /// a new starting position. /// /// public bool IsMatch(String input, int startat) { if (input == null) throw new ArgumentNullException("input"); return (null == Run(true, -1, input, 0, input.Length, startat)); } /* * Static version of simple Match call */ /// /// /// Searches the input string for one or more occurrences of the text /// supplied in the pattern parameter. /// /// public static Match Match(String input, String pattern) { return Match(input, pattern, RegexOptions.None, DefaultMatchTimeout); } /* * Static version of simple Match call */ /// /// /// Searches the input string for one or more occurrences of the text /// supplied in the pattern parameter. Matching is modified with an option /// string. /// /// public static Match Match(String input, String pattern, RegexOptions options) { return Match(input, pattern, options, DefaultMatchTimeout); } #if !SILVERLIGHT || FEATURE_NETCORE public #else private #endif static Match Match(String input, String pattern, RegexOptions options, TimeSpan matchTimeout) { return new Regex(pattern, options, matchTimeout, true).Match(input); } /* * Finds the first match for the regular expression starting at the beginning * of the string (or at the end of the string if the regex is leftward) */ /// /// /// Matches a regular expression with a string and returns /// the precise result as a RegexMatch object. /// /// public Match Match(String input) { if (input == null) throw new ArgumentNullException("input"); return Match(input, UseOptionR() ? input.Length : 0); } /* * Finds the first match, starting at the specified position */ /// /// Matches a regular expression with a string and returns /// the precise result as a RegexMatch object. /// public Match Match(String input, int startat) { if (input == null) throw new ArgumentNullException("input"); return Run(false, -1, input, 0, input.Length, startat); } /* * Finds the first match, restricting the search to the specified interval of * the char array. */ /// /// /// Matches a /// regular expression with a string and returns the precise result as a /// RegexMatch object. /// /// public Match Match(String input, int beginning, int length) { if (input == null) throw new ArgumentNullException("input"); return Run(false, -1, input, beginning, length, UseOptionR() ? beginning + length : beginning); } /* * Static version of simple Matches call */ /// /// /// Returns all the successful matches as if Match were /// called iteratively numerous times. /// /// public static MatchCollection Matches(String input, String pattern) { return Matches(input, pattern, RegexOptions.None, DefaultMatchTimeout); } /* * Static version of simple Matches call */ /// /// /// Returns all the successful matches as if Match were called iteratively /// numerous times. /// /// public static MatchCollection Matches(String input, String pattern, RegexOptions options) { return Matches(input, pattern, options, DefaultMatchTimeout); } #if !SILVERLIGHT || FEATURE_NETCORE public #else private #endif static MatchCollection Matches(String input, String pattern, RegexOptions options, TimeSpan matchTimeout) { return new Regex(pattern, options, matchTimeout, true).Matches(input); } /* * Finds the first match for the regular expression starting at the beginning * of the string Enumerator(or at the end of the string if the regex is leftward) */ /// /// /// Returns /// all the successful matches as if Match was called iteratively numerous /// times. /// /// public MatchCollection Matches(String input) { if (input == null) throw new ArgumentNullException("input"); return Matches(input, UseOptionR() ? input.Length : 0); } /* * Finds the first match, starting at the specified position */ /// /// /// Returns /// all the successful matches as if Match was called iteratively numerous /// times. /// /// public MatchCollection Matches(String input, int startat) { if (input == null) throw new ArgumentNullException("input"); return new MatchCollection(this, input, 0, input.Length, startat); } /* * Static version of simple Replace call */ /// /// /// Replaces /// all occurrences of the pattern with the pattern, starting at /// the first character in the input string. /// /// public static String Replace(String input, String pattern, String replacement) { return Replace(input, pattern, replacement, RegexOptions.None, DefaultMatchTimeout); } /* * Static version of simple Replace call */ /// /// /// Replaces all occurrences of /// the with the /// pattern, starting at the first character in the input string. /// /// public static String Replace(String input, String pattern, String replacement, RegexOptions options) { return Replace(input, pattern, replacement, options, DefaultMatchTimeout); } #if !SILVERLIGHT || FEATURE_NETCORE public #else private #endif static String Replace(String input, String pattern, String replacement, RegexOptions options, TimeSpan matchTimeout) { return new Regex(pattern, options, matchTimeout, true).Replace(input, replacement); } /* * Does the replacement */ /// /// /// Replaces all occurrences of /// the with the pattern, starting at the /// first character in the input string, using the previous patten. /// /// public String Replace(String input, String replacement) { if (input == null) throw new ArgumentNullException("input"); return Replace(input, replacement, -1, UseOptionR() ? input.Length : 0); } /* * Does the replacement */ /// /// /// Replaces all occurrences of the (previously defined) with the /// pattern, starting at the first character in the input string. /// /// public String Replace(String input, String replacement, int count) { if (input == null) throw new ArgumentNullException("input"); return Replace(input, replacement, count, UseOptionR() ? input.Length : 0); } /* * Does the replacement */ /// /// /// Replaces all occurrences of the with the recent /// pattern, starting at the character position /// /// /// public String Replace(String input, String replacement, int count, int startat) { if (input == null) throw new ArgumentNullException("input"); if (replacement == null) throw new ArgumentNullException("replacement"); // a little code to grab a cached parsed replacement object RegexReplacement repl = (RegexReplacement) replref.Get(); if (repl == null || !repl.Pattern.Equals(replacement)) { repl = RegexParser.ParseReplacement(replacement, caps, capsize, capnames, this.roptions); replref.Cache(repl); } return repl.Replace(this, input, count, startat); } /* * Static version of simple Replace call */ /// /// /// Replaces all occurrences of the with the /// pattern /// /// /// public static String Replace(String input, String pattern, MatchEvaluator evaluator) { return Replace(input, pattern, evaluator, RegexOptions.None, DefaultMatchTimeout); } /* * Static version of simple Replace call */ /// /// /// Replaces all occurrences of the with the recent /// pattern, starting at the first character /// /// public static String Replace(String input, String pattern, MatchEvaluator evaluator, RegexOptions options) { return Replace(input, pattern, evaluator, options, DefaultMatchTimeout); } #if !SILVERLIGHT || FEATURE_NETCORE public #else private #endif static String Replace(String input, String pattern, MatchEvaluator evaluator, RegexOptions options, TimeSpan matchTimeout) { return new Regex(pattern, options, matchTimeout, true).Replace(input, evaluator); } /* * Does the replacement */ /// /// /// Replaces all occurrences of the with the recent /// pattern, starting at the first character /// position /// /// public String Replace(String input, MatchEvaluator evaluator) { if (input == null) throw new ArgumentNullException("input"); return Replace(input, evaluator, -1, UseOptionR() ? input.Length : 0); } /* * Does the replacement */ /// /// /// Replaces all occurrences of the with the recent /// pattern, starting at the first character /// position /// /// public String Replace(String input, MatchEvaluator evaluator, int count) { if (input == null) throw new ArgumentNullException("input"); return Replace(input, evaluator, count, UseOptionR() ? input.Length : 0); } /* * Does the replacement */ /// /// /// Replaces all occurrences of the (previouly defined) with /// the recent pattern, starting at the character /// position /// /// public String Replace(String input, MatchEvaluator evaluator, int count, int startat) { if (input == null) throw new ArgumentNullException("input"); return RegexReplacement.Replace(evaluator, this, input, count, startat); } /* * Static version of simple Split call */ /// /// /// Splits the string at the position defined /// by . /// /// public static String[] Split(String input, String pattern) { return Split(input, pattern, RegexOptions.None, DefaultMatchTimeout); } /* * Static version of simple Split call */ /// /// /// Splits the string at the position defined by . /// /// public static String[] Split(String input, String pattern, RegexOptions options) { return Split(input, pattern, options, DefaultMatchTimeout); } #if !SILVERLIGHT || FEATURE_NETCORE public #else private #endif static String[] Split(String input, String pattern, RegexOptions options, TimeSpan matchTimeout) { return new Regex(pattern, options, matchTimeout, true).Split(input); } /* * Does a split */ /// /// /// Splits the string at the position defined by /// a previous /// . /// /// public String[] Split(String input) { if (input == null) throw new ArgumentNullException("input"); return Split(input, 0, UseOptionR() ? input.Length : 0); } /* * Does a split */ /// /// /// Splits the string at the position defined by a previous /// . /// /// public String[] Split(String input, int count) { if (input == null) throw new ArgumentNullException("input"); return RegexReplacement.Split(this, input, count, UseOptionR() ? input.Length : 0); } /* * Does a split */ /// /// /// Splits the string at the position defined by a previous /// . /// /// public String[] Split(String input, int count, int startat) { if (input==null) throw new ArgumentNullException("input"); return RegexReplacement.Split(this, input, count, startat); } #if !(SILVERLIGHT || FULL_AOT_RUNTIME) /// /// #if MONO_FEATURE_CAS [HostProtection(MayLeakOnAbort=true)] #endif [ResourceExposure(ResourceScope.Machine)] // The AssemblyName is interesting. [ResourceConsumption(ResourceScope.Machine)] [SuppressMessage("Microsoft.Naming","CA1704:IdentifiersShouldBeSpelledCorrectly", MessageId="assemblyname", Justification="[....]: already shipped since v1 - can't fix without causing a breaking change")] public static void CompileToAssembly(RegexCompilationInfo[] regexinfos, AssemblyName assemblyname) { CompileToAssemblyInternal(regexinfos, assemblyname, null, null); } /// /// #if MONO_FEATURE_CAS [HostProtection(MayLeakOnAbort=true)] #endif [ResourceExposure(ResourceScope.Machine)] // The AssemblyName is interesting. [ResourceConsumption(ResourceScope.Machine)] [SuppressMessage("Microsoft.Naming","CA1704:IdentifiersShouldBeSpelledCorrectly", MessageId="assemblyname", Justification="[....]: already shipped since v1 - can't fix without causing a breaking change")] public static void CompileToAssembly(RegexCompilationInfo[] regexinfos, AssemblyName assemblyname, CustomAttributeBuilder[] attributes) { CompileToAssemblyInternal(regexinfos, assemblyname, attributes, null); } #if MONO_FEATURE_CAS [HostProtection(MayLeakOnAbort=true)] #endif [ResourceExposure(ResourceScope.Machine)] [ResourceConsumption(ResourceScope.Machine)] [SuppressMessage("Microsoft.Naming","CA1704:IdentifiersShouldBeSpelledCorrectly", MessageId="assemblyname", Justification="[....]: already shipped since v1 - can't fix without causing a breaking change")] public static void CompileToAssembly(RegexCompilationInfo[] regexinfos, AssemblyName assemblyname, CustomAttributeBuilder[] attributes, String resourceFile) { CompileToAssemblyInternal(regexinfos, assemblyname, attributes, resourceFile); } [ResourceExposure(ResourceScope.Machine)] // AssemblyName & resourceFile [ResourceConsumption(ResourceScope.Machine)] private static void CompileToAssemblyInternal (RegexCompilationInfo[] regexinfos, AssemblyName assemblyname, CustomAttributeBuilder[] attributes, String resourceFile) { if (assemblyname == null) throw new ArgumentNullException("assemblyname"); if (regexinfos == null) throw new ArgumentNullException("regexinfos"); RegexCompiler.CompileToAssembly(regexinfos, assemblyname, attributes, resourceFile); } #endif /// /// protected void InitializeReferences() { if (refsInitialized) throw new NotSupportedException(SR.GetString(SR.OnlyAllowedOnce)); refsInitialized = true; runnerref = new ExclusiveReference(); replref = new SharedReference(); } /* * Internal worker called by all the public APIs */ internal Match Run(bool quick, int prevlen, String input, int beginning, int length, int startat) { Match match; RegexRunner runner = null; if (startat < 0 || startat > input.Length) throw new ArgumentOutOfRangeException("start", SR.GetString(SR.BeginIndexNotNegative)); if (length < 0 || length > input.Length) throw new ArgumentOutOfRangeException("length", SR.GetString(SR.LengthNotNegative)); // There may be a cached runner; grab ownership of it if we can. runner = (RegexRunner)runnerref.Get(); // Create a RegexRunner instance if we need to if (runner == null) { // Use the compiled RegexRunner factory if the code was compiled to MSIL if (factory != null) runner = factory.CreateInstance(); else runner = new RegexInterpreter(code, UseOptionInvariant() ? CultureInfo.InvariantCulture : CultureInfo.CurrentCulture); } try { // Do the scan starting at the requested position match = runner.Scan(this, input, beginning, beginning + length, startat, prevlen, quick, internalMatchTimeout); } finally { // Release or fill the cache slot runnerref.Release(runner); } #if DBG if (Debug && match != null) match.Dump(); #endif return match; } /* * Find code cache based on options+pattern */ private static CachedCodeEntry LookupCachedAndUpdate(String key) { lock (livecode) { for (LinkedListNode current = livecode.First; current != null; current = current.Next) { if (current.Value._key == key) { // If we find an entry in the cache, move it to the head at the same time. livecode.Remove(current); livecode.AddFirst(current); return current.Value; } } } return null; } /* * Add current code to the cache */ private CachedCodeEntry CacheCode(String key) { CachedCodeEntry newcached = null; lock (livecode) { // first look for it in the cache and move it to the head for (LinkedListNode current = livecode.First; current != null; current = current.Next) { if (current.Value._key == key) { livecode.Remove(current); livecode.AddFirst(current); return current.Value; } } // it wasn't in the cache, so we'll add a new one. Shortcut out for the case where cacheSize is zero. if (cacheSize != 0) { newcached = new CachedCodeEntry(key, capnames, capslist, code, caps, capsize, runnerref, replref); livecode.AddFirst(newcached); if (livecode.Count > cacheSize) livecode.RemoveLast(); } } return newcached; } #if !SILVERLIGHT /* * True if the O option was set */ /// /// /// protected bool UseOptionC() { #if FULL_AOT_RUNTIME return false; #else #if MONO /* Mono: Set to false until we investigate https://bugzilla.xamarin.com/show_bug.cgi?id=25671 */ return false; #else return(roptions & RegexOptions.Compiled) != 0; #endif #endif } #endif /* * True if the L option was set */ /// /// /// protected bool UseOptionR() { return(roptions & RegexOptions.RightToLeft) != 0; } internal bool UseOptionInvariant() { return(roptions & RegexOptions.CultureInvariant) != 0; } #if DBG /* * True if the regex has debugging enabled */ /// /// /// internal bool Debug { get { return(roptions & RegexOptions.Debug) != 0; } } #endif } /* * Callback class */ /// /// #if !SILVERLIGHT [ Serializable() ] #endif public delegate String MatchEvaluator(Match match); /* * Used to cache byte codes or compiled factories */ internal sealed class CachedCodeEntry { internal string _key; internal RegexCode _code; #if SILVERLIGHT internal Dictionary _caps; internal Dictionary _capnames; #else internal Hashtable _caps; internal Hashtable _capnames; #endif internal String[] _capslist; internal int _capsize; internal RegexRunnerFactory _factory; internal ExclusiveReference _runnerref; internal SharedReference _replref; #if SILVERLIGHT internal CachedCodeEntry(string key, Dictionary capnames, String[] capslist, RegexCode code, Dictionary caps, int capsize, ExclusiveReference runner, SharedReference repl) #else internal CachedCodeEntry(string key, Hashtable capnames, String[] capslist, RegexCode code, Hashtable caps, int capsize, ExclusiveReference runner, SharedReference repl) #endif { _key = key; _capnames = capnames; _capslist = capslist; _code = code; _caps = caps; _capsize = capsize; _runnerref = runner; _replref = repl; } #if !SILVERLIGHT internal void AddCompiled(RegexRunnerFactory factory) { _factory = factory; _code = null; } #endif } /* * Used to cache one exclusive runner reference */ internal sealed class ExclusiveReference { RegexRunner _ref; Object _obj; int _locked; /* * Return an object and grab an exclusive lock. * * If the exclusive lock can't be obtained, null is returned; * if the object can't be returned, the lock is released. * */ internal Object Get() { // try to obtain the lock if (0 == Interlocked.Exchange(ref _locked, 1)) { // grab reference Object obj = _ref; // release the lock and return null if no reference if (obj == null) { _locked = 0; return null; } // remember the reference and keep the lock _obj = obj; return obj; } return null; } /* * Release an object back to the cache * * If the object is the one that's under lock, the lock * is released. * * If there is no cached object, then the lock is obtained * and the object is placed in the cache. * */ internal void Release(Object obj) { if (obj == null) throw new ArgumentNullException("obj"); // if this reference owns the lock, release it if (_obj == obj) { _obj = null; _locked = 0; return; } // if no reference owns the lock, try to cache this reference if (_obj == null) { // try to obtain the lock if (0 == Interlocked.Exchange(ref _locked, 1)) { // if there's really no reference, cache this reference if (_ref == null) _ref = (RegexRunner) obj; // release the lock _locked = 0; return; } } } } /* * Used to cache a weak reference in a threadsafe way */ internal sealed class SharedReference { WeakReference _ref = new WeakReference(null); int _locked; /* * Return an object from a weakref, protected by a lock. * * If the exclusive lock can't be obtained, null is returned; * * Note that _ref.Target is referenced only under the protection * of the lock. (Is this necessary?) */ internal Object Get() { if (0 == Interlocked.Exchange(ref _locked, 1)) { Object obj = _ref.Target; _locked = 0; return obj; } return null; } /* * Suggest an object into a weakref, protected by a lock. * * Note that _ref.Target is referenced only under the protection * of the lock. (Is this necessary?) */ internal void Cache(Object obj) { if (0 == Interlocked.Exchange(ref _locked, 1)) { _ref.Target = obj; _locked = 0; } } } }