我正在使用以下代碼來測試編譯正則表達式的CompileToAssembly性能,但結果不合適。請讓我知道我錯過了什麼。謝謝!!!爲什麼Regex CompileToAssembly的性能比編譯正則表達式和解釋正則表達式慢?
static readonly Regex regex = new Regex(@"(stats|pause\s?(all|\d+(\,\d+)*)|start\s?(all|\d+(\,\d+)*)|add\s?time\s?(all|\d+(\,\d+)*)(\s\d+)|c(?:hange)?\s?p(?:asskey)?|close)(.*)", RegexOptions.Compiled);
static readonly Regex reg = new Regex(@"(stats|pause\s?(all|\d+(\,\d+)*)|start\s?(all|\d+(\,\d+)*)|add\s?time\s?(all|\d+(\,\d+)*)(\s\d+)|c(?:hange)?\s?p(?:asskey)?|close)(.*)");
static readonly Regex level4 = new DuplicatedString();
static void Main()
{
const string str = "add time 243,3453,43543,543,534534,54534543,345345,4354354235,345435,34543534 6873brekgnfkjerkgiengklewrij";
const int itr = 1000000;
CompileToAssembly();
Match match;
Stopwatch sw = new Stopwatch();
sw.Start();
for (int i = 0; i < itr; i++)
{
match = regex.Match(str);
}
sw.Stop();
Console.WriteLine("RegexOptions.Compiled: {0}ms", sw.ElapsedMilliseconds);
sw.Reset();
sw.Start();
for (int i = 0; i < itr; i++)
{
match = level4.Match(str);
}
sw.Stop();
Console.WriteLine("CompiledToAssembly: {0}ms", sw.ElapsedMilliseconds);
sw.Reset();
sw.Start();
for (int i = 0; i < itr; i++)
{
match = reg.Match(str);
}
sw.Stop();
Console.WriteLine("Interpreted: {0}ms", sw.ElapsedMilliseconds);
Console.ReadLine();
}
public static void CompileToAssembly()
{
RegexCompilationInfo expr;
List<RegexCompilationInfo> compilationList = new List<RegexCompilationInfo>();
// Define regular expression to detect duplicate words
expr = new RegexCompilationInfo(@"(stats|pause\s?(all|\d+(\,\d+)*)|start\s?(all|\d+(\,\d+)*)|add\s?time\s?(all|\d+(\,\d+)*)(\s\d+)|c(?:hange)?\s?p(?:asskey)?|close)(.*)",
RegexOptions.Compiled,
"DuplicatedString",
"Utilities.RegularExpressions",
true);
// Add info object to list of objects
compilationList.Add(expr);
// Apply AssemblyTitle attribute to the new assembly
//
// Define the parameter(s) of the AssemblyTitle attribute's constructor
Type[] parameters = { typeof(string) };
// Define the assembly's title
object[] paramValues = { "General-purpose library of compiled regular expressions" };
// Get the ConstructorInfo object representing the attribute's constructor
ConstructorInfo ctor = typeof(System.Reflection.AssemblyTitleAttribute).GetConstructor(parameters);
// Create the CustomAttributeBuilder object array
CustomAttributeBuilder[] attBuilder = { new CustomAttributeBuilder(ctor, paramValues) };
// Generate assembly with compiled regular expressions
RegexCompilationInfo[] compilationArray = new RegexCompilationInfo[compilationList.Count];
AssemblyName assemName = new AssemblyName("RegexLib, Version=1.0.0.1001, Culture=neutral, PublicKeyToken=null");
compilationList.CopyTo(compilationArray);
Regex.CompileToAssembly(compilationArray, assemName, attBuilder);
}
以下是結果:
RegexOptions.Compiled: 3908ms
CompiledToAssembly: 59349ms
Interpreted: 5653ms
我只是自己運行代碼。這是我的結果:'RegexOptions.Compiled:8399ms'; 'CompiledToAssembly:7806ms'; '解釋:10405ms'。正是我所期望的。 – mellamokb 2012-04-09 22:03:39
在調試模式下再次嘗試在Visual Studio中獲得大致相同的結果。你正在分別調用'CompileToAssembly()',然後運行該部分註釋掉,是否正確? – mellamokb 2012-04-09 22:12:19
我試着運行exe現在的結果是更好的...不知道爲什麼它給我奇怪的結果,當我早些時候嘗試。 Neway仍然結果與theroy不匹配以下是10000000次迭代的結果:RegexOption.Compiled:34413msCompiledToAssembly:37125 Interpreted:47322 ....爲什麼遵守彙編比編譯正則表達式更多的時間? – iRock 2012-04-09 22:17:04