风舞残阳 2008-4-2 13:44
在.NET中字符串替换的五种方法
1:使用String.Replace函数替换,但不支持大小写。 2:正则System.Text.Regex替换,用RegExpOption修改是否支持大小写。
3:在小数据的情况下,使用String.SubString和+可以实现间接替换。
4:导入MicrosoftVisualBasicRunTime(Microsoft.VisualBasic.DLL)使用Strings.Replace[wiki]速度[/wiki]很快。
5:参照反射Reflector.FileDisassembler配合Strings.SplitandStrings.Join等实现,速度同5。
一下介绍一种[wiki]算法[/wiki],[wiki]类[/wiki]似KMP算法。有兴趣的参照研究下。
privatestaticstringReplaceEx(stringoriginal,
stringpattern,stringreplacement)
{
intcount,position0,position1;
count=position0=position1=0;
stringupperString=original.ToUpper();
stringupperPattern=pattern.ToUpper();
intinc=(original.Length/pattern.Length)*
(replacement.Length-pattern.Length);
char[]chars=newchar[original.Length+Math.Max(0,inc)];
while((position1=upperString.IndexOf(upperPattern,
position0))!=-1)
{
for(inti=position0;i%26lt;position1;++i)
chars[count++]=original[i];
for(inti=0;i%26lt;replacement.Length;++i)
chars[count++]=replacement[i];
position0=position1+pattern.Length;
}
if(position0==0)returnoriginal;
for(inti=position0;i%26lt;original.Length;++i)
chars[count++]=original[i];
returnnewstring(chars,0,count);
} 测试
staticvoidMain(string[]args)
{
stringsegment="AaBbCc";
stringsource;
stringpattern="AbC";
stringdestination="Some";
stringresult="";
constlongcount=1000;
StringBuilderpressure=newStringBuilder();
HiPerfTimertime;
for(inti=0;i%26lt;count;i++)
{
pressure.Append(segment);
}
source=pressure.ToString();
GC.Collect();
//regexp
time=newHiPerfTimer();
time.Start();
for(inti=0;i%26lt;count;i++)
{
result=Regex.Replace(source,pattern,
destination,RegexOptions.IgnoreCase);
}
time.Stop();
Console.WriteLine("regexp ="+time.Duration+"s");
GC.Collect();
//vb
time=newHiPerfTimer();
time.Start();
for(inti=0;i%26lt;count;i++)
{
result=Strings.Replace(source,pattern,
destination,1,-1,CompareMethod.Text);
}
time.Stop();
Console.WriteLine("vb ="+time.Duration+"s");
GC.Collect();
//vbReplace
time=newHiPerfTimer();
time.Start();
for(inti=0;i%26lt;count;i++)
{
result=VBString.Replace(source,pattern,
destination,1,-1,StringCompareMethod.Text);
}
time.Stop();
Console.WriteLine("vbReplace="+time.Duration+"s");//+result);
GC.Collect();
//ReplaceEx
time=newHiPerfTimer();
time.Start();
for(inti=0;i%26lt;count;i++)
{
result=Test.ReplaceEx(source,pattern,destination);
}
time.Stop();
Console.WriteLine("ReplaceEx="+time.Duration+"s");
GC.Collect();
//Replace
time=newHiPerfTimer();
time.Start();
for(inti=0;i%26lt;count;i++)
{
result=source.Replace(pattern.ToLower(),destination);
}
time.Stop();
Console.WriteLine("Replace ="+time.Duration+"s");
GC.Collect();
//sorry,twoslow:(
/*//substring
time=newHiPerfTimer();
time.Start();
for(inti=0;i%26lt;count;i++)
{
result=StringHelper.ReplaceText(source,pattern,
destination,StringHelper.CompareMethods.Text);
}
time.Stop();
Console.WriteLine("substring="+time.Duration+":");
GC.Collect();
//substringwithstringbuilder
time=newHiPerfTimer();
time.Start();
for(inti=0;i%26lt;count;i++)
{
result=StringHelper.ReplaceTextB(source,pattern,
destination,StringHelper.CompareMethods.Text);
}
time.Stop();
Console.WriteLine("substringB="+time.Duration+":");
GC.Collect();
*/
Console.ReadLine();
}
1%26iexcl;%26cent;stringsegment="abcaBc";
regexp=3.75481827997692s
vb=1.52745502570857s
vbReplace=1.46234256029747s
ReplaceEx=0.797071415501132s!!!%26lt;FONTcolor=gray%26gt;Replace=0.178327413120941s%26lt;/FONT%26gt;
//ReplaceEx%26gt;vbReplace%26gt;vb%26gt;regexp
2%26iexcl;%26cent;stringsegment="abcaBcabC";
regexp=5.30117431126023s
vb=2.46258449048692s
vbReplace=2.5018721653171s
ReplaceEx=1.00662179131705s!!!
%26lt;FONTcolor=gray%26gt;Replace=0.233760994763301s%26lt;/FONT%26gt;
//ReplaceEx%26gt;vb%26gt;vbReplace%26gt;regexp
3%26iexcl;%26cent;stringsegment="abcaBcabCAbc";
regexp=7.00987862982586s
vb=3.61050301085753s
vbReplace=3.42324876485699s
ReplaceEx=1.14969947297771s!!!
%26lt;FONTcolor=gray%26gt;Replace=0.277254511397398s%26lt;/FONT%26gt;
//ReplaceEx%26gt;vbReplace%26gt;vb%26gt;regexp
4%26iexcl;%26cent;stringsegment="ABCabcAbCaBcAbcabCABCAbcaBC";
regexp=13.5940090151123s
vb=11.6806222578568s
vbReplace=11.1757614445411s
ReplaceEx=1.70264153684337s!!!(mygod!)
%26lt;FONTcolor=gray%26gt;Replace=0.42236820601501s%26lt;/FONT%26gt;
//ReplaceEx%26gt;vbReplace%26gt;vb%26gt;regexp 查看程序的Block在:
stringupperString=original.ToUpper();
stringupperPattern=pattern.ToUpper(); 如果需要敏感,就免了这2行。
解释:先建一个char[]类型的变量采访替换后的字符,其大小就是最大可能被替换的字符,例如ABABAB,替换AB成C,其获取过程就是ABABAB最大可能包括的AB的数目乘以AB多于C的数目,
char[]chars=newchar[original.Length+Math.Max(0,inc)];
,inc不一定大于零。
然后循环,用IndexOf索引。赋值。。。判断,返回。