我试过这段代码:
private void RemoveLines(List<string> Keywords)
{
string NewText = "";
String regex = string.Empty;
this.Invoke(new MethodInvoker(delegate { NewText = richTextBox1.Text; }));
Regex MyRegex = null;
foreach (string keyword in Keywords)
{
regex = String.Format(@"^.*\W{0}\W.*$",keyword);
MyRegex = new Regex(regex, RegexOptions.Multiline);
NewText = MyRegex.Replace(NewText, Environment.NewLine);
}
//Remove blank lines
NewText = Regex.Replace(NewText, @"^\s+$[\r\n]*", "", RegexOptions.Multiline);
this.Invoke(new MethodInvoker(delegate { richTextBox1.Text = NewText; }));
this.Invoke(new MethodInvoker(delegate { richTextBox1.Refresh(); }));
}
和 removeExtrenals 功能:
private List<string> removeExternals(List<string> externals)
{
if(!LocalyKeyWords.ContainsKey(mainUrl))
{
return externals;
}
List<string> keywords = LocalyKeyWords[mainUrl];
List<int> indices = new List<int>();
foreach(string keyword in keywords)
{
//Accumulate a list of the indices of the items that match.
indices = indices.Concat(externals.Select((v, i) => v.Contains(keyword) ? i : -1)).ToList();
}
//Filter out the -1s, grab only the unique indices.
indices = indices.Where(i => i >= 0).Distinct().ToList();
//Filter out those items that match the keyword(s) related to mainUrl.
externals = externals.Where((v, i) => !indices.Contains(i)).ToList();
return externals;
}
我在这个函数中调用了 removelines 和 removeexternals:
RemoveLines(removeExternals(webSites));
在使用断点后的 removeExternals 中,我看到两个不包含 google 的站点(示例中使用的关键字 im)所以从 18 个 url 我应该在richTextBox 中看到只有 16 个 url 我也在 removelines 函数中使用了断点,没有例外,但我看到了所有的网址都在richTextBox 中。