<br> Tuesday, November 03, 2009 2:16 AM <dir> <A HREF="/formularyupdate/PBMA/">PBMA</A>
<br> Tuesday, November 03, 2009 2:16 AM <dir> <A HREF="/formularyupdate/PBMB/">PBMB</A>
<br> Tuesday, November 03, 2009 2:16 AM <dir> <A HREF="/formularyupdate/PBMC/">PBMC</A>
<br> Tuesday, November 03, 2009 2:16 AM <dir> <A HREF="/formularyupdate/RXHUBPBM/">RXHUBPBM</A>
用 C# 截取每个 a 标签的链接。
<br> Tuesday, November 03, 2009 2:16 AM <dir> <A HREF="/formularyupdate/PBMB/">PBMB</A>
<br> Tuesday, November 03, 2009 2:16 AM <dir> <A HREF="/formularyupdate/PBMC/">PBMC</A>
<br> Tuesday, November 03, 2009 2:16 AM <dir> <A HREF="/formularyupdate/RXHUBPBM/">RXHUBPBM</A>
用 C# 截取每个 a 标签的链接,
还是要 /formularyupdate/PBMA/ 这样的地址。
// Grab every <a> element in the current document.
var links = document.getElementsByTagName("a");
var i = 0;
// Walk the collection by index; the per-link handling is still a placeholder.
while (i < links.length)
{
    //to do...
    i++;
}
// Sample directory listing to extract links from. In a verbatim string (@"...")
// a literal double quote is written as two double quotes.
string html = @"<br> Tuesday, November 03, 2009 2:16 AM <dir> <A HREF=""/formularyupdate/PBMA/"">PBMA </A>
<br> Tuesday, November 03, 2009 2:16 AM <dir> <A HREF=""/formularyupdate/PBMB/"">PBMB </A>
<br> Tuesday, November 03, 2009 2:16 AM <dir> <A HREF=""/formularyupdate/PBMC/"">PBMC </A>
<br> Tuesday, November 03, 2009 2:16 AM <dir> <A HREF=""/formularyupdate/RXHUBPBM/"">RXHUBPBM </A>";

// (?is) = ignore case + let '.' match newlines.
// Group 1 captures the href value (lazy, up to the closing quote);
// group 2 captures the link text between the opening and closing tag.
Regex reg = new Regex(@"(?is)<A\sHREF=""(.*?)"">([^>]+?)</A>");
MatchCollection mc = reg.Matches(html);
foreach (Match m in mc)
{
    // Prints the whole matched tag, then the address, then the link name.
    Console.WriteLine(m.Groups[0].Value + " 地址:" + m.Groups[1].Value + " 连接名:" + m.Groups[2].Value + "\r\n");
}
/*
Output (one entry per matched link):
<A HREF="/formularyupdate/PBMA/">PBMA </A> 地址:/formularyupdate/PBMA/ 连接名:PBMA
<A HREF="/formularyupdate/PBMB/">PBMB </A> 地址:/formularyupdate/PBMB/ 连接名:PBMB
<A HREF="/formularyupdate/PBMC/">PBMC </A> 地址:/formularyupdate/PBMC/ 连接名:PBMC
<A HREF="/formularyupdate/RXHUBPBM/">RXHUBPBM </A> 地址:/formularyupdate/RXHUBPBM/ 连接名:RXHUBPBM
*/
// Extracts the href value and the link text of every <a> element found in str.
// NOTE(review): str is not declared in this snippet; it is presumably the HTML text to scan.
//   (['""]?)      group 1: optional opening quote (' or ") around the href value
//   (?<url>...)   href value: runs until a quote, '>' or whitespace
//   \1?           the same quote character again, if one was opened
//   (?<text>...)  link text: everything up to the next '<'
MatchCollection mc = Regex.Matches(str, @"<a[^>]*href=(['""]?)(?<url>[^'"">\s]*)\1?[^>]*>(?<text>[^<]*)</a>", RegexOptions.IgnoreCase);
foreach (Match m in mc)
{
    // Group names must match the pattern exactly (no padding spaces).
    Console.Write(m.Groups["url"].Value);
    Console.Write(m.Groups["text"].Value);
}
// Extracts the href value ("Link") and the link text ("Text") of each anchor in str.
// NOTE(review): str and Response are not declared in this snippet; presumably the
// HTML text and the ASP.NET response object - confirm against the calling page.
//   [""']?          optional quote around the href value, kept outside the capture
//   (?<Link>...)    href value without its surrounding quotes
//   (?<Text>...)    link text: everything up to the next '<'
string strPattern = @"a[\s]+href=[""']?(?<Link>[^\s>""']+)[""']?[^>]*>(?<Text>[^<]*)</a>";
MatchCollection matches = Regex.Matches(str, strPattern, RegexOptions.IgnoreCase | RegexOptions.Compiled);
foreach (Match m in matches)
{
    // Group.Value is already a string; Trim() drops padding such as "PBMA ".
    Response.Write(m.Groups["Link"].Value.Trim());
    Response.Write(m.Groups["Text"].Value.Trim());
}