January 5th, 2008
/// <summary>
/// Extracts the value of every <c>href</c> attribute found in a piece of HTML text.
/// </summary>
/// <param name="txtIn">HTML (or any text) to scan. May be null or empty.</param>
/// <returns>
/// An <see cref="ArrayList"/> of strings, one per <c>href</c> attribute, in document order.
/// Only the attribute value is returned (no surrounding quotes, no <c>href=</c> prefix).
/// The list is empty when <paramref name="txtIn"/> is null, empty, or contains no match.
/// </returns>
protected ArrayList getURL(string txtIn)
{
    ArrayList outURL = new ArrayList();

    // Nothing to scan: return an empty list rather than letting Regex.Matches throw on null.
    if (string.IsNullOrEmpty(txtIn))
    {
        return outURL;
    }

    // Three alternatives, all capturing into the same named group "url":
    //   1. double-quoted value   href="..."
    //   2. single-quoted value   href='...'
    //   3. unquoted value        href=...   (stops at whitespace, '>' or a quote)
    // IgnoreCase is used because HTML attribute names are case-insensitive (HREF, Href, ...).
    Regex hrefPattern = new Regex(
        "href\\s*=\\s*(?:\"(?<url>[^\"]*)\"|'(?<url>[^']*)'|(?<url>[^\\s>\"']+))",
        RegexOptions.IgnoreCase);

    foreach (Match hrefMatch in hrefPattern.Matches(txtIn))
    {
        // Take only the named capture. Enumerating Match.Groups would also yield
        // group 0 (the entire "href=..." text), which is not a URL.
        outURL.Add(hrefMatch.Groups["url"].Value);
    }

    return outURL;
}
Programming |
| Trackback
2 comments on “How to extract URLs (href property) from HTML”
01
[…] How to extract URLs (href property) from HTML […]
02
Good site!
brainybusiness.info
Leave a Reply