Download Html Agility Pack from the following link:
http://htmlagilitypack.codeplex.com/
Add a reference to the library in your project.
Step 2: download the html web page to parse
Use the following code to download the web page.
/// <summary>
/// Starts an asynchronous download of the page at <paramref name="url"/> into
/// the file c:\temp.html. client_DownloadFileCompleted is invoked when the
/// download finishes.
/// </summary>
/// <param name="url">Absolute address of the web page to download.</param>
private void Download(string url)
{
    // Build the Uri first so an invalid address fails before a WebClient exists.
    Uri address = new Uri(url);

    WebClient client = new WebClient();
    try
    {
        client.DownloadFileCompleted += new AsyncCompletedEventHandler(client_DownloadFileCompleted);

        // WebClient is IDisposable. The download is asynchronous, so it cannot be
        // wrapped in a using block; release it once the completion handler
        // subscribed above has been called.
        client.DownloadFileCompleted += delegate { client.Dispose(); };

        client.DownloadFileAsync(address, @"c:\temp.html");
    }
    catch
    {
        // The download never started, so the completion event will not fire.
        client.Dispose();
        throw;
    }
}

/// <summary>
/// Called when the download started by Download has completed.
/// </summary>
/// <param name="sender">The object that raised the event.</param>
/// <param name="e">Completion details for the asynchronous operation.</param>
void client_DownloadFileCompleted(object sender, AsyncCompletedEventArgs e)
{
    //do something here
}
Step 3: Parse the downloaded web page using Html Agility Pack
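Use the following code in client_DownloadFileCompleted() to enumerate the input fields of the forms in the web page and read the values of the inputs whose ids are storesadd, bestfood, and storesname.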
/// <summary>
/// Called when the download has completed. Walks the form and input nodes of
/// the parsed page and captures the values of the inputs whose ids are
/// "storesadd", "bestfood" and "storesname".
/// </summary>
/// <param name="sender">The object that raised the event.</param>
/// <param name="e">Completion details for the asynchronous operation.</param>
void client_DownloadFileCompleted(object sender, AsyncCompletedEventArgs e)
{
    // A failed or cancelled download leaves nothing reliable to parse.
    if (e.Error != null || e.Cancelled)
    {
        return;
    }

    string storesadd = "";
    string storesname = "";
    string bestfood = "";

    // NOTE(review): doc is not declared in this snippet; presumably it is an
    // HtmlDocument already loaded from the downloaded file - confirm.
    HtmlNodeCollection form_node_collection = doc.DocumentNode.SelectNodes("//form");

    // SelectNodes yields null (not an empty collection) when nothing matches,
    // so a page without any form must be handled before iterating.
    if (form_node_collection == null)
    {
        return;
    }

    foreach (HtmlNode form_node in form_node_collection)
    {
        // "//input" is an absolute XPath: it matches every input element in the
        // document, not only the descendants of this form.
        HtmlNodeCollection input_node_collection = form_node.SelectNodes("//input");
        if (input_node_collection == null)
        {
            continue;
        }

        foreach (HtmlNode input_node in input_node_collection)
        {
            // Only inputs carrying both an id and a value are of interest.
            if (!input_node.Attributes.Contains("id") || !input_node.Attributes.Contains("value"))
            {
                continue;
            }

            string input_id = input_node.Attributes["id"].Value;
            string input_value = input_node.Attributes["value"].Value;

            // Keep the previously captured value when this one is empty.
            if (string.IsNullOrEmpty(input_value))
            {
                continue;
            }

            if (input_id == "storesadd")
            {
                storesadd = input_value;
            }
            else if (input_id == "bestfood")
            {
                bestfood = input_value;
            }
            else if (input_id == "storesname")
            {
                storesname = input_value;
            }
        }
    }
}
No comments:
Post a Comment