using CsvHelper;
using HtmlAgilityPack;
using System;
using System.Collections.Generic;
using System.Collections.ObjectModel;
using System.Diagnostics;
using System.Globalization;
using System.IO;
using System.Linq;
using System.Text;
using System.Threading.Tasks;
using System.Web;
namespace WpfScraper
{
public class Scraper
{
private ObservableCollection _entries = new ObservableCollection();
public ObservableCollection Entries
{
get { return _entries; }
set { _entries = value; }
}
public void ScrapeData(string page)
{
var web = new HtmlWeb();
var doc = web.Load(page);
//var Articles = doc.DocumentNode.SelectNodes("//*[@class = 'article-single']");
var Articles = doc.DocumentNode.SelectNodes("//*[@id='shareslist']/table/tbody/tr[1]");
foreach (var article in Articles)
{
//var header = HttpUtility.HtmlDecode(article.SelectSingleNode(".//li[@class = 'article-header']").InnerText);
//var description = HttpUtility.HtmlDecode(article.SelectSingleNode(".//li[@class = 'article-copy']").InnerText);
var header = HttpUtility.HtmlDecode(article.SelectSingleNode(".//li[@class = 'millistream-link']").InnerText);
var description = HttpUtility.HtmlDecode(article.SelectSingleNode(".//li[@class = 'millistream-numeric millistream-lastprice millistream-numeric-positive']").InnerText);
Debug.Print($"Title: {header} \n"+
$" Description: {description}");
_entries.Add(new EntryModel { Title = header, Description = description });
}
}
public void Export()
{
using(TextWriter tw = File.CreateText("SampleData.csv"))
{
using(var cw = new CsvWriter(tw,CultureInfo.InvariantCulture))
{
foreach(var entry in Entries)
{
cw.WriteRecord(entry);
cw.NextRecord();
}
}
}
}
}
}