Code to extract drawNumber and drawDate

This commit is contained in:
Ross Healy
2024-02-03 22:28:09 +00:00
parent 58d6b821f6
commit fbbb2e9d6f

View File

@@ -1,5 +1,7 @@
using HtmlAgilityPack;
using lottery_co_uk_scraper.Utilities;
using System.Globalization;
using System.Text.RegularExpressions;
namespace lottery_co_uk_scraper
{
@@ -269,6 +271,47 @@ namespace lottery_co_uk_scraper
}
// Extract the draw number from the page's <meta name="keywords"> element,
// whose content attribute is searched for the phrase "lotto draw <digits>".
// HTML metadata names are ASCII case-insensitive, so "Keywords" or "KEYWORDS"
// must be accepted as well as "keywords".
var metaKeywords = doc.DocumentNode.Descendants("meta")
    .FirstOrDefault(x => string.Equals(
        x.GetAttributeValue("name", ""), "keywords", StringComparison.OrdinalIgnoreCase));
if (metaKeywords != null)
{
    var keywordsText = metaKeywords.GetAttributeValue("content", "");
    var drawNumberMatch = Regex.Match(keywordsText, @"lotto draw (\d+)");

    // TryParse rather than Parse: \d+ can match a digit run too long for an
    // int, or non-ASCII Unicode digits, and either would make int.Parse throw.
    // Scraped input that cannot be converted is reported as "not found".
    if (drawNumberMatch.Success
        && int.TryParse(
            drawNumberMatch.Groups[1].Value,
            NumberStyles.None,
            CultureInfo.InvariantCulture,
            out var drawNumber))
    {
        Console.WriteLine("Draw Number: " + drawNumber);
    }
    else
    {
        Console.WriteLine("Draw Number not found.");
    }
}
else
{
    Console.WriteLine("Meta keywords not found.");
}
// Extract the draw date from the first <title> element of the document and
// print it in ISO-style yyyy-MM-dd form.
var title = doc.DocumentNode.Descendants("title")
    .FirstOrDefault();
if (title != null)
{
    var titleText = title.InnerText;

    // NOTE(review): ParseDateString is defined elsewhere; presumably it returns
    // a DateTime (or similar) parsed from the title text - confirm, including
    // how it behaves when the title contains no recognisable date.
    var date = TextRemoval.ParseDateString(titleText);

    // Format with the invariant culture so the output always uses the
    // Gregorian calendar, regardless of the culture the scraper runs under.
    string formattedDate = date.ToString("yyyy-MM-dd", CultureInfo.InvariantCulture);
    Console.WriteLine("Draw Date: " + formattedDate);
}
else
{
    Console.WriteLine("Title not found.");
}
var rolloverElement = doc.DocumentNode.Descendants("span")
.FirstOrDefault(x => x.InnerText.Trim() == "Rollover");