I don't know of any existing library that already does this, sorry.
Here is a class that lets you get the title from an HTML document:
/// <summary>
/// Helpers for downloading an HTML page and extracting the text of its
/// <c>&lt;title&gt;</c> element.
/// </summary>
public class WebHelper
{
    // Built once and reused; Regex instances are safe to share between threads.
    //   <title\b[^>]*>  opening tag; \b rejects tags that merely start with
    //                   "title", and [^>]* lets attributes span several lines.
    //   ([\s\S]*?)      lazy capture, so matching stops at the FIRST </title>
    //                   instead of running on to the last one in the document
    //                   (pages with inline SVG often contain extra <title> tags).
    private static readonly System.Text.RegularExpressions.Regex TitleRegex =
        new System.Text.RegularExpressions.Regex(
            @"<title\b[^>]*>([\s\S]*?)</title>",
            System.Text.RegularExpressions.RegexOptions.IgnoreCase);

    /// <summary>
    /// Downloads the resource at <paramref name="sUrl"/> and returns it as a string.
    /// </summary>
    /// <param name="sUrl">Address of the page to download.</param>
    /// <returns>The response body as text.</returns>
    /// <exception cref="System.Net.WebException">
    /// The address is invalid or the download failed.
    /// </exception>
    public static string FetchHTML(string sUrl)
    {
        // WebClient is IDisposable; dispose it so the underlying resources are
        // released even if the download throws.
        using (System.Net.WebClient client = new System.Net.WebClient())
        {
            // NOTE: DownloadString decodes the bytes using client.Encoding. If a
            // page is mis-decoded, set client.Encoding (e.g. to UTF-8) before
            // this call.
            return client.DownloadString(sUrl);
        }
    }

    /// <summary>
    /// Extracts the text of the first <c>&lt;title&gt;</c> element found in
    /// <paramref name="sHtml"/>.
    /// </summary>
    /// <param name="sHtml">HTML markup to search; may be null or empty.</param>
    /// <returns>
    /// The title text with leading and trailing whitespace removed, or an empty
    /// string when the input is null or empty or contains no title element.
    /// </returns>
    public static string FetchTitleFromHTML(string sHtml)
    {
        if (string.IsNullOrEmpty(sHtml))
        {
            return string.Empty;
        }

        // When nothing matches, Groups[1].Value is "", so the "no title" case
        // naturally yields an empty string.
        return TitleRegex.Match(sHtml).Groups[1].Value.Trim();
    }
}
Use FetchHTML to get the text; you can then use the string.Replace method to get rid of the "