You could use HTMLParser like this:
import sys

# HTMLParser and urlopen live in different modules on Python 2 and Python 3;
# bind the same two names either way so the rest of the file is version-agnostic.
if sys.version_info[0] >= 3:
    from html.parser import HTMLParser
    from urllib.request import urlopen
else:
    from HTMLParser import HTMLParser
    from urllib2 import urlopen
class MyParser(HTMLParser):
    """HTML parser that records the ``colData0`` attribute of ``<tr>`` tags.

    After a document has been fed, ``day`` holds the attribute value taken
    from the last ``<tr>`` start tag that carried it, or ``None`` when no
    such tag was seen.
    """

    # HTMLParser converts attribute names to lower case before calling
    # handle_starttag, so the markup's ``colData0`` arrives as ``coldata0``.
    _DAY_ATTR = 'colData0'.lower()

    def __init__(self):
        # Explicit base-class call (rather than super()) is kept on purpose:
        # the file also targets Python 2.
        HTMLParser.__init__(self)
        self.day = None

    def handle_starttag(self, tag, attrs):
        """Store the ``colData0`` value when a ``<tr>`` start tag has one.

        ``attrs`` is the list of ``(name, value)`` pairs supplied by
        HTMLParser; a later match overwrites an earlier one.
        """
        if tag != 'tr':
            return
        for key, value in attrs:
            # Compare case-insensitively; matching the mixed-case spelling
            # directly can never succeed against the lowercased names.
            if key.lower() == self._DAY_ATTR:
                self.day = value
def get_day(url):
    """Download *url* and return the ``colData0`` value found by MyParser.

    The response body is decoded as UTF-8 and fed to a fresh ``MyParser``.
    Returns the parser's ``day`` attribute, which is ``None`` when the page
    contains no matching ``<tr>`` tag. Errors raised by ``urlopen`` or by
    decoding propagate to the caller.
    """
    response = urlopen(url)
    try:
        html = response.read().decode('utf8')
    finally:
        # Close explicitly so the connection is released even if reading or
        # decoding fails; try/finally is used instead of ``with`` because the
        # file also targets Python 2's urllib2.
        response.close()

    parser = MyParser()
    parser.feed(html)
    parser.close()
    return parser.day
if __name__ == '__main__':
    # Script entry point: fetch the hard-coded URL and print what get_day returns.
    page_url = "http://www.mywebsite.com/py"
    print(get_day(page_url))
Reputation Points: 930
Solved Threads: 668
Posting Maven
Offline 2,656 posts
since Jul 2008