29 lines
807 B
Python
29 lines
807 B
Python
|
#!/usr/bin/env python
|
||
|
try:
|
||
|
from html.parser import HTMLParser
|
||
|
except ImportError:
|
||
|
from HTMLParser import HTMLParser
|
||
|
|
||
|
# Don't blame me for this mess: we can't use external libs, so all we have is HTMLParser.
|
||
|
class WTParser(HTMLParser):
    """Collect ``<meta>`` name/content pairs and ``<script src>`` URLs.

    After feeding a document to the parser:

    * ``meta`` maps each meta tag's ``name`` attribute (or ``property`` when
      ``name`` is missing or empty) to its ``content`` attribute, always as
      a string.
    * ``scripts`` lists the ``src`` value of each script tag that has one,
      in the order the tags were parsed.
    """

    def __init__(self):
        # Explicit base-class call rather than super(): the Python 2
        # HTMLParser fallback is an old-style class, where super() fails.
        HTMLParser.__init__(self)
        self.meta = {}
        self.scripts = []

    def handle_starttag(self, tag, attrs):
        """Record data from ``<meta>`` and ``<script>`` start tags.

        ``tag`` is the tag name and ``attrs`` the list of ``(name, value)``
        pairs supplied by HTMLParser. ``value`` is None for an attribute
        written without a value (e.g. ``<script src>``).
        """
        if tag == 'meta':
            # Later duplicates of an attribute override earlier ones.
            fields = dict(attrs)
            key = fields.get('name') or fields.get('property')
            if key:
                # ``or ''`` instead of a .get() default: a valueless
                # ``content`` attribute is present with value None, which a
                # .get() default would not replace.
                self.meta[key] = fields.get('content') or ''
        elif tag == 'script':
            for attr_name, attr_value in attrs:
                if attr_name == 'src':
                    # Skip a valueless ``src`` so the list only ever holds
                    # strings.
                    if attr_value is not None:
                        self.scripts.append(attr_value)
                    # Only the first ``src`` attribute of a tag is considered.
                    return
|
||
|
|