|
|
@ -231,10 +231,12 @@ if sys.version_info < (2, 7, 3): |
|
|
|
if self.rawdata[i:].startswith("</scr'+'ipt>") |
|
|
|
else compat_html_parser.HTMLParser.parse_endtag(self, i)) |
|
|
|
|
|
|
|
|
|
|
|
def get_element_by_id(id, html): |
|
|
|
"""Return the content of the tag with the specified ID in the passed HTML document""" |
|
|
|
return get_element_by_attribute("id", id, html) |
|
|
|
|
|
|
|
|
|
|
|
def get_element_by_attribute(attribute, value, html): |
|
|
|
"""Return the content of the tag with the specified attribute in the passed HTML document""" |
|
|
|
parser = AttrParser(attribute, value) |
|
|
@ -265,16 +267,6 @@ class MetaParser(BaseHTMLParser): |
|
|
|
def get_result(self): |
|
|
|
return self.result |
|
|
|
|
|
|
|
def get_meta_content(name, html): |
|
|
|
""" |
|
|
|
Return the content attribute from the meta tag with the given name attribute. |
|
|
|
""" |
|
|
|
parser = MetaParser(name) |
|
|
|
try: |
|
|
|
parser.loads(html) |
|
|
|
except compat_html_parser.HTMLParseError: |
|
|
|
pass |
|
|
|
return parser.get_result() |
|
|
|
|
|
|
|
|
|
|
|
def clean_html(html): |
|
|
|