_meta_parser.py 818 B

1234567891011121314151617181920212223242526272829
  1. from __future__ import annotations
  2. from html.parser import HTMLParser
  3. def get_meta_description(meta_tags: str) -> bool:
  4. htp = HTMLTextParser()
  5. htp.feed(meta_tags)
  6. htp.close()
  7. return htp.meta_description
  8. class HTMLTextParser(HTMLParser):
  9. """Parse HTML into text."""
  10. def __init__(self) -> None:
  11. super().__init__()
  12. self.meta_description = None
  13. def handle_starttag(self, tag: str, attrs: list[tuple[str, str | None]]) -> None:
  14. # For example:
  15. # attrs = [("content", "My manual description"), ("name", "description")]
  16. if ('name', 'description') in attrs:
  17. self.meta_description = True
  18. for name, value in attrs:
  19. if name == 'content':
  20. self.meta_description = value
  21. break