# extractors.py

# Pin the package name explicitly. Presumably this is so the relative import
# of `.binaries` below resolves against 'plugins_extractor.mercury' regardless
# of how the plugin loader imports this file -- TODO confirm with the loader.
__package__ = 'plugins_extractor.mercury'
  2. from pathlib import Path
  3. from abx.archivebox.base_extractor import BaseExtractor, ExtractorName
  4. from .binaries import MERCURY_BINARY
  5. class MercuryExtractor(BaseExtractor):
  6. name: ExtractorName = 'mercury'
  7. binary: str = MERCURY_BINARY.name
  8. def get_output_path(self, snapshot) -> Path | None:
  9. return snapshot.link_dir / 'mercury' / 'content.html'
# Module-level MercuryExtractor instance, created once at import time.
MERCURY_EXTRACTOR = MercuryExtractor()