apps.py 5.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154
  1. __package__ = 'archivebox.builtin_plugins.singlefile'
  2. from pathlib import Path
  3. from typing import List, Dict, Optional, ClassVar
  4. from typing_extensions import Self
  5. from django.conf import settings
  6. # Depends on other PyPI/vendor packages:
  7. from pydantic import InstanceOf, Field, validate_call
  8. from pydantic_pkgr import BinProvider, BinProviderName, ProviderLookupDict, BinName, bin_abspath
  9. # Depends on other Django apps:
  10. from plugantic.base_plugin import BasePlugin
  11. from plugantic.base_configset import BaseConfigSet, ConfigSectionName
  12. from plugantic.base_binary import BaseBinary, env
  13. from plugantic.base_extractor import BaseExtractor
  14. from plugantic.base_queue import BaseQueue
  15. from plugantic.base_hook import BaseHook
  16. # Depends on Other Plugins:
  17. from builtin_plugins.npm.apps import SYS_NPM_BINPROVIDER, LIB_NPM_BINPROVIDER
  18. from builtin_plugins.base.apps import CORE_CONFIG
  19. ###################### Config ##########################
  class SinglefileToggleConfigs(BaseConfigSet):
      """On/off switch for the SingleFile archive method."""

      # Name of the config section this set is declared under.
      section: ClassVar[ConfigSectionName] = 'ARCHIVE_METHOD_TOGGLES'

      # SingleFile archiving is enabled unless overridden.
      SAVE_SINGLEFILE: bool = True
  class SinglefileOptionsConfigs(BaseConfigSet):
      """SingleFile options whose defaults are read from ``CORE_CONFIG``.

      Each field's default is a zero-argument lambda returning the
      corresponding ``CORE_CONFIG`` attribute.

      NOTE(review): the lambdas are passed as ``default=`` rather than
      ``default_factory=``; presumably ``BaseConfigSet`` resolves callable
      defaults itself -- confirm against plugantic.base_configset.
      """

      # Name of the config section this set is declared under.
      section: ClassVar[ConfigSectionName] = 'ARCHIVE_METHOD_OPTIONS'

      SINGLEFILE_USER_AGENT: str = Field(default=lambda: CORE_CONFIG.USER_AGENT)
      SINGLEFILE_TIMEOUT: int = Field(default=lambda: CORE_CONFIG.TIMEOUT)
      SINGLEFILE_CHECK_SSL_VALIDITY: bool = Field(default=lambda: CORE_CONFIG.CHECK_SSL_VALIDITY)
      SINGLEFILE_RESTRICT_FILE_NAMES: str = Field(default=lambda: CORE_CONFIG.RESTRICT_FILE_NAMES)
      SINGLEFILE_COOKIES_FILE: Optional[Path] = Field(default=lambda: CORE_CONFIG.COOKIES_FILE)
  class SinglefileDependencyConfigs(BaseConfigSet):
      """Binary name and command-line argument settings for SingleFile."""

      # Name of the config section this set is declared under.
      section: ClassVar[ConfigSectionName] = 'DEPENDENCY_CONFIG'

      # Default names the single-file executable (the same name that
      # SinglefileBinary declares in this file) instead of 'wget'.
      SINGLEFILE_BINARY: str = Field(default='single-file')

      # Optional full argument list; None when not configured.
      SINGLEFILE_ARGS: Optional[List[str]] = Field(default=None)

      # Extra arguments; empty by default.
      SINGLEFILE_EXTRA_ARGS: List[str] = []

      # NOTE(review): '{TIMEOUT-10}' is a literal placeholder inside a plain
      # (non-f) string; nothing in this file substitutes it -- confirm where
      # (or whether) it gets rendered before being passed to the binary.
      SINGLEFILE_DEFAULT_ARGS: List[str] = ['--timeout={TIMEOUT-10}']
  class SinglefileConfigs(SinglefileToggleConfigs, SinglefileOptionsConfigs, SinglefileDependencyConfigs):
      """Single config set combining the toggle, option and dependency settings."""
      # section: ClassVar[ConfigSectionName] = 'ALL_CONFIGS'
  # Values passed as keyword arguments when the plugin's config set is built.
  DEFAULT_GLOBAL_CONFIG = dict(
      CHECK_SSL_VALIDITY=False,
      SAVE_SINGLEFILE=True,
      TIMEOUT=120,
  )

  # NOTE(review): CHECK_SSL_VALIDITY and TIMEOUT are not declared on the config
  # classes in this file (those use SINGLEFILE_-prefixed names); presumably
  # BaseConfigSet accepts them as extra values -- confirm.
  SINGLEFILE_CONFIG = SinglefileConfigs(**DEFAULT_GLOBAL_CONFIG)
  # Version bounds for the single-file-cli npm package: the package spec built
  # in SinglefileBinary requires >= MIN and < MAX.
  SINGLEFILE_MIN_VERSION = '1.1.54'
  SINGLEFILE_MAX_VERSION = '1.1.60'
  def _singlefile_abspath(provider):
      """Look up 'single-file', then 'single-file-node.js', on ``provider.PATH``."""
      return (
          bin_abspath('single-file', PATH=provider.PATH)
          or bin_abspath('single-file-node.js', PATH=provider.PATH)
      )


  class SinglefileBinary(BaseBinary):
      """The ``single-file`` binary and the providers it can be found in or installed with.

      ``install`` and ``load_or_install`` fall back to the lib/npm provider
      when the caller does not name one, so global NPM packages are not
      modified by default.
      """

      name: BinName = 'single-file'

      binproviders_supported: List[InstanceOf[BinProvider]] = [LIB_NPM_BINPROVIDER, SYS_NPM_BINPROVIDER, env]

      # Per-provider lookup overrides; each value is a zero-argument callable,
      # so PATH is read when the callable runs rather than at import time.
      provider_overrides: Dict[BinProviderName, ProviderLookupDict] = {
          env.name: {
              'abspath': lambda: _singlefile_abspath(env),
          },
          LIB_NPM_BINPROVIDER.name: {
              'abspath': lambda: _singlefile_abspath(LIB_NPM_BINPROVIDER),
              'packages': lambda: [
                  f"single-file-cli@>={SINGLEFILE_MIN_VERSION} <{SINGLEFILE_MAX_VERSION}",
              ],
          },
          SYS_NPM_BINPROVIDER.name: {
              # prevent modifying system global npm packages
              'packages': lambda: [],
          },
      }

      @validate_call
      def install(self, binprovider_name: Optional[BinProviderName]=None) -> Self:
          """Install via ``binprovider_name``, or via the lib/npm provider when none is given."""
          # Default to lib/npm: we never want to modify global NPM packages.
          chosen_provider = binprovider_name or LIB_NPM_BINPROVIDER.name
          return BaseBinary.install(self, binprovider_name=chosen_provider)

      @validate_call
      def load_or_install(self, binprovider_name: Optional[BinProviderName] = None) -> Self:
          """Return the loaded binary, installing it if loading raises any ``Exception``.

          The install fallback uses ``binprovider_name``, or the lib/npm
          provider when none is given.
          """
          try:
              loaded = self.load()
          except Exception:
              # Default to lib/npm: we never want to modify global NPM packages.
              fallback_provider = binprovider_name or LIB_NPM_BINPROVIDER.name
              return BaseBinary.install(self, binprovider_name=fallback_provider)
          return loaded

      # ALTERNATIVE INSTALL METHOD using Ansible:
      # install_playbook = PLUGANTIC_DIR / 'ansible' / 'install_singlefile.yml'
      # singlefile_bin = run_playbook(install_playbook, data_dir=settings.CONFIG.OUTPUT_DIR, quiet=quiet).BINARIES.singlefile
      # return self.__class__.model_validate(
      #     {
      #         **self.model_dump(),
      #         "loaded_abspath": singlefile_bin.abspath,
      #         "loaded_version": singlefile_bin.version,
      #         "loaded_binprovider": env,
      #         "binproviders_supported": self.binproviders_supported,
      #     }
      # )
  # Module-level SinglefileBinary instance, also listed in PLUGIN_BINARIES.
  SINGLEFILE_BINARY = SinglefileBinary()
  PLUGIN_BINARIES = [
      SINGLEFILE_BINARY,
  ]
  class SinglefileExtractor(BaseExtractor):
      """Extractor named 'singlefile' that is tied to the single-file binary by name."""

      name: str = 'singlefile'
      binary: BinName = SINGLEFILE_BINARY.name

      def get_output_path(self, snapshot) -> Path:
          """Return the path of 'singlefile.html' inside ``snapshot.link_dir``."""
          snapshot_dir = Path(snapshot.link_dir)
          return snapshot_dir.joinpath('singlefile.html')
  # SINGLEFILE_BINARY is already instantiated right after the SinglefileBinary
  # class. It is deliberately not re-created here: a second instance would
  # leave PLUGIN_BINARIES holding a different object than the one referenced
  # by the queue and plugin hooks defined further down.
  SINGLEFILE_EXTRACTOR = SinglefileExtractor()
  class SinglefileQueue(BaseQueue):
      """Queue named 'singlefile' that lists the single-file binary."""

      name: str = 'singlefile'
      binaries: List[InstanceOf[BaseBinary]] = [
          SINGLEFILE_BINARY,
      ]


  # Module-level queue instance, included in the plugin's hooks.
  SINGLEFILE_QUEUE = SinglefileQueue()
  class SinglefilePlugin(BasePlugin):
      """Plugin definition bundling the SingleFile config, binary, extractor and queue."""

      app_label: str = 'singlefile'
      verbose_name: str = 'SingleFile'

      # Hook instances provided by this plugin, in declaration order.
      hooks: List[InstanceOf[BaseHook]] = [
          SINGLEFILE_CONFIG,
          SINGLEFILE_BINARY,
          SINGLEFILE_EXTRACTOR,
          SINGLEFILE_QUEUE,
      ]
  # Instantiate the plugin and register it against the Django settings at import time.
  PLUGIN = SinglefilePlugin()
  PLUGIN.register(settings)

  # AppConfig exposed by the plugin instance, published under the DJANGO_APP name.
  DJANGO_APP = PLUGIN.AppConfig