test_update.py 1.2 KB

123456789101112131415161718192021222324252627282930313233
  1. import sqlite3
  2. from .fixtures import *
  3. def test_update_imports_orphaned_snapshots(tmp_path, process, disable_extractors_dict):
  4. """Test that archivebox update imports orphaned snapshot directories."""
  5. # Add a snapshot
  6. subprocess.run(['archivebox', 'add', 'https://example.com'], capture_output=True, env=disable_extractors_dict)
  7. assert list((tmp_path / "archive").iterdir()) != []
  8. # Remove from DB but leave directory intact
  9. subprocess.run(['archivebox', 'remove', 'https://example.com', '--yes'], capture_output=True)
  10. # Verify snapshot removed from DB
  11. conn = sqlite3.connect(str(tmp_path / "index.sqlite3"))
  12. c = conn.cursor()
  13. link = c.execute("SELECT * FROM core_snapshot").fetchone()
  14. conn.commit()
  15. conn.close()
  16. assert link is None
  17. # Run update without filters - should scan filesystem and import orphaned directory
  18. update_process = subprocess.run(['archivebox', 'update'], capture_output=True, env=disable_extractors_dict)
  19. # Verify snapshot was re-imported from orphaned directory
  20. conn = sqlite3.connect(str(tmp_path / "index.sqlite3"))
  21. c = conn.cursor()
  22. url = c.execute("SELECT url FROM core_snapshot").fetchone()[0]
  23. conn.commit()
  24. conn.close()
  25. assert url == 'https://example.com'