瀏覽代碼

fix sql link parsing and writing

Nick Sweeting 6 年之前
父節點
當前提交
0b27f33d2e
共有 3 個文件被更改,包括 6 次插入4 次删除
  1. 4 2
      archivebox/legacy/index.py
  2. 1 1
      archivebox/legacy/logs.py
  3. 1 1
      archivebox/legacy/storage/sql.py

+ 4 - 2
archivebox/legacy/index.py

@@ -245,10 +245,12 @@ def load_main_index(out_dir: str=OUTPUT_DIR, warn: bool=True) -> List[Link]:
 
     all_links: List[Link] = []
     all_links = list(parse_json_main_index(out_dir))
-    links_from_sql = list(parse_sql_main_index())
+    links_from_sql = list(parse_sql_main_index(out_dir))
 
-    if warn and not set(l.url for l in all_links) == set(l['url'] for l in links_from_sql):
+    if warn and not set(l.url for l in all_links) == set(l.url for l in links_from_sql):
         stderr('{red}[!] Warning: SQL index does not match JSON index!{reset}'.format(**ANSI))
+        stderr('    To repair the index and re-import any orphaned links run:')
+        stderr('        archivebox init')
 
     return all_links
 

+ 1 - 1
archivebox/legacy/logs.py

@@ -60,7 +60,7 @@ def log_indexing_process_started(num_links: int):
     start_ts = datetime.now()
     _LAST_RUN_STATS.index_start_ts = start_ts
     print()
-    print('{green}[*] [{}] Updating {} links in main index...{reset}'.format(
+    print('{green}[*] [{}] Writing {} links to main index...{reset}'.format(
         start_ts.strftime('%Y-%m-%d %H:%M:%S'),
         num_links,
         **ANSI,

+ 1 - 1
archivebox/legacy/storage/sql.py

@@ -15,7 +15,7 @@ def parse_sql_main_index(out_dir: str=OUTPUT_DIR) -> Iterator[Link]:
     from core.models import Page
 
     return (
-        page.as_json(*Page.keys)
+        Link.from_json(page.as_json(*Page.keys))
         for page in Page.objects.all()
     )