Bläddra i källkod

feat: Add warc to list and limit check to succeeded archive results

Cristian 5 år sedan
förälder
incheckning
71655220ad
1 ändrade filer med 6 tillägg och 2 borttagningar
  1. 6 2
      archivebox/core/utils.py

+ 6 - 2
archivebox/core/utils.py

@@ -20,17 +20,21 @@ def get_icons(snapshot: Snapshot) -> str:
         "archive_org": "🏛",
         "readability": "🆁",
         "mercury": "🅼",
+        "warc": "📦"
     }
     exclude = ["favicon"]
     # Missing specific entry for WARC
 
-
     for extractor in EXTRACTORS:
-        result = archive_results.filter(extractor=extractor[0])
+        result = archive_results.filter(extractor=extractor[0], status="succeeded")
         try:
             if extractor[0] not in exclude:
                 output += output_template.format(link.archive_path, canon[f"{extractor[0]}_path"],
                                                  result.exists(), extractor[0], icons.get(extractor[0], "?"))
+            if extractor[0] == "wget":
+                extractor = "warc"
+                output += output_template.format(link.archive_path, canon[f"{extractor}_path"],
+                                                 result.exists(), extractor, icons.get(extractor, "?"))
         except Exception as e:
             print(e)