From 874403e667302ffac7343172371dff5c9abb0a3a Mon Sep 17 00:00:00 2001 From: Cristian Date: Tue, 18 Aug 2020 12:38:01 -0500 Subject: [PATCH] feat: Remove patch_main_index --- archivebox/extractors/__init__.py | 6 ----- archivebox/index/__init__.py | 40 ------------------------------- archivebox/main.py | 3 +-- 3 files changed, 1 insertion(+), 48 deletions(-) diff --git a/archivebox/extractors/__init__.py b/archivebox/extractors/__init__.py index 988635b6..000159e3 100644 --- a/archivebox/extractors/__init__.py +++ b/archivebox/extractors/__init__.py @@ -9,7 +9,6 @@ from ..index.schema import Link from ..index import ( load_link_details, write_link_details, - patch_main_index, ) from ..util import enforce_types from ..logging_util import ( @@ -114,11 +113,6 @@ def archive_link(link: Link, overwrite: bool=False, methods: Optional[Iterable[s write_link_details(link, out_dir=out_dir, skip_sql_index=skip_index) - # # If any changes were made, update the main links index json and html - # was_changed = stats['succeeded'] or stats['failed'] - # if was_changed: - # patch_main_index(link) - log_link_archiving_finished(link, link.link_dir, is_new, stats) except KeyboardInterrupt: diff --git a/archivebox/index/__init__.py b/archivebox/index/__init__.py index 555882ab..fb5ec6ec 100644 --- a/archivebox/index/__init__.py +++ b/archivebox/index/__init__.py @@ -328,46 +328,6 @@ def dedupe_links(existing_links: List[Link], return all_links, new_links - -@enforce_types -def patch_main_index(link: Link, out_dir: str=OUTPUT_DIR) -> None: - """hack to in-place update one row's info in the generated index files""" - - # TODO: remove this ASAP, it's ugly, error-prone, and potentially dangerous - - title = link.title or link.latest_outputs(status='succeeded')['title'] - successful = link.num_outputs - - # Patch JSON main index - json_file_links = parse_json_main_index(out_dir) - patched_links = [] - for saved_link in json_file_links: - if saved_link.url == link.url: - patched_links.append(saved_link.overwrite( - title=title, - history=link.history, - updated=link.updated, - )) - else: - patched_links.append(saved_link) - - write_json_main_index(patched_links, out_dir=out_dir) - - # Patch HTML main index - html_path = os.path.join(out_dir, 'index.html') - with open(html_path, 'r') as f: - html = f.read().splitlines() - - for idx, line in enumerate(html): - if title and ('