diff --git a/Dockerfile b/Dockerfile index e147e56e..dda3c97a 100644 --- a/Dockerfile +++ b/Dockerfile @@ -1,6 +1,8 @@ # This is the Dockerfile for ArchiveBox, it bundles the following dependencies: # python3, ArchiveBox, curl, wget, git, chromium, youtube-dl, yt-dlp, single-file # Usage: +# git submodule update --init --recursive +# git pull --recurse-submodules # docker build . -t archivebox --no-cache # docker run -v "$PWD/data":/data archivebox init # docker run -v "$PWD/data":/data archivebox add 'https://example.com' @@ -9,6 +11,9 @@ # Multi-arch build: # docker buildx create --use # docker buildx build . --platform=linux/amd64,linux/arm64,linux/arm/v7 --push -t archivebox/archivebox:latest -t archivebox/archivebox:dev +# +# Read more about [developing +# ArchiveBox](https://github.com/ArchiveBox/ArchiveBox#archivebox-development). FROM python:3.10-slim-bullseye diff --git a/archivebox/extractors/__init__.py b/archivebox/extractors/__init__.py index 8623a15b..1acefdf4 100644 --- a/archivebox/extractors/__init__.py +++ b/archivebox/extractors/__init__.py @@ -128,7 +128,7 @@ def archive_link(link: Link, overwrite: bool=False, methods: Optional[Iterable[s else: # print('{black} X {}{reset}'.format(method_name, **ANSI)) stats['skipped'] += 1 - except Exception: + except Exception as e: # Disabled until https://github.com/ArchiveBox/ArchiveBox/issues/984 # and https://github.com/ArchiveBox/ArchiveBox/issues/1014 # are fixed. diff --git a/archivebox/parsers/__init__.py b/archivebox/parsers/__init__.py index 992446ba..c033ab28 100644 --- a/archivebox/parsers/__init__.py +++ b/archivebox/parsers/__init__.py @@ -154,7 +154,7 @@ def save_text_as_source(raw_text: str, filename: str='{ts}-stdin.txt', out_dir: for entry in raw_text.split(): try: - if Path(entry).exists: + if Path(entry).exists(): referenced_texts += Path(entry).read_text() except Exception as err: print(err)