mirror of
https://github.com/ArchiveBox/ArchiveBox.git
synced 2025-05-14 15:14:31 -04:00
20 lines
498 B
Python
20 lines
498 B
Python
# Set the package name explicitly; Python consults __package__ when resolving
# relative imports such as the `.binaries` import in this module.
__package__ = 'plugins_extractor.readability'
|
|
|
|
from pathlib import Path
|
|
|
|
from pydantic_pkgr import BinName
|
|
|
|
from abx.archivebox.base_extractor import BaseExtractor
|
|
|
|
from .binaries import READABILITY_BINARY
|
|
|
|
|
|
# Extractor definition for the readability plugin: declares the extractor's
# name, the name of the binary it uses, and the location of its output file
# inside a snapshot's directory.
class ReadabilityExtractor(BaseExtractor):
    # Identifier of this extractor.
    name: str = 'readability'
    # Binary name, taken from this plugin's READABILITY_BINARY definition.
    binary: BinName = READABILITY_BINARY.name

    def get_output_path(self, snapshot) -> Path:
        """Return the path `<snapshot.link_dir>/readability/content.html`.

        `snapshot` only needs to expose a `link_dir` attribute that
        `Path()` accepts.
        """
        snapshot_dir = Path(snapshot.link_dir)
        return snapshot_dir.joinpath('readability', 'content.html')
|
|
|
|
|
|
# Module-level ReadabilityExtractor instance, created once when this module is imported.
READABILITY_EXTRACTOR = ReadabilityExtractor()
|