mirror of
https://github.com/ArchiveBox/ArchiveBox.git
synced 2025-05-09 12:21:57 -04:00
65 lines
1.3 KiB
Python
65 lines
1.3 KiB
Python
__package__ = 'plugins_extractor.chrome'
|
|
__label__ = 'chrome'
|
|
__version__ = '2024.10.14'
|
|
__author__ = 'ArchiveBox'
|
|
__homepage__ = 'https://github.com/ArchiveBox/ArchiveBox/tree/main/archivebox/plugins_extractor/chrome'
|
|
__dependencies__ = []
|
|
|
|
import abx
|
|
|
|
|
|
@abx.hookimpl
|
|
def get_PLUGIN():
|
|
return {
|
|
'chrome': {
|
|
'PACKAGE': __package__,
|
|
'LABEL': __label__,
|
|
'VERSION': __version__,
|
|
'AUTHOR': __author__,
|
|
'HOMEPAGE': __homepage__,
|
|
'DEPENDENCIES': __dependencies__,
|
|
}
|
|
}
|
|
|
|
@abx.hookimpl
|
|
def get_CONFIG():
|
|
from .config import CHROME_CONFIG
|
|
|
|
return {
|
|
'chrome': CHROME_CONFIG
|
|
}
|
|
|
|
@abx.hookimpl
|
|
def get_BINARIES():
|
|
from .binaries import CHROME_BINARY
|
|
|
|
return {
|
|
'chrome': CHROME_BINARY,
|
|
}
|
|
|
|
# @abx.hookimpl
|
|
# def get_EXTRACTORS():
|
|
# return {
|
|
# 'pdf': PDF_EXTRACTOR,
|
|
# 'screenshot': SCREENSHOT_EXTRACTOR,
|
|
# 'dom': DOM_EXTRACTOR,
|
|
# }
|
|
|
|
# Hooks Available:
|
|
|
|
# Events:
|
|
# on_crawl_schedule_tick
|
|
# on_seed_post_save
|
|
# on_crawl_post_save
|
|
# on_snapshot_post_save
|
|
# on_archiveresult_post_save
|
|
|
|
|
|
# create_root_snapshot_from_seed
|
|
# create_archiveresults_pending_from_snapshot
|
|
# create_crawl_from_crawlschedule_if_due
|
|
# create_crawl_copy_from_template
|
|
#
|
|
|
|
|
|
# create_crawl_from_crawlschedule_if_due
|