mirror of
https://github.com/ArchiveBox/ArchiveBox.git
synced 2025-05-30 06:25:28 -04:00
new generic_html parser for extracting hrefs
This commit is contained in:
parent
a682a9c478
commit
15efb2d5ed
5 changed files with 106 additions and 39 deletions
|
@ -70,6 +70,7 @@ archivebox/index/json.py
|
|||
archivebox/index/schema.py
|
||||
archivebox/index/sql.py
|
||||
archivebox/parsers/__init__.py
|
||||
archivebox/parsers/generic_html.py
|
||||
archivebox/parsers/generic_json.py
|
||||
archivebox/parsers/generic_rss.py
|
||||
archivebox/parsers/generic_txt.py
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue