archivebox.abx.archivebox.base_extractor

Module Contents

Classes

BaseExtractor

Functions

no_empty_args

Data

__package__

ExtractorName

HandlerFuncStr

CmdArgsList

API

archivebox.abx.archivebox.base_extractor.__package__

'abx.archivebox'

archivebox.abx.archivebox.base_extractor.no_empty_args(args: List[str]) -> List[str]
archivebox.abx.archivebox.base_extractor.ExtractorName

None

archivebox.abx.archivebox.base_extractor.HandlerFuncStr

None

archivebox.abx.archivebox.base_extractor.CmdArgsList

None

class archivebox.abx.archivebox.base_extractor.BaseExtractor

Bases: archivebox.abx.archivebox.base_hook.BaseHook

hook_type: archivebox.abx.archivebox.base_hook.HookType

'EXTRACTOR'

name: archivebox.abx.archivebox.base_extractor.ExtractorName

None

binary: pydantic_pkgr.BinName

None

output_path_func: archivebox.abx.archivebox.base_extractor.HandlerFuncStr

'self.get_output_path'

should_extract_func: archivebox.abx.archivebox.base_extractor.HandlerFuncStr

'self.should_extract'

extract_func: archivebox.abx.archivebox.base_extractor.HandlerFuncStr

'self.extract'

exec_func: archivebox.abx.archivebox.base_extractor.HandlerFuncStr

'self.exec'

default_args: archivebox.abx.archivebox.base_extractor.CmdArgsList

[]

extra_args: archivebox.abx.archivebox.base_extractor.CmdArgsList

[]

args: Optional[archivebox.abx.archivebox.base_extractor.CmdArgsList]

None

validate_model() -> typing_extensions.Self
get_output_path(snapshot) -> pathlib.Path
should_extract(snapshot) -> bool
extract(snapshot_id: str) -> Dict[str, Any]
exec(args: archivebox.abx.archivebox.base_extractor.CmdArgsList = (), cwd: Optional[pathlib.Path] = None, installed_binary=None)
BINARY() -> archivebox.abx.archivebox.base_binary.BaseBinary
detect_installed_binary()
load_binary(installed_binary=None) -> archivebox.abx.archivebox.base_binary.BaseBinary
detect_network_interface()
get_EXTRACTORS()