- Define generic Result[T] dataclass (7 fields: success, status_code, data, list, count, is_end_page, error)
- Port parse_response() from spiderJobs/core/base.py, returning Result[Any]
- BaseFetcher: 4 template methods (_build_params and _parse are required; _build_headers and _check_blocked are optional)
- BaseSearcher: 4 template methods, with a load_all() paginator that uses stdlib logging
- crawler_core/__init__.py exports BaseFetcher, BaseSearcher, Result, HTTPClient, parse_response
- No ApiResult, no loguru, no spiderJobs/app imports
20 lines
443 B
Python
20 lines
443 B
Python
"""
|
|
crawler_core — 招聘爬虫共享核心包
|
|
|
|
安装方式: pip install -e ./crawler_core
|
|
使用方式: from crawler_core import BaseFetcher, BaseSearcher, Result, HTTPClient
|
|
"""
|
|
|
|
from crawler_core.base import Result, BaseFetcher, BaseSearcher, parse_response
|
|
from crawler_core.http_client import HTTPClient
|
|
|
|
__all__ = [
|
|
"Result",
|
|
"BaseFetcher",
|
|
"BaseSearcher",
|
|
"HTTPClient",
|
|
"parse_response",
|
|
]
|
|
|
|
__version__ = "0.1.0"
|