Return an unconfigured Crawler object. If `settings_dict` is given, it is used to populate the crawler settings with project-level priority.
(
spidercls: type[Spider] | None = None,
settings_dict: dict[str, Any] | None = None,
prevent_warnings: bool = True,
)
| 58 | |
| 59 | |
def get_crawler(
    spidercls: type[Spider] | None = None,
    settings_dict: dict[str, Any] | None = None,
    prevent_warnings: bool = True,
) -> Crawler:
    """Return an unconfigured Crawler object.

    The crawler is created for ``spidercls`` (``DefaultSpider`` when it is
    omitted or falsy). If ``settings_dict`` is given, it will be used to
    populate the crawler settings with a project level priority; its entries
    override the values returned by ``get_reactor_settings()`` on key clashes.

    ``prevent_warnings`` is accepted as part of the signature but is not
    consulted by this function body.
    """
    # Reactor settings form the baseline. When needed, other useful settings
    # can be added here, e.g. ones that prevent deprecation warnings.
    merged_settings: dict[str, Any] = {**get_reactor_settings()}
    # Caller-supplied values are applied last so that they take precedence.
    merged_settings.update(settings_dict or {})

    # Choose the runner flavour based on whether a reactor is installed.
    runner_cls = CrawlerRunner if is_reactor_installed() else AsyncCrawlerRunner
    runner: CrawlerRunnerBase = runner_cls(merged_settings)

    spider_class = spidercls or DefaultSpider
    new_crawler = runner.create_crawler(spider_class)
    new_crawler._apply_settings()
    return new_crawler
| 83 | |
| 84 | |
| 85 | def get_pythonpath() -> str: |
nothing calls this directly
no test coverage detected