(self, response)
| 27 | return url |
| 28 | |
def parse(self, response):
    """Yield one item listing the file links found in ``response``.

    The response headers and body text are logged at INFO level first.
    The item is a dict with two entries: ``self.media_key`` mapped to an
    empty list, and ``self.media_urls_key`` mapped to the list of link
    targets taken from the table that has a "Filename" header cell.
    Each target is resolved with ``response.urljoin`` and then passed
    through ``self._process_url``.
    """
    self.logger.info(response.headers)
    self.logger.info(response.text)

    # href attributes of every anchor inside the body of the table whose
    # header row contains a "Filename" cell.
    hrefs = response.xpath(
        '//table[thead/tr/th="Filename"]/tbody//a/@href'
    ).getall()

    media_urls = []
    for href in hrefs:
        absolute_url = response.urljoin(href)
        media_urls.append(self._process_url(absolute_url))

    yield {
        self.media_key: [],
        self.media_urls_key: media_urls,
    }
| 42 | |
| 43 | |
| 44 | class BrokenLinksMediaDownloadSpider(MediaDownloadSpider): |
nothing calls this directly
no test coverage detected