Method parse

tests/test_pipeline_crawl.py:29–41 · view source on GitHub ↗

(self, response)

Source from the content-addressed store, hash-verified

27	return url
28
def parse(self, response):
    """Yield one item listing the file links found in the response.

    The response headers and body text are logged at info level first.
    Every ``href`` on an anchor inside the ``tbody`` of a table whose
    header row has a ``Filename`` cell is resolved against the response
    URL with ``response.urljoin`` and then passed through
    ``self._process_url``.

    The yielded dict maps ``self.media_key`` to an empty list and
    ``self.media_urls_key`` to the list of processed URLs.
    """
    log = self.logger
    log.info(response.headers)
    log.info(response.text)

    # Start with the media key so the item is built in the same order as
    # a literal ``{media_key: [], media_urls_key: [...]}`` would be.
    item = {self.media_key: []}

    filename_links = response.xpath(
        '//table[thead/tr/th="Filename"]/tbody//a/@href'
    )
    processed_urls = []
    for link in filename_links.getall():
        absolute_url = response.urljoin(link)
        processed_urls.append(self._process_url(absolute_url))
    item[self.media_urls_key] = processed_urls

    yield item
42
43
44	class BrokenLinksMediaDownloadSpider(MediaDownloadSpider):

nothing calls this directly

_process_urlMethod · 0.95

infoMethod · 0.80

urljoinMethod · 0.45

xpathMethod · 0.45

no test coverage detected