Scraply (, <ul> <ol>) - . . , HTML/, , , (<li></li>), , , , .
, , , . , case .split('\n')[3:-2] :
['- 50 gr de hojas de albahaca',
'- 4 cucharadas (60 ml) de piñones',
'- 2 - 4 dientes de ajo',
'- 120 ml (1/2 vaso) de aceite de oliva virgen extra',
'- 115 gr de queso parmesano recién rallado',
'- 25 gr de queso pecorino recién rallado ( o queso de leche de oveja curado)']
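To post-process scraped fields (for example, to deal with the leading "- " markers), the Scraper class can be extended, for example: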
class PostprocessScraper(Scraper):
    """Scraper subclass that can post-process scraped fields."""

    def scrape_page_postprocess(self, page, processors=None):
        """Scrape *page* and run per-field processors over the result.

        Args:
            page: Passed unchanged to ``self.scrape_page``.
            processors: Optional mapping of field name to a one-argument
                callable. When omitted (``None``), no field is processed.

        Returns:
            The object returned by ``self.scrape_page(page)``. Each record
            in it is updated in place: for every field that has a
            processor, the field's value is replaced by a list holding the
            processor's result for each of the field's items.
        """
        # Identity check: ``== None`` could dispatch to a custom ``__eq__``.
        if processors is None:
            processors = {}
        result = self.scrape_page(page)
        for r in result:
            # Only existing keys are reassigned, so the record's size does
            # not change while ``items()`` is being iterated.
            for field, items in r.items():
                if field in processors:
                    fn = processors[field]
                    r[field] = [fn(i) for i in items]
        return result
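scrape_page_postprocess takes the page and a dictionary that maps a field name to the function applied to each item of that field. For example: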
# Map the 'ingredients' field to a function that splits a string on newlines
# and drops the first three and the last two pieces.
processors = {'ingredients': lambda s: s.split('\n')[3:-2]}
# NOTE(review): scrape_page_postprocess is defined as a method of
# PostprocessScraper; this bare call presumably stands for a call on a
# scraper instance, and `page` is not defined in this snippet -- confirm.
scrape_page_postprocess(page, processors)