A convenient library for everyday parsing of sites
pip3 install git+https://github.com/afedotov89/site-parser@f830001f275b25c051ac3a1bf096f7e050f3c9c9
>>> from siteparser.parser import Parser
>>> parser = Parser().html('https://www.kinopoisk.ru/top/')
>>> docs = [
sub_parser.take(
title='./td[2]/a',
original_title='./td[2]/span',
vote='./td[3]//a'
).document
for sub_parser in parser.foreach('//tr[contains(@id, "top250_place_")]')
]
>>> len(docs)
250
>>> docs[0]
{'title': 'Побег из Шоушенка (1994)', 'original_title': 'The Shawshank Redemption', 'vote': '9.191'}