from lxml import html


def get_urls_from_page(url, pages=range(10)):
    """Collect the text nodes matched by a fixed XPath on each numbered page.

    Despite the name, this returns the text content selected by the XPath
    below, not URLs.

    Args:
        url: Base URL to which each page number is appended verbatim
            (e.g. ``'http://host/archive/page/'``).
        pages: Iterable of page numbers to fetch. Defaults to ``range(10)``,
            the same ten iterations the original loop performed.

    Returns:
        A flat list of the XPath text results from all fetched pages, in
        page order.
    """
    path = './/*[@class = "span10"]/div[1]/text()'
    result = []
    for page in pages:
        # Append the page number itself. The previous code appended the
        # literal string 'page', so every iteration fetched the same URL.
        # NOTE(review): the default starts at page 0 -- confirm whether the
        # site's pagination starts at 0 or 1.
        doc = html.parse(url + str(page))
        result.extend(doc.xpath(path))
    return result


# Script driver: fetch the archive pages and print every matched text node.
headers = get_urls_from_page('http://msl.ua/ru/megalot/archive/page/')
for h in headers:
    print(h)