diff options
-rw-r--r-- | habr/topic.py | 5 |
1 files changed, 2 insertions, 3 deletions
diff --git a/habr/topic.py b/habr/topic.py index 0ca4e36..c12332f 100644 --- a/habr/topic.py +++ b/habr/topic.py @@ -82,15 +82,14 @@ class TMTopic(object): "//ul[@class='postinfo-panel postinfo-panel_post']//span[@class='oting-wjt__counter-score js-score']") self.post['rating'] = tmp[0].text if len(tmp) else '' tmp = doc.xpath("//div[@class='content html_format js-mediator-article']") or \ - doc.xpath("//div[@class='content html_format']") or \ - doc.xpath('//div[@class="article__body"]') + doc.xpath('//div[@class="article__body js-mediator-article"]') self.post['text'] = etree.tostring(tmp[0], pretty_print=True, method='html').decode('utf-8') \ if len(tmp) else '' self.post['comments'] = [] # bug in class 'comments_list ' - space added # comments = doc.xpath("//div[@class='comments_list ']//div[@class='comment_item']") # comments = doc.xpath("//ul[@id='comments-list']//li[@class='comment_item']") - # record = (author, text)text + # record = (author, text) authors = list( map(lambda x: x.text, doc.xpath("//ul[@id='comments-list']//a[@class='comment-item__username']")) ) |