Welcome to mirror list, hosted at ThFree Co, Russian Federation.

github.com/icoz/habraparse.git - Unnamed repository; edit this file 'description' to name the repository.
summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author icoz <icoz.vt@gmail.com> 2017-11-15 01:04:29 +0300
committer icoz <icoz.vt@gmail.com> 2017-11-15 01:04:29 +0300
commit 93d4ac29e008ed24bbd8b5997f4eddad69d9ed51 (patch)
tree 12e24c1c0caaa6b1b0c2587326ed4ec5e2f0b2ec
parent 51a49ef6ba355872db9b7752f3f4d75c04fe548e (diff)
topic.py:
- исправлено правило для выборки текста статьи
-rw-r--r-- habr/topic.py 8
1 file changed, 4 insertions, 4 deletions
diff --git a/habr/topic.py b/habr/topic.py
index 5a4170a..3a26806 100644
--- a/habr/topic.py
+++ b/habr/topic.py
@@ -84,10 +84,10 @@ class TMTopic(object):
tmp = doc.xpath(
"//ul[@class='postinfo-panel postinfo-panel_post']//span[@class='oting-wjt__counter-score js-score']")
self.post['rating'] = tmp[0].text if len(tmp) else ''
- tmp = doc.xpath("//div[@class='content html_format js-mediator-article']") or \
- doc.xpath('//div[@class="article__body js-mediator-article"]')
- self.post['text'] = etree.tostring(tmp[0], pretty_print=True, method='html').decode('utf-8') \
- if len(tmp) else ''
+ # tmp = doc.xpath("//div[@class='content html_format js-mediator-article']") or \
+ # doc.xpath('//div[@class="article__body js-mediator-article"]') or \
+ tmp = doc.xpath('//div[@class="post__text post__text-html js-mediator-article"]')
+ self.post['text'] = etree.tostring(tmp[0], pretty_print=True, method='html').decode('utf-8') if len(tmp) else ''
# get comments
self.post['comments'] = []
for cmnt in doc.xpath("//ul[@id='comments-list']//li[@class='content-list__item content-list__item_comment js-comment ']"):