Welcome to mirror list, hosted at ThFree Co, Russian Federation.

github.com/icoz/habraparse.git - Unnamed repository; edit this file 'description' to name the repository.
summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: icoz <icoz.vt@gmail.com> 2017-08-06 10:06:23 +0300
committer: icoz <icoz.vt@gmail.com> 2017-08-06 10:06:23 +0300
commit: a09fe184612502432c92c483dc6a7e097f9015ac (patch)
tree: 564464b1f8ddc00fb3898e7e9a6b2b68e4f005e1
parent: 55fddda03182fb3d2c2163d98926a1ef8d676d69 (diff)
parent: e2713d8ab741ee31af965bb5f2b53eaabff0631b (diff)
Merge remote-tracking branch 'origin/master'
# Conflicts:
#	habr/topic.py
-rw-r--r-- habr/topic.py 5
1 files changed, 2 insertions, 3 deletions
diff --git a/habr/topic.py b/habr/topic.py
index 0ca4e36..c12332f 100644
--- a/habr/topic.py
+++ b/habr/topic.py
@@ -82,15 +82,14 @@ class TMTopic(object):
"//ul[@class='postinfo-panel postinfo-panel_post']//span[@class='oting-wjt__counter-score js-score']")
self.post['rating'] = tmp[0].text if len(tmp) else ''
tmp = doc.xpath("//div[@class='content html_format js-mediator-article']") or \
- doc.xpath("//div[@class='content html_format']") or \
- doc.xpath('//div[@class="article__body"]')
+ doc.xpath('//div[@class="article__body js-mediator-article"]')
self.post['text'] = etree.tostring(tmp[0], pretty_print=True, method='html').decode('utf-8') \
if len(tmp) else ''
self.post['comments'] = []
# bug in class 'comments_list ' - space added
# comments = doc.xpath("//div[@class='comments_list ']//div[@class='comment_item']")
# comments = doc.xpath("//ul[@id='comments-list']//li[@class='comment_item']")
- # record = (author, text)text
+ # record = (author, text)
authors = list(
map(lambda x: x.text, doc.xpath("//ul[@id='comments-list']//a[@class='comment-item__username']"))
)