Welcome to mirror list, hosted at ThFree Co, Russian Federation.

github.com/icoz/habraparse.git - Unnamed repository; edit this file 'description' to name the repository.
summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: icoz <icoz.vt@gmail.com> 2016-12-11 14:24:59 +0300
committer: icoz <icoz.vt@gmail.com> 2016-12-11 14:24:59 +0300
commit: 70cfc8706d15853199cd2303229430185d5e0065 (patch)
tree: b3f799723f2822ceb05954490a97d439d00073fd
parent: b2a3a29aac57a8f6b77c0ca27707e76f1eed3429 (diff)
Исправлен код разбора в связи с изменением разметки на хабре
-rw-r--r-- habr/user.py 6
1 file changed, 3 insertions, 3 deletions
diff --git a/habr/user.py b/habr/user.py
index f6cda91..611927a 100644
--- a/habr/user.py
+++ b/habr/user.py
@@ -118,7 +118,7 @@ class TMUser(object):
date_of_last_login = tmp[0].text.strip()
tmp = self._doc.xpath("//div[@class='user_header']/h2/a")
- self._user['username'] = tmp.pop().text if len(tmp) else ''
+ self._user['username'] = tmp.pop().text if len(tmp) else self._username
tmp = self._doc.xpath("//div[@class='karma']//div[@class='num']")
self._user_karma['karma'] = float(tmp.pop().text.replace(',', '.').replace("–","-")) if len(tmp) else 0.0
@@ -186,7 +186,7 @@ class TMUser(object):
doc = html.document_fromstring(requests.get(url).text)
out = dict()
pages = get_pages(doc)
- favs = doc.xpath("//div[@class='user_favorites']//a[@class='post_title']")
+ favs = doc.xpath("//div[@class='user_favorites']//a[@class='post__title_link']")
for f in favs:
# out[f.text] = str(f.attrib['href']).split('/')[-2]
# topic_id =
@@ -196,7 +196,7 @@ class TMUser(object):
# if show_progress:
# print('parsing page{0}... url={1}'.format(p, url))
doc = html.document_fromstring(requests.get(url).text)
- favs = doc.xpath("//div[@class='user_favorites']//a[@class='post_title']")
+ favs = doc.xpath("//div[@class='user_favorites']//a[@class='post__title_link']")
for f in favs:
# out[f.text] = f.attrib['href'][-7:-1]
out[f.text] = str(f.attrib['href']).split('/')[-2]