diff --git a/modules/taz/pages/article.py b/modules/taz/pages/article.py index b769288372d5872bc4d468ab8037c4b1f5e10009..aad673f5c38c8d3bbb9baba7d733edae2dae905e 100644 --- a/modules/taz/pages/article.py +++ b/modules/taz/pages/article.py @@ -19,7 +19,7 @@ # along with weboob. If not, see <http://www.gnu.org/licenses/>. from weboob.tools.capabilities.messages.genericArticle import GenericNewsPage,\ - try_drop_tree + try_drop_tree, clean_relativ_urls class ArticlePage(GenericNewsPage): @@ -33,15 +33,7 @@ def on_loaded(self): def get_body(self): div = self.document.getroot().find('.//div[@class="sectbody"]') try_drop_tree(self.parser, div, "div.anchor") - for a in div.findall('.//a'): - try: - if a.attrib["href"][0:7] != "http://": - a.attrib["href"] = "http://taz.de/" + a.attrib["href"] - except: - continue - for img in div.findall('.//img'): - if img.attrib["src"][0:7] != "http://": - img.attrib["src"] = "http://taz.de/" + img.attrib["src"] + clean_relativ_urls(div, "http://taz.de") return self.parser.tostring(div)