Newer
Older
# -*- coding: utf-8 -*-
# Copyright(C) 2012 Romain Bignon
#
# This file is part of a weboob module.
# This weboob module is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This weboob module is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU Affero General Public License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this weboob module. If not, see <http://www.gnu.org/licenses/>.
from weboob.browser.pages import XMLPage, JsonPage, pagination
from weboob.browser.elements import ItemElement, ListElement, DictElement, method
from weboob.browser.filters.json import Dict
from weboob.browser.filters.html import XPath
from weboob.browser.filters.standard import (CleanText, CleanDecimal, Currency,
from weboob.capabilities.base import NotAvailable, NotLoaded
from weboob.capabilities.housing import (Housing, HousingPhoto, City,
UTILITIES, ENERGY_CLASS, POSTS_TYPES,
ADVERT_TYPES)
from weboob.tools.capabilities.housing.housing import PricePerMeterFilter
from .constants import TYPES, RET
class CitiesPage(JsonPage):
@method
class iter_cities(DictElement):
Bezleputh
committed
ignore_duplicate = True
obj_id = Dict('Params/ci')
obj_name = Dict('Display')
class SeLogerItem(ItemElement):
klass = Housing
obj_id = CleanText('idAnnonce')
def obj_type(self):
idType = int(CleanText('idTypeTransaction')(self))
type = next(k for k, v in TYPES.items() if v == idType)
if type == POSTS_TYPES.FURNISHED_RENT:
# SeLoger does not let us discriminate between furnished and not
# furnished.
return POSTS_TYPES.RENT
return type
def obj_house_type(self):
idType = CleanText('idTypeBien')(self)
try:
return next(k for k, v in RET.items() if v == idType)
except StopIteration:
obj_title = Format(
"%s %s%s - %s",
CleanText('titre'),
CleanText('surface'),
CleanText('surfaceUnite'),
CleanText('ville'),
)
obj_cost = CleanDecimal('prix', default=NotLoaded)
obj_currency = Currency(Regexp(CleanText('prixUnite'), r'(\W).*', r'\1'))
obj_area = CleanDecimal('surface', default=NotLoaded)
obj_price_per_meter = PricePerMeterFilter()
obj_rooms = CleanDecimal('nbPiece|nbPieces', default=NotLoaded)
obj_bedrooms = CleanDecimal('nbChambre|nbChambres', default=NotLoaded)
def obj_location(self):
location = CleanText('adresse', default="")(self)
quartier = CleanText('quartier', default=None)(self)
if not location and quartier is not None:
location = quartier
ville = CleanText('ville')(self)
cp = CleanText('cp')(self)
return u'%s %s (%s)' % (location, ville, cp)
obj_station = CleanText('proximite', default=NotLoaded)
obj_url = CleanText('permaLien')
class SearchResultsPage(XMLPage):
@pagination
@method
class iter_housings(ListElement):
item_xpath = "//annonce"
def next_page(self):
page = CleanText('//pageSuivante', default=None, replace=[('http://ws.seloger.com/', '')])(self)
def condition(self):
if self.env['query_type'] == POSTS_TYPES.SALE:
# Ignore VIAGER
return CleanText('idTypeTransaction')(self) == '2'
return True
def validate(self, obj):
return (len(self.env['advert_types']) == 1 and
self.env['advert_types'][0] == obj.advert_type) or \
self.env['advert_types'] > 1
obj_type = Env('query_type')
def obj_advert_type(self):
is_agency = (
';' not in CleanText('contact/nom')(self)
)
if is_agency:
return ADVERT_TYPES.PROFESSIONAL
else:
return ADVERT_TYPES.PERSONAL
Bezleputh
committed
for photo in XPath('./photos/photo/stdUrl')(self):
photos.append(HousingPhoto(CleanText('.')(photo)))
def obj_utilities(self):
currency = CleanText('prixUnite')(self)
if "+ch" in currency:
return UTILITIES.EXCLUDED
elif "cc*" in currency:
return UTILITIES.INCLUDED
else:
return UTILITIES.UNKNOWN
class HousingPage(XMLPage):
@method
class get_housing(SeLogerItem):
def obj_photos(self):
photos = []
for photo in XPath('./photos/photo')(self):
url = CleanText('bigUrl', default=None)(photo)
if not url:
url = CleanText('stdUrl', default=None)(photo)
photos.append(HousingPhoto(url))
return photos
def obj_advert_type(self):
is_agency = (
CleanText('contact/rcsSiren')(self) or
CleanText('contact/rcsNic')(self) or
CleanText('contact/idAnnuaire')(self)
)
if is_agency:
return ADVERT_TYPES.PROFESSIONAL
else:
return ADVERT_TYPES.PERSONAL
def obj_DPE(self):
DPE = CleanText('//bilanConsoEnergie', default="")(self)
return getattr(ENERGY_CLASS, DPE, NotAvailable)
def obj_GES(self):
GES = CleanText('//bilanEmissionGES', default="")(self)
return getattr(ENERGY_CLASS, GES, NotAvailable)
def obj_details(self):
details = {}
for detail in XPath('//detailAnnonce/details/detail')(self):
details[CleanText('libelle')(detail)] = CleanText('valeur', default='N/A')(detail)
details['Reference'] = CleanText('//detailAnnonce/reference')(self)
return details
obj_phone = CleanText('//contact/telephone')
def obj_utilities(self):
mention = CleanText('prixMention')(self)
if "charges comprises" in mention:
return UTILITIES.INCLUDED
else:
Phyks (Lucas Verney)
committed
return UTILITIES.UNKNOWN