Newer
Older
# Copyright(C) 2010-2012 Nicolas Duhamel, Laurent Bachelier
# weboob is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# weboob is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU Affero General Public License for more details.
# You should have received a copy of the GNU Affero General Public License
# along with weboob. If not, see <http://www.gnu.org/licenses/>.
Christophe Benz
committed
import lxml.etree
from weboob.tools.browser.decorators import id2url
from .pages import ChannelsPage, VideoPage
from .video import CanalplusVideo
from weboob.capabilities.collection import CollectionNotFound
Christophe Benz
committed
__all__ = ['CanalplusBrowser']
class XMLParser(object):
    """Parser that builds an lxml element tree from a response body."""

    def parse(self, data, encoding=None):
        """Parse the XML document carried by *data*.

        :param data: object exposing ``get_data()``, whose result is handed
                     to ``lxml.etree.XML``
        :param encoding: optional encoding name; when given, a dedicated
                         ``lxml.etree.XMLParser`` is built for that encoding
                         with ``strip_cdata=False``
        :return: the value returned by ``lxml.etree.XML``
        """
        # Passing None as the parser lets lxml fall back to its default one.
        xml_parser = None
        if encoding is not None:
            xml_parser = lxml.etree.XMLParser(encoding=encoding, strip_cdata=False)
        return lxml.etree.XML(data.get_data(), xml_parser)
DOMAIN = u'service.canal-plus.com'
ENCODING = 'utf-8'
Christophe Benz
committed
PAGES = {
r'http://service.canal-plus.com/video/rest/initPlayer/cplus/': ChannelsPage,
Christophe Benz
committed
r'http://service.canal-plus.com/video/rest/search/cplus/.*': VideoPage,
r'http://service.canal-plus.com/video/rest/getVideosLiees/cplus/(?P<id>.+)': VideoPage,
r'http://service.canal-plus.com/video/rest/getMEAs/cplus/.*': VideoPage,
Christophe Benz
committed
}
Christophe Benz
committed
FORMATS = {
Christophe Benz
committed
}
Browser.__init__(self, parser=self.PARSER, *args, **kwargs)
self.quality = self.FORMATS.get(quality, self.FORMATS['hd'])
Christophe Benz
committed
self.location('http://service.canal-plus.com/video/rest/initPlayer/cplus/')
Romain Bignon
committed
def search_videos(self, pattern):
    """Point the browser at the Canal+ search endpoint for *pattern*.

    Slashes are removed from the pattern; the remainder is encoded as UTF-8
    and escaped with ``urllib.quote_plus`` before being appended to the
    search URL.

    :param pattern: search terms (a text string providing ``replace`` and
                    ``encode``)
    """
    search_root = 'http://service.canal-plus.com/video/rest/search/cplus/'
    # A '/' in the query would add an extra path segment to the REST URL.
    query = pattern.replace('/', '').encode('utf-8')
    self.location(search_root + urllib.quote_plus(query))
@id2url(CanalplusVideo.id2url)
def get_video(self, url, video=None):
    """Load *url* and resolve the final stream URL of *video*.

    The current ``video.url`` is fetched through ``read_url`` and the entry
    selected by ``self.quality`` becomes the new ``video.url``.

    :param url: page to load before resolving the stream
    :param video: video object whose ``url`` attribute is rewritten
    :return: the same *video* object, with ``url`` updated
    """
    self.location(url)
    # NOTE(review): ``video`` defaults to None but is dereferenced
    # unconditionally below -- confirm whether a step that builds the video
    # from the loaded page is missing here.
    candidates = self.read_url(video.url)
    chosen = candidates[self.quality]
    video.url = u'%s' % chosen
    return video
def read_url(self, url):
    """Download *url* and return its lines, skipping '#' comment lines.

    :param url: address of the resource to read line by line
    :return: list of the lines that do not start with ``'#'``, in the order
             they were received
    """
    r = requests.get(url, stream=True)
    try:
        # iter_lines() is lazy: the body is only pulled from the socket while
        # the generator is being consumed, so the list must be fully built
        # *before* the response is closed.
        return [line for line in r.iter_lines() if not line.startswith('#')]
    finally:
        # Always release the connection, even if reading fails midway.
        r.close()
Romain Bignon
committed
def iter_resources(self, split_path):
    """Iterate over the resources found under *split_path*.

    * empty path: yields the channels whose ``path_level`` is 1;
    * one element: yields the channels whose ``path_level`` is 2 and whose
      ``parent_path`` equals *split_path*;
    * two elements: finds the matching sub-channel, loads its ``getMEAs``
      page and yields the videos returned by ``iter_channel()``.

    :param split_path: list of path components identifying the collection
    :raises CollectionNotFound: when the path is deeper than two elements or
        no sub-channel matches a two-element path (raised while iterating,
        since this is a generator)
    """
    if not self.is_on_page(ChannelsPage):
        self.home()
    channels = self.page.get_channels()

    depth = len(split_path)
    if depth == 0:
        for channel in channels:
            if channel.path_level == 1:
                yield channel
    elif depth == 1:
        for channel in channels:
            if channel.path_level == 2 and split_path == channel.parent_path:
                yield channel
    elif depth == 2:
        # Look the sub-channel up among the children of the first component.
        matches = [subchannel
                   for subchannel in self.iter_resources(split_path[0:1])
                   if split_path == subchannel.split_path]
        # Only a failed lookup means "not found"; keeping this check apart
        # from the video listing avoids masking errors raised while the
        # videos are being fetched, and avoids raising after a successful
        # listing.
        if not matches:
            raise CollectionNotFound(split_path)
        channel = matches[0]

        self.location("http://service.canal-plus.com/video/rest/getMEAs/cplus/%s" % channel._link_id)
        assert self.is_on_page(VideoPage)
        for video in self.page.iter_channel():
            yield video
    else:
        raise CollectionNotFound(split_path)