from __future__ import unicode_literals import re from .common import InfoExtractor from ..utils import ( int_or_none, ) class ServingSysIE(InfoExtractor): _VALID_URL = r'https?://(?:[^.]+\.)?serving-sys\.com/BurstingPipe/adServer\.bs\?.*?&pli=(?P<id>[0-9]+)' _TEST = { 'url': 'http://bs.serving-sys.com/BurstingPipe/adServer.bs?cn=is&c=23&pl=VAST&pli=5349193&PluID=0&pos=7135&ord=[timestamp]&cim=1?', 'playlist': [{ 'file': '29955898.flv', 'md5': 'baed851342df6846eb8677a60a011a0f', 'info_dict': { 'title': 'AdAPPter_Hyundai_demo (1)', 'duration': 74, 'tbr': 1378, 'width': 640, 'height': 400, }, }, { 'file': '29907998.flv', 'md5': '979b4da2655c4bc2d81aeb915a8c5014', 'info_dict': { 'title': 'AdAPPter_Hyundai_demo (2)', 'duration': 34, 'width': 854, 'height': 480, 'tbr': 516, }, }], 'params': { 'playlistend': 2, } } def _real_extract(self, url): mobj = re.match(self._VALID_URL, url) pl_id = mobj.group('id') vast_doc = self._download_xml(url, pl_id) title = vast_doc.find('.//AdTitle').text media = vast_doc.find('.//MediaFile').text info_url = self._search_regex(r'&adData=([^&]+)&', media, 'info URL') doc = self._download_xml(info_url, pl_id, 'Downloading video info') entries = [{ '_type': 'video', 'id': a.attrib['id'], 'title': '%s (%s)' % (title, a.attrib['assetID']), 'url': a.attrib['URL'], 'duration': int_or_none(a.attrib.get('length')), 'tbr': int_or_none(a.attrib.get('bitrate')), 'height': int_or_none(a.attrib.get('height')), 'width': int_or_none(a.attrib.get('width')), } for a in doc.findall('.//AdditionalAssets/asset')] return { '_type': 'playlist', 'id': pl_id, 'title': title, 'entries': entries, }