Skip to content

Commit

Permalink
[foxnews] Add support for iframe embeds (closes #15810, closes #16711)
Browse files Browse the repository at this point in the history
  • Loading branch information
dstftw committed Jun 20, 2018
1 parent c9b983f commit f51f526
Show file tree
Hide file tree
Showing 2 changed files with 41 additions and 7 deletions.
42 changes: 35 additions & 7 deletions youtube_dl/extractor/foxnews.py
Expand Up @@ -58,6 +58,14 @@ class FoxNewsIE(AMPIE):
},
]

@staticmethod
def _extract_urls(webpage):
return [
mobj.group('url')
for mobj in re.finditer(
r'<(?:amp-)?iframe[^>]+\bsrc=(["\'])(?P<url>(?:https?:)?//video\.foxnews\.com/v/video-embed\.html?.*?\bvideo_id=\d+.*?)\1',
webpage)]

def _real_extract(self, url):
host, video_id = re.match(self._VALID_URL, url).groups()

Expand All @@ -71,29 +79,49 @@ class FoxNewsArticleIE(InfoExtractor):
_VALID_URL = r'https?://(?:www\.)?foxnews\.com/(?!v)([^/]+/)+(?P<id>[a-z-]+)'
IE_NAME = 'foxnews:article'

_TEST = {
_TESTS = [{
# data-video-id
'url': 'http://www.foxnews.com/politics/2016/09/08/buzz-about-bud-clinton-camp-denies-claims-wore-earpiece-at-forum.html',
'md5': '62aa5a781b308fdee212ebb6f33ae7ef',
'md5': '83d44e1aff1433e7a29a7b537d1700b5',
'info_dict': {
'id': '5116295019001',
'ext': 'mp4',
'title': 'Trump and Clinton asked to defend positions on Iraq War',
'description': 'Veterans react on \'The Kelly File\'',
'timestamp': 1473299755,
'timestamp': 1473301045,
'upload_date': '20160908',
},
}
}, {
# iframe embed
'url': 'http://www.foxnews.com/us/2018/03/09/parkland-survivor-kyle-kashuv-on-meeting-trump-his-app-to-prevent-another-school-shooting.amp.html?__twitter_impression=true',
'info_dict': {
'id': '5748266721001',
'ext': 'flv',
'title': 'Kyle Kashuv has a positive message for the Trump White House',
'description': 'Marjory Stoneman Douglas student disagrees with classmates.',
'thumbnail': r're:^https?://.*\.jpg$',
'duration': 229,
'timestamp': 1520594670,
'upload_date': '20180309',
},
'params': {
'skip_download': True,
},
}]

def _real_extract(self, url):
display_id = self._match_id(url)
webpage = self._download_webpage(url, display_id)

video_id = self._html_search_regex(
r'data-video-id=([\'"])(?P<id>[^\'"]+)\1',
webpage, 'video ID', group='id')
webpage, 'video ID', group='id', default=None)
if video_id:
return self.url_result(
'http://video.foxnews.com/v/' + video_id, FoxNewsIE.ie_key())

return self.url_result(
'http://video.foxnews.com/v/' + video_id,
FoxNewsIE.ie_key())
FoxNewsIE._extract_urls(webpage)[0], FoxNewsIE.ie_key())


class FoxNewsInsiderIE(InfoExtractor):
Expand Down
6 changes: 6 additions & 0 deletions youtube_dl/extractor/generic.py
Expand Up @@ -111,6 +111,7 @@
from .peertube import PeerTubeIE
from .indavideo import IndavideoEmbedIE
from .apa import APAIE
from .foxnews import FoxNewsIE


class GenericIE(InfoExtractor):
Expand Down Expand Up @@ -3091,6 +3092,11 @@ def _real_extract(self, url):
return self.playlist_from_matches(
apa_urls, video_id, video_title, ie=APAIE.ie_key())

foxnews_urls = FoxNewsIE._extract_urls(webpage)
if foxnews_urls:
return self.playlist_from_matches(
foxnews_urls, video_id, video_title, ie=FoxNewsIE.ie_key())

sharevideos_urls = [mobj.group('url') for mobj in re.finditer(
r'<iframe[^>]+?\bsrc\s*=\s*(["\'])(?P<url>(?:https?:)?//embed\.share-videos\.se/auto/embed/\d+\?.*?\buid=\d+.*?)\1',
webpage)]
Expand Down

0 comments on commit f51f526

Please sign in to comment.