[GorillaVid] Added GorillaVid extractor

pull/2/head
marcwebbie 11 years ago
parent 814d4257df
commit 617c0b2239

@ -109,6 +109,7 @@ from .gdcvault import GDCVaultIE
from .generic import GenericIE from .generic import GenericIE
from .googleplus import GooglePlusIE from .googleplus import GooglePlusIE
from .googlesearch import GoogleSearchIE from .googlesearch import GoogleSearchIE
from .gorillavid import GorillaVidIE
from .hark import HarkIE from .hark import HarkIE
from .helsinki import HelsinkiIE from .helsinki import HelsinkiIE
from .hentaistigma import HentaiStigmaIE from .hentaistigma import HentaiStigmaIE

@ -0,0 +1,38 @@
# coding: utf-8
from __future__ import unicode_literals
import re
from .common import InfoExtractor
class GorillaVidIE(InfoExtractor):
_VALID_URL = r'https?://(?:www.)?gorillavid.in/(?:embed-)?(?P<id>\w+)(?:\-\d+x\d+)?.html'
_TEST = {
'url': "http://gorillavid.in/kdk7i5r1p5ye.html",
'md5': '5a01b05ed3da82a10c6659e954b80108',
'info_dict': {
'id': 'kdk7i5r1p5ye',
'ext': 'flv',
'title': 'Full House 1x16 - But Seriously, Folks.avi',
}
}
def _real_extract(self, url):
mobj = re.match(self._VALID_URL, url)
video_id = mobj.group('id')
webpage = self._download_webpage(url, video_id)
title = self._html_search_regex(r"name=['\"]fname['\"]\s+value=['\"](.*?)['\"]", webpage, u"video title")
# download embed page again with cookies to get url
embed_url = "http://gorillavid.in/embed-{0}-960x480.html".format(video_id)
webpage = self._download_webpage(embed_url, video_id, note=u'Downloading webpage again (with cookie)')
url = self._html_search_regex(r'file:\s+["\'](http://.*?video.\w{3})["\']', webpage, url)
info_dict = {
'id': video_id,
'title': title,
'url': url,
}
return info_dict
Loading…
Cancel
Save