@ -27,6 +27,7 @@ from ..utils import (
get_element_by_id ,
get_element_by_id ,
get_element_by_attribute ,
get_element_by_attribute ,
ExtractorError ,
ExtractorError ,
PagedList ,
RegexNotFoundError ,
RegexNotFoundError ,
unescapeHTML ,
unescapeHTML ,
unified_strdate ,
unified_strdate ,
@ -1580,44 +1581,35 @@ class YoutubeUserIE(InfoExtractor):
# page by page until there are no video ids - it means we got
# page by page until there are no video ids - it means we got
# all of them.
# all of them.
url_results = [ ]
def download_page ( pagenum ) :
for pagenum in itertools . count ( 0 ) :
start_index = pagenum * self . _GDATA_PAGE_SIZE + 1
start_index = pagenum * self . _GDATA_PAGE_SIZE + 1
gdata_url = self . _GDATA_URL % ( username , self . _GDATA_PAGE_SIZE , start_index )
gdata_url = self . _GDATA_URL % ( username , self . _GDATA_PAGE_SIZE , start_index )
page = self . _download_webpage ( gdata_url , username ,
page = self . _download_webpage (
u ' Downloading video ids from %d to %d ' % ( start_index , start_index + self . _GDATA_PAGE_SIZE ) )
gdata_url , username ,
u ' Downloading video ids from %d to %d ' % (
start_index , start_index + self . _GDATA_PAGE_SIZE ) )
try :
try :
response = json . loads ( page )
response = json . loads ( page )
except ValueError as err :
except ValueError as err :
raise ExtractorError ( u ' Invalid JSON in API response: ' + compat_str ( err ) )
raise ExtractorError ( u ' Invalid JSON in API response: ' + compat_str ( err ) )
if ' entry ' not in response [ ' feed ' ] :
if ' entry ' not in response [ ' feed ' ] :
# Number of videos is a multiple of self._MAX_RESULTS
return
break
# Extract video identifiers
# Extract video identifiers
entries = response [ ' feed ' ] [ ' entry ' ]
entries = response [ ' feed ' ] [ ' entry ' ]
for entry in entries :
for entry in entries :
title = entry [ ' title ' ] [ ' $t ' ]
title = entry [ ' title ' ] [ ' $t ' ]
video_id = entry [ ' id ' ] [ ' $t ' ] . split ( ' / ' ) [ - 1 ]
video_id = entry [ ' id ' ] [ ' $t ' ] . split ( ' / ' ) [ - 1 ]
url_results . append ( {
yield {
' _type ' : ' url ' ,
' _type ' : ' url ' ,
' url ' : video_id ,
' url ' : video_id ,
' ie_key ' : ' Youtube ' ,
' ie_key ' : ' Youtube ' ,
' id ' : ' video_id ' ,
' id ' : ' video_id ' ,
' title ' : title ,
' title ' : title ,
} )
}
url_results = PagedList ( download_page , self . _GDATA_PAGE_SIZE )
# A little optimization - if current page is not
# "full", ie. does not contain PAGE_SIZE video ids then
# we can assume that this page is the last one - there
# are no more ids on further pages - no need to query
# again.
if len ( entries ) < self . _GDATA_PAGE_SIZE :
break
return self . playlist_result ( url_results , playlist_title = username )
return self . playlist_result ( url_results , playlist_title = username )