From c533c89ce1d6965d8575413738d76a5bf9e2de59 Mon Sep 17 00:00:00 2001 From: pukkandan Date: Mon, 31 Jan 2022 12:32:44 +0530 Subject: [PATCH] [GoogleSearch] Fix extractor --- yt_dlp/extractor/googlesearch.py | 21 +++++++++------------ 1 file changed, 9 insertions(+), 12 deletions(-) diff --git a/yt_dlp/extractor/googlesearch.py b/yt_dlp/extractor/googlesearch.py index f605c0c35f..4b8b1bcbb8 100644 --- a/yt_dlp/extractor/googlesearch.py +++ b/yt_dlp/extractor/googlesearch.py @@ -8,36 +8,33 @@ class GoogleSearchIE(SearchInfoExtractor): IE_DESC = 'Google Video search' - _MAX_RESULTS = 1000 IE_NAME = 'video.google:search' _SEARCH_KEY = 'gvsearch' - _WORKING = False - _TEST = { + _TESTS = [{ 'url': 'gvsearch15:python language', 'info_dict': { 'id': 'python language', 'title': 'python language', }, 'playlist_count': 15, - } + }] + _PAGE_SIZE = 100 def _search_results(self, query): for pagenum in itertools.count(): webpage = self._download_webpage( - 'http://www.google.com/search', - 'gvsearch:' + query, - note='Downloading result page %s' % (pagenum + 1), + 'http://www.google.com/search', f'gvsearch:{query}', + note=f'Downloading result page {pagenum + 1}', query={ 'tbm': 'vid', 'q': query, - 'start': pagenum * 10, + 'start': pagenum * self._PAGE_SIZE, + 'num': self._PAGE_SIZE, 'hl': 'en', }) - for hit_idx, mobj in enumerate(re.finditer( - r'

]* class="dXiKIc"[^>]*>