From 3e87c8eec86c03c9a69ca9784a7e737ce4c26300 Mon Sep 17 00:00:00 2001
From: Avichai Cohen <cavichai@videocites.com>
Date: Wed, 23 Oct 2019 11:06:31 +0300
Subject: [PATCH 01/46] Merge branch 'master' of
 https://github.com/ytdl-org/youtube-dl into ytdl-org-master

# Conflicts:
#	youtube_dl/extractor/facebook.py
---
 youtube_dl/extractor/ceskatelevize.py |  2 ++
 youtube_dl/extractor/facebook.py      |  7 ++++++-
 youtube_dl/extractor/globo.py         | 24 +++++++++++++++---------
 3 files changed, 23 insertions(+), 10 deletions(-)

diff --git a/youtube_dl/extractor/ceskatelevize.py b/youtube_dl/extractor/ceskatelevize.py
index 1ec58f7d8..7cb4efb74 100644
--- a/youtube_dl/extractor/ceskatelevize.py
+++ b/youtube_dl/extractor/ceskatelevize.py
@@ -147,6 +147,8 @@ class CeskaTelevizeIE(InfoExtractor):
                 is_live = item.get('type') == 'LIVE'
                 formats = []
                 for format_id, stream_url in item.get('streamUrls', {}).items():
+                    if 'drmOnly=true' in stream_url:
+                        continue
                     if 'playerType=flash' in stream_url:
                         stream_formats = self._extract_m3u8_formats(
                             stream_url, playlist_id, 'mp4', 'm3u8_native',
diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index fff42255e..b205fa276 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -397,6 +397,7 @@ class FacebookIE(InfoExtractor):
 
         is_live = live_status == 'live'
 
+        subtitles = {}
         formats = []
         for f in video_data:
             format_id = f['stream_type']
@@ -420,6 +421,9 @@ class FacebookIE(InfoExtractor):
             if dash_manifest:
                 formats.extend(self._parse_mpd_formats(
                     compat_etree_fromstring(compat_urllib_parse_unquote_plus(dash_manifest))))
+            subtitles_src = f[0].get('subtitles_src')
+            if subtitles_src:
+                subtitles.setdefault('en', []).append({'url': subtitles_src})
         if not formats:
             raise ExtractorError('Cannot find video formats')
 
@@ -492,7 +496,8 @@ class FacebookIE(InfoExtractor):
             'is_live': is_live,
             'live_status': live_status,
             'like_count': likes_count,
-            'share_count': shares_count
+            'share_count': shares_count,
+            'subtitles': subtitles,
         }
         if uploader_id:
             info_dict['uploader_like_count'] = FacebookAjax(self, webpage, uploader_id).page_likes
diff --git a/youtube_dl/extractor/globo.py b/youtube_dl/extractor/globo.py
index 9ad1d95fb..60d842d3a 100644
--- a/youtube_dl/extractor/globo.py
+++ b/youtube_dl/extractor/globo.py
@@ -132,18 +132,24 @@ class GloboIE(InfoExtractor):
                         '%s returned error: %s' % (self.IE_NAME, message), expected=True)
                 continue
 
-            assert security_hash[:2] in ('04', '14')
-            received_time = security_hash[3:13]
-            received_md5 = security_hash[24:]
-
-            sign_time = compat_str(int(received_time) + 86400)
+            hash_code = security_hash[:2]
             padding = '%010d' % random.randint(1, 10000000000)
-
-            md5_data = (received_md5 + sign_time + padding + '0xAC10FD').encode()
+            if hash_code in ('04', '14'):
+                received_time = security_hash[3:13]
+                received_md5 = security_hash[24:]
+                hash_prefix = security_hash[:23]
+            elif hash_code in ('02', '12', '03', '13'):
+                received_time = security_hash[2:12]
+                received_md5 = security_hash[22:]
+                padding += '1'
+                hash_prefix = '05' + security_hash[:22]
+
+            padded_sign_time = compat_str(int(received_time) + 86400) + padding
+            md5_data = (received_md5 + padded_sign_time + '0xAC10FD').encode()
             signed_md5 = base64.urlsafe_b64encode(hashlib.md5(md5_data).digest()).decode().strip('=')
-            signed_hash = security_hash[:23] + sign_time + padding + signed_md5
-
+            signed_hash = hash_prefix + padded_sign_time + signed_md5
             signed_url = '%s?h=%s&k=html5&a=%s&u=%s' % (resource_url, signed_hash, 'F' if video.get('subscriber_only') else 'A', security.get('user') or '')
+
             if resource_id.endswith('m3u8') or resource_url.endswith('.m3u8'):
                 formats.extend(self._extract_m3u8_formats(
                     signed_url, resource_id, 'mp4', entry_protocol='m3u8_native',

From a96eb0b5cdf2971b2d137b115da1d947f3416969 Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Sun, 27 Oct 2019 14:35:17 +0200
Subject: [PATCH 02/46] Update dplay, discoverynetworks, generic, odnoklassniki and vk extractors

---
 youtube_dl/extractor/discoverynetworks.py |  63 ++--
 youtube_dl/extractor/dplay.py             | 397 +++++++---------------
 youtube_dl/extractor/extractors.py        |   5 +-
 youtube_dl/extractor/generic.py           |   7 +-
 youtube_dl/extractor/odnoklassniki.py     |   9 +
 youtube_dl/extractor/vk.py                | 342 ++++++++++---------
 6 files changed, 337 insertions(+), 486 deletions(-)

diff --git a/youtube_dl/extractor/discoverynetworks.py b/youtube_dl/extractor/discoverynetworks.py
index fba1ef221..607a54948 100644
--- a/youtube_dl/extractor/discoverynetworks.py
+++ b/youtube_dl/extractor/discoverynetworks.py
@@ -3,63 +3,38 @@ from __future__ import unicode_literals
 
 import re
 
-from .brightcove import BrightcoveLegacyIE
 from .dplay import DPlayIE
-from ..compat import (
-    compat_parse_qs,
-    compat_urlparse,
-)
-from ..utils import smuggle_url
 
 
 class DiscoveryNetworksDeIE(DPlayIE):
-    _VALID_URL = r'''(?x)https?://(?:www\.)?(?P<site>discovery|tlc|animalplanet|dmax)\.de/
-                        (?:
-                           .*\#(?P<id>\d+)|
-                           (?:[^/]+/)*videos/(?P<display_id>[^/?#]+)|
-                           programme/(?P<programme>[^/]+)/video/(?P<alternate_id>[^/]+)
-                        )'''
+    _VALID_URL = r'https?://(?:www\.)?(?P<domain>(?:tlc|dmax)\.de|dplay\.co\.uk)/(?:programme|show)/(?P<programme>[^/]+)/video/(?P<alternate_id>[^/]+)'
 
     _TESTS = [{
-        'url': 'http://www.tlc.de/sendungen/breaking-amish/videos/#3235167922001',
+        'url': 'https://www.tlc.de/programme/breaking-amish/video/die-welt-da-drauen/DCB331270001100',
         'info_dict': {
-            'id': '3235167922001',
+            'id': '78867',
             'ext': 'mp4',
-            'title': 'Breaking Amish: Die Welt da draußen',
-            'description': (
-                'Vier Amische und eine Mennonitin wagen in New York'
-                '  den Sprung in ein komplett anderes Leben. Begleitet sie auf'
-                ' ihrem spannenden Weg.'),
-            'timestamp': 1396598084,
-            'upload_date': '20140404',
-            'uploader_id': '1659832546',
+            'title': 'Die Welt da draußen',
+            'description': 'md5:61033c12b73286e409d99a41742ef608',
+            'timestamp': 1554069600,
+            'upload_date': '20190331',
+        },
+        'params': {
+            'format': 'bestvideo',
+            'skip_download': True,
         },
     }, {
-        'url': 'http://www.dmax.de/programme/storage-hunters-uk/videos/storage-hunters-uk-episode-6/',
+        'url': 'https://www.dmax.de/programme/dmax-highlights/video/tuning-star-sidney-hoffmann-exklusiv-bei-dmax/191023082312316',
         'only_matching': True,
     }, {
-        'url': 'http://www.discovery.de/#5332316765001',
+        'url': 'https://www.dplay.co.uk/show/ghost-adventures/video/hotel-leger-103620/EHD_280313B',
         'only_matching': True,
     }]
-    BRIGHTCOVE_URL_TEMPLATE = 'http://players.brightcove.net/1659832546/default_default/index.html?videoId=%s'
 
     def _real_extract(self, url):
-        mobj = re.match(self._VALID_URL, url)
-        alternate_id = mobj.group('alternate_id')
-        if alternate_id:
-            self._initialize_geo_bypass({
-                'countries': ['DE'],
-            })
-            return self._get_disco_api_info(
-                url, '%s/%s' % (mobj.group('programme'), alternate_id),
-                'sonic-eu1-prod.disco-api.com', mobj.group('site') + 'de')
-        brightcove_id = mobj.group('id')
-        if not brightcove_id:
-            title = mobj.group('title')
-            webpage = self._download_webpage(url, title)
-            brightcove_legacy_url = BrightcoveLegacyIE._extract_brightcove_url(webpage)
-            brightcove_id = compat_parse_qs(compat_urlparse.urlparse(
-                brightcove_legacy_url).query)['@videoPlayer'][0]
-        return self.url_result(smuggle_url(
-            self.BRIGHTCOVE_URL_TEMPLATE % brightcove_id, {'geo_countries': ['DE']}),
-            'BrightcoveNew', brightcove_id)
+        mobj = re.match(self._VALID_URL, url)
+        domain, programme, alternate_id = mobj.group('domain', 'programme', 'alternate_id')
+        is_uk = domain == 'dplay.co.uk'  # the remaining domains accepted by _VALID_URL are German (.de)
+        return self._get_disco_api_info(
+            url, '%s/%s' % (programme, alternate_id), 'sonic-eu1-prod.disco-api.com',
+            'questuk' if is_uk else domain.replace('.', ''), 'GB' if is_uk else 'DE')
diff --git a/youtube_dl/extractor/dplay.py b/youtube_dl/extractor/dplay.py
index ebf59512c..d9c3d59cd 100644
--- a/youtube_dl/extractor/dplay.py
+++ b/youtube_dl/extractor/dplay.py
@@ -1,74 +1,68 @@
 # coding: utf-8
 from __future__ import unicode_literals
 
-import json
 import re
-import time
 
 from .common import InfoExtractor
-from ..compat import (
-    compat_HTTPError,
-    compat_str,
-    compat_urlparse,
-)
+from ..compat import compat_HTTPError
 from ..utils import (
     determine_ext,
     ExtractorError,
     float_or_none,
     int_or_none,
-    remove_end,
-    try_get,
-    unified_strdate,
     unified_timestamp,
-    update_url_query,
-    urljoin,
-    USER_AGENTS,
 )
 
 
 class DPlayIE(InfoExtractor):
-    _VALID_URL = r'https?://(?P<domain>www\.(?P<host>dplay\.(?P<country>dk|se|no)))/(?:video(?:er|s)/)?(?P<id>[^/]+/[^/?#]+)'
+    _VALID_URL = r'''(?x)https?://
+        (?P<domain>
+            (?:www\.)?(?P<host>dplay\.(?P<country>dk|fi|jp|se|no))|
+            (?P<subdomain_country>es|it)\.dplay\.com
+        )/[^/]+/(?P<id>[^/]+/[^/?#]+)'''
 
     _TESTS = [{
         # non geo restricted, via secure api, unsigned download hls URL
-        'url': 'http://www.dplay.se/nugammalt-77-handelser-som-format-sverige/season-1-svensken-lar-sig-njuta-av-livet/',
+        'url': 'https://www.dplay.se/videos/nugammalt-77-handelser-som-format-sverige/nugammalt-77-handelser-som-format-sverige-101',
         'info_dict': {
-            'id': '3172',
-            'display_id': 'nugammalt-77-handelser-som-format-sverige/season-1-svensken-lar-sig-njuta-av-livet',
+            'id': '13628',
+            'display_id': 'nugammalt-77-handelser-som-format-sverige/nugammalt-77-handelser-som-format-sverige-101',
             'ext': 'mp4',
             'title': 'Svensken lär sig njuta av livet',
             'description': 'md5:d3819c9bccffd0fe458ca42451dd50d8',
-            'duration': 2650,
-            'timestamp': 1365454320,
+            'duration': 2649.856,
+            'timestamp': 1365453720,
             'upload_date': '20130408',
-            'creator': 'Kanal 5 (Home)',
+            'creator': 'Kanal 5',
             'series': 'Nugammalt - 77 händelser som format Sverige',
             'season_number': 1,
             'episode_number': 1,
-            'age_limit': 0,
+        },
+        'params': {
+            'format': 'bestvideo',
+            'skip_download': True,
         },
     }, {
         # geo restricted, via secure api, unsigned download hls URL
-        'url': 'http://www.dplay.dk/mig-og-min-mor/season-6-episode-12/',
+        'url': 'http://www.dplay.dk/videoer/ted-bundy-mind-of-a-monster/ted-bundy-mind-of-a-monster',
         'info_dict': {
-            'id': '70816',
-            'display_id': 'mig-og-min-mor/season-6-episode-12',
+            'id': '104465',
+            'display_id': 'ted-bundy-mind-of-a-monster/ted-bundy-mind-of-a-monster',
             'ext': 'mp4',
-            'title': 'Episode 12',
-            'description': 'md5:9c86e51a93f8a4401fc9641ef9894c90',
-            'duration': 2563,
-            'timestamp': 1429696800,
-            'upload_date': '20150422',
-            'creator': 'Kanal 4 (Home)',
-            'series': 'Mig og min mor',
-            'season_number': 6,
-            'episode_number': 12,
-            'age_limit': 0,
+            'title': 'Ted Bundy: Mind Of A Monster',
+            'description': 'md5:8b780f6f18de4dae631668b8a9637995',
+            'duration': 5290.027,
+            'timestamp': 1570694400,
+            'upload_date': '20191010',
+            'creator': 'ID - Investigation Discovery',
+            'series': 'Ted Bundy: Mind Of A Monster',
+            'season_number': 1,
+            'episode_number': 1,
+        },
+        'params': {
+            'format': 'bestvideo',
+            'skip_download': True,
         },
-    }, {
-        # geo restricted, via direct unsigned hls URL
-        'url': 'http://www.dplay.no/pga-tour/season-1-hoydepunkter-18-21-februar/',
-        'only_matching': True,
     }, {
         # disco-api
         'url': 'https://www.dplay.no/videoer/i-kongens-klr/sesong-1-episode-7',
@@ -89,19 +83,59 @@ class DPlayIE(InfoExtractor):
             'format': 'bestvideo',
             'skip_download': True,
         },
+        'skip': 'Available for Premium users',
     }, {
-
-        'url': 'https://www.dplay.dk/videoer/singleliv/season-5-episode-3',
+        'url': 'http://it.dplay.com/nove/biografie-imbarazzanti/luigi-di-maio-la-psicosi-di-stanislawskij/',
+        'md5': '2b808ffb00fc47b884a172ca5d13053c',
+        'info_dict': {
+            'id': '6918',
+            'display_id': 'biografie-imbarazzanti/luigi-di-maio-la-psicosi-di-stanislawskij',
+            'ext': 'mp4',
+            'title': 'Luigi Di Maio: la psicosi di Stanislawskij',
+            'description': 'md5:3c7a4303aef85868f867a26f5cc14813',
+            'thumbnail': r're:^https?://.*\.jpe?g',
+            'upload_date': '20160524',
+            'timestamp': 1464076800,
+            'series': 'Biografie imbarazzanti',
+            'season_number': 1,
+            'episode': 'Episode 1',
+            'episode_number': 1,
+        },
+    }, {
+        'url': 'https://es.dplay.com/dmax/la-fiebre-del-oro/temporada-8-episodio-1/',
+        'info_dict': {
+            'id': '21652',
+            'display_id': 'la-fiebre-del-oro/temporada-8-episodio-1',
+            'ext': 'mp4',
+            'title': 'Episodio 1',
+            'description': 'md5:b9dcff2071086e003737485210675f69',
+            'thumbnail': r're:^https?://.*\.png',
+            'upload_date': '20180709',
+            'timestamp': 1531173540,
+            'series': 'La fiebre del oro',
+            'season_number': 8,
+            'episode': 'Episode 1',
+            'episode_number': 1,
+        },
+        'params': {
+            'skip_download': True,
+        },
+    }, {
+        'url': 'https://www.dplay.fi/videot/shifting-gears-with-aaron-kaufman/episode-16',
         'only_matching': True,
     }, {
-        'url': 'https://www.dplay.se/videos/sofias-anglar/sofias-anglar-1001',
+        'url': 'https://www.dplay.jp/video/gold-rush/24086',
         'only_matching': True,
     }]
 
-    def _get_disco_api_info(self, url, display_id, disco_host, realm):
-        disco_base = 'https://' + disco_host
+    def _get_disco_api_info(self, url, display_id, disco_host, realm, country):
+        geo_countries = [country.upper()]
+        self._initialize_geo_bypass({
+            'countries': geo_countries,
+        })
+        disco_base = 'https://%s/' % disco_host
         token = self._download_json(
-            '%s/token' % disco_base, display_id, 'Downloading token',
+            disco_base + 'token', display_id, 'Downloading token',
             query={
                 'realm': realm,
             })['data']['attributes']['token']
@@ -110,17 +144,30 @@ class DPlayIE(InfoExtractor):
             'Authorization': 'Bearer ' + token,
         }
         video = self._download_json(
-            '%s/content/videos/%s' % (disco_base, display_id), display_id,
+            disco_base + 'content/videos/' + display_id, display_id,
             headers=headers, query={
-                'include': 'show'
+                'include': 'images,primaryChannel,show,tags'
             })
         video_id = video['data']['id']
         info = video['data']['attributes']
-        title = info['name']
+        title = info['name'].strip()
         formats = []
-        for format_id, format_dict in self._download_json(
-                '%s/playback/videoPlaybackInfo/%s' % (disco_base, video_id),
-                display_id, headers=headers)['data']['attributes']['streaming'].items():
+        try:
+            streaming = self._download_json(
+                disco_base + 'playback/videoPlaybackInfo/' + video_id,
+                display_id, headers=headers)['data']['attributes']['streaming']
+        except ExtractorError as e:
+            if isinstance(e.cause, compat_HTTPError) and e.cause.code == 403:
+                info = self._parse_json(e.cause.read().decode('utf-8'), display_id)
+                error = info['errors'][0]
+                error_code = error.get('code')
+                if error_code == 'access.denied.geoblocked':
+                    self.raise_geo_restricted(countries=geo_countries)
+                elif error_code == 'access.denied.missingpackage':
+                    self.raise_login_required()
+                raise ExtractorError(info['errors'][0]['detail'], expected=True)
+            raise
+        for format_id, format_dict in streaming.items():
             if not isinstance(format_dict, dict):
                 continue
             format_url = format_dict.get('url')
@@ -142,235 +189,55 @@ class DPlayIE(InfoExtractor):
                 })
         self._sort_formats(formats)
 
-        series = None
-        try:
-            included = video.get('included')
-            if isinstance(included, list):
-                show = next(e for e in included if e.get('type') == 'show')
-                series = try_get(
-                    show, lambda x: x['attributes']['name'], compat_str)
-        except StopIteration:
-            pass
+        creator = series = None
+        tags = []
+        thumbnails = []
+        included = video.get('included') or []
+        if isinstance(included, list):
+            for e in included:
+                attributes = e.get('attributes')
+                if not attributes:
+                    continue
+                e_type = e.get('type')
+                if e_type == 'channel':
+                    creator = attributes.get('name')
+                elif e_type == 'image':
+                    src = attributes.get('src')
+                    if src:
+                        thumbnails.append({
+                            'url': src,
+                            'width': int_or_none(attributes.get('width')),
+                            'height': int_or_none(attributes.get('height')),
+                        })
+                if e_type == 'show':
+                    series = attributes.get('name')
+                elif e_type == 'tag':
+                    name = attributes.get('name')
+                    if name:
+                        tags.append(name)
 
         return {
             'id': video_id,
             'display_id': display_id,
             'title': title,
             'description': info.get('description'),
-            'duration': float_or_none(
-                info.get('videoDuration'), scale=1000),
+            'duration': float_or_none(info.get('videoDuration'), 1000),
             'timestamp': unified_timestamp(info.get('publishStart')),
             'series': series,
             'season_number': int_or_none(info.get('seasonNumber')),
             'episode_number': int_or_none(info.get('episodeNumber')),
             'age_limit': int_or_none(info.get('minimum_age')),
+            'creator': creator,
+            'tags': tags,
+            'thumbnails': thumbnails,
             'formats': formats,
         }
 
     def _real_extract(self, url):
         mobj = re.match(self._VALID_URL, url)
         display_id = mobj.group('id')
-        domain = mobj.group('domain')
-
-        self._initialize_geo_bypass({
-            'countries': [mobj.group('country').upper()],
-        })
-
-        webpage = self._download_webpage(url, display_id)
-
-        video_id = self._search_regex(
-            r'data-video-id=["\'](\d+)', webpage, 'video id', default=None)
-
-        if not video_id:
-            host = mobj.group('host')
-            return self._get_disco_api_info(
-                url, display_id, 'disco-api.' + host, host.replace('.', ''))
-
-        info = self._download_json(
-            'http://%s/api/v2/ajax/videos?video_id=%s' % (domain, video_id),
-            video_id)['data'][0]
-
-        title = info['title']
-
-        PROTOCOLS = ('hls', 'hds')
-        formats = []
-
-        def extract_formats(protocol, manifest_url):
-            if protocol == 'hls':
-                m3u8_formats = self._extract_m3u8_formats(
-                    manifest_url, video_id, ext='mp4',
-                    entry_protocol='m3u8_native', m3u8_id=protocol, fatal=False)
-                # Sometimes final URLs inside m3u8 are unsigned, let's fix this
-                # ourselves. Also fragments' URLs are only served signed for
-                # Safari user agent.
-                query = compat_urlparse.parse_qs(compat_urlparse.urlparse(manifest_url).query)
-                for m3u8_format in m3u8_formats:
-                    m3u8_format.update({
-                        'url': update_url_query(m3u8_format['url'], query),
-                        'http_headers': {
-                            'User-Agent': USER_AGENTS['Safari'],
-                        },
-                    })
-                formats.extend(m3u8_formats)
-            elif protocol == 'hds':
-                formats.extend(self._extract_f4m_formats(
-                    manifest_url + '&hdcore=3.8.0&plugin=flowplayer-3.8.0.0',
-                    video_id, f4m_id=protocol, fatal=False))
-
-        domain_tld = domain.split('.')[-1]
-        if domain_tld in ('se', 'dk', 'no'):
-            for protocol in PROTOCOLS:
-                # Providing dsc-geo allows to bypass geo restriction in some cases
-                self._set_cookie(
-                    'secure.dplay.%s' % domain_tld, 'dsc-geo',
-                    json.dumps({
-                        'countryCode': domain_tld.upper(),
-                        'expiry': (time.time() + 20 * 60) * 1000,
-                    }))
-                stream = self._download_json(
-                    'https://secure.dplay.%s/secure/api/v2/user/authorization/stream/%s?stream_type=%s'
-                    % (domain_tld, video_id, protocol), video_id,
-                    'Downloading %s stream JSON' % protocol, fatal=False)
-                if stream and stream.get(protocol):
-                    extract_formats(protocol, stream[protocol])
-
-        # The last resort is to try direct unsigned hls/hds URLs from info dictionary.
-        # Sometimes this does work even when secure API with dsc-geo has failed (e.g.
-        # http://www.dplay.no/pga-tour/season-1-hoydepunkter-18-21-februar/).
-        if not formats:
-            for protocol in PROTOCOLS:
-                if info.get(protocol):
-                    extract_formats(protocol, info[protocol])
-
-        self._sort_formats(formats)
-
-        subtitles = {}
-        for lang in ('se', 'sv', 'da', 'nl', 'no'):
-            for format_id in ('web_vtt', 'vtt', 'srt'):
-                subtitle_url = info.get('subtitles_%s_%s' % (lang, format_id))
-                if subtitle_url:
-                    subtitles.setdefault(lang, []).append({'url': subtitle_url})
-
-        return {
-            'id': video_id,
-            'display_id': display_id,
-            'title': title,
-            'description': info.get('video_metadata_longDescription'),
-            'duration': int_or_none(info.get('video_metadata_length'), scale=1000),
-            'timestamp': int_or_none(info.get('video_publish_date')),
-            'creator': info.get('video_metadata_homeChannel'),
-            'series': info.get('video_metadata_show'),
-            'season_number': int_or_none(info.get('season')),
-            'episode_number': int_or_none(info.get('episode')),
-            'age_limit': int_or_none(info.get('minimum_age')),
-            'formats': formats,
-            'subtitles': subtitles,
-        }
-
-
-class DPlayItIE(InfoExtractor):
-    _VALID_URL = r'https?://it\.dplay\.com/[^/]+/[^/]+/(?P<id>[^/?#]+)'
-    _GEO_COUNTRIES = ['IT']
-    _TEST = {
-        'url': 'http://it.dplay.com/nove/biografie-imbarazzanti/luigi-di-maio-la-psicosi-di-stanislawskij/',
-        'md5': '2b808ffb00fc47b884a172ca5d13053c',
-        'info_dict': {
-            'id': '6918',
-            'display_id': 'luigi-di-maio-la-psicosi-di-stanislawskij',
-            'ext': 'mp4',
-            'title': 'Biografie imbarazzanti: Luigi Di Maio: la psicosi di Stanislawskij',
-            'description': 'md5:3c7a4303aef85868f867a26f5cc14813',
-            'thumbnail': r're:^https?://.*\.jpe?g',
-            'upload_date': '20160524',
-            'series': 'Biografie imbarazzanti',
-            'season_number': 1,
-            'episode': 'Luigi Di Maio: la psicosi di Stanislawskij',
-            'episode_number': 1,
-        },
-    }
-
-    def _real_extract(self, url):
-        display_id = self._match_id(url)
-
-        webpage = self._download_webpage(url, display_id)
-
-        title = remove_end(self._og_search_title(webpage), ' | Dplay')
-
-        video_id = None
-
-        info = self._search_regex(
-            r'playback_json\s*:\s*JSON\.parse\s*\(\s*("(?:\\.|[^"\\])+?")',
-            webpage, 'playback JSON', default=None)
-        if info:
-            for _ in range(2):
-                info = self._parse_json(info, display_id, fatal=False)
-                if not info:
-                    break
-            else:
-                video_id = try_get(info, lambda x: x['data']['id'])
-
-        if not info:
-            info_url = self._search_regex(
-                (r'playback_json_url\s*:\s*(["\'])(?P<url>(?:(?!\1).)+)\1',
-                 r'url\s*[:=]\s*["\'](?P<url>(?:https?:)?//[^/]+/playback/videoPlaybackInfo/\d+)'),
-                webpage, 'info url', group='url')
-
-            info_url = urljoin(url, info_url)
-            video_id = info_url.rpartition('/')[-1]
-
-            try:
-                info = self._download_json(
-                    info_url, display_id, headers={
-                        'Authorization': 'Bearer %s' % self._get_cookies(url).get(
-                            'dplayit_token').value,
-                        'Referer': url,
-                    })
-                if isinstance(info, compat_str):
-                    info = self._parse_json(info, display_id)
-            except ExtractorError as e:
-                if isinstance(e.cause, compat_HTTPError) and e.cause.code in (400, 403):
-                    info = self._parse_json(e.cause.read().decode('utf-8'), display_id)
-                    error = info['errors'][0]
-                    if error.get('code') == 'access.denied.geoblocked':
-                        self.raise_geo_restricted(
-                            msg=error.get('detail'), countries=self._GEO_COUNTRIES)
-                    raise ExtractorError(info['errors'][0]['detail'], expected=True)
-                raise
-
-        hls_url = info['data']['attributes']['streaming']['hls']['url']
-
-        formats = self._extract_m3u8_formats(
-            hls_url, display_id, ext='mp4', entry_protocol='m3u8_native',
-            m3u8_id='hls')
-        self._sort_formats(formats)
-
-        series = self._html_search_regex(
-            r'(?s)<h1[^>]+class=["\'].*?\bshow_title\b.*?["\'][^>]*>(.+?)</h1>',
-            webpage, 'series', fatal=False)
-        episode = self._search_regex(
-            r'<p[^>]+class=["\'].*?\bdesc_ep\b.*?["\'][^>]*>\s*<br/>\s*<b>([^<]+)',
-            webpage, 'episode', fatal=False)
-
-        mobj = re.search(
-            r'(?s)<span[^>]+class=["\']dates["\'][^>]*>.+?\bS\.(?P<season_number>\d+)\s+E\.(?P<episode_number>\d+)\s*-\s*(?P<upload_date>\d{2}/\d{2}/\d{4})',
-            webpage)
-        if mobj:
-            season_number = int(mobj.group('season_number'))
-            episode_number = int(mobj.group('episode_number'))
-            upload_date = unified_strdate(mobj.group('upload_date'))
-        else:
-            season_number = episode_number = upload_date = None
-
-        return {
-            'id': compat_str(video_id or display_id),
-            'display_id': display_id,
-            'title': title,
-            'description': self._og_search_description(webpage),
-            'thumbnail': self._og_search_thumbnail(webpage),
-            'series': series,
-            'season_number': season_number,
-            'episode': episode,
-            'episode_number': episode_number,
-            'upload_date': upload_date,
-            'formats': formats,
-        }
+        domain = re.sub(r'^www\.', '', mobj.group('domain'))  # drop the prefix; str.lstrip('www.') strips a character set instead
+        country = mobj.group('country') or mobj.group('subdomain_country')  # only one is set, per the _VALID_URL alternative matched
+        host = 'disco-api.' + domain if domain.startswith('dplay.') else 'eu2-prod.disco-api.com'  # <cc>.dplay.com uses the fixed host
+        return self._get_disco_api_info(
+            url, display_id, host, 'dplay' + country, country)
diff --git a/youtube_dl/extractor/extractors.py b/youtube_dl/extractor/extractors.py
index 1db21529f..a8fe0de1a 100644
--- a/youtube_dl/extractor/extractors.py
+++ b/youtube_dl/extractor/extractors.py
@@ -277,10 +277,7 @@ from .douyutv import (
     DouyuShowIE,
     DouyuTVIE,
 )
-from .dplay import (
-    DPlayIE,
-    DPlayItIE,
-)
+from .dplay import DPlayIE
 from .dreisat import DreiSatIE
 from .drbonanza import DRBonanzaIE
 from .drtuber import DrTuberIE
diff --git a/youtube_dl/extractor/generic.py b/youtube_dl/extractor/generic.py
index 5ed952b29..f66cae0eb 100644
--- a/youtube_dl/extractor/generic.py
+++ b/youtube_dl/extractor/generic.py
@@ -118,6 +118,7 @@ from .foxnews import FoxNewsIE
 from .viqeo import ViqeoIE
 from .expressen import ExpressenIE
 from .zype import ZypeIE
+from .odnoklassniki import OdnoklassnikiIE
 
 
 class GenericIE(InfoExtractor):
@@ -2627,9 +2628,9 @@ class GenericIE(InfoExtractor):
             return self.url_result(mobj.group('url'), 'VK')
 
         # Look for embedded Odnoklassniki player
-        mobj = re.search(r'<iframe[^>]+?src=(["\'])(?P<url>https?://(?:odnoklassniki|ok)\.ru/videoembed/.+?)\1', webpage)
-        if mobj is not None:
-            return self.url_result(mobj.group('url'), 'Odnoklassniki')
+        odnoklassniki_url = OdnoklassnikiIE._extract_url(webpage)
+        if odnoklassniki_url:
+            return self.url_result(odnoklassniki_url, OdnoklassnikiIE.ie_key())
 
         # Look for embedded ivi player
         mobj = re.search(r'<embed[^>]+?src=(["\'])(?P<url>https?://(?:www\.)?ivi\.ru/video/player.+?)\1', webpage)
diff --git a/youtube_dl/extractor/odnoklassniki.py b/youtube_dl/extractor/odnoklassniki.py
index 06de40e50..0eb79e250 100644
--- a/youtube_dl/extractor/odnoklassniki.py
+++ b/youtube_dl/extractor/odnoklassniki.py
@@ -1,6 +1,8 @@
 # coding: utf-8
 from __future__ import unicode_literals
 
+import re
+
 from .common import InfoExtractor
 from ..compat import (
     compat_etree_fromstring,
@@ -136,6 +138,13 @@ class OdnoklassnikiIE(InfoExtractor):
         'only_matching': True,
     }]
 
+    @staticmethod
+    def _extract_url(webpage):
+        # First <iframe> whose src is an (odnoklassniki|ok).ru videoembed URL, or None.
+        embed = re.search(
+            r'<iframe[^>]+src=(["\'])(?P<url>(?:https?:)?//(?:odnoklassniki|ok)\.ru/videoembed/.+?)\1', webpage)
+        return embed.group('url') if embed else None
+
     def _real_extract(self, url):
         start_time = int_or_none(compat_parse_qs(
             compat_urllib_parse_urlparse(url).query).get('fromTime', [None])[0])
diff --git a/youtube_dl/extractor/vk.py b/youtube_dl/extractor/vk.py
index 08e838060..4c8ca4f41 100644
--- a/youtube_dl/extractor/vk.py
+++ b/youtube_dl/extractor/vk.py
@@ -12,7 +12,6 @@ from ..utils import (
     get_element_by_class,
     int_or_none,
     orderedSet,
-    remove_start,
     str_or_none,
     str_to_int,
     unescapeHTML,
@@ -21,6 +20,7 @@ from ..utils import (
     urlencode_postdata,
 )
 from .dailymotion import DailymotionIE
+from .odnoklassniki import OdnoklassnikiIE
 from .pladform import PladformIE
 from .vimeo import VimeoIE
 from .youtube import YoutubeIE
@@ -60,6 +60,18 @@ class VKBaseIE(InfoExtractor):
     def _real_initialize(self):
         self._login()
 
+    def _download_payload(self, path, video_id, data, fatal=True):
+        form = urlencode_postdata(dict(data, al=1))  # copy: caller's dict is not mutated
+        response = self._download_json(
+            'https://vk.com/%s.php' % path, video_id, data=form, fatal=fatal,
+            headers={'X-Requested-With': 'XMLHttpRequest'})
+        code, payload = response['payload'] if response else (None, None)  # failed non-fatal fetch
+        if code == '3':
+            self.raise_login_required()
+        elif code == '8':
+            raise ExtractorError(clean_html(payload[0][1:-1]), expected=True)
+        return payload
+
 
 class VKIE(VKBaseIE):
     IE_NAME = 'vk'
@@ -96,7 +108,6 @@ class VKIE(VKBaseIE):
         },
         {
             'url': 'http://vk.com/video205387401_165548505',
-            'md5': '6c0aeb2e90396ba97035b9cbde548700',
             'info_dict': {
                 'id': '205387401_165548505',
                 'ext': 'mp4',
@@ -110,18 +121,18 @@ class VKIE(VKBaseIE):
         },
         {
             'note': 'Embedded video',
-            'url': 'http://vk.com/video_ext.php?oid=32194266&id=162925554&hash=7d8c2e0d5e05aeaa&hd=1',
-            'md5': 'c7ce8f1f87bec05b3de07fdeafe21a0a',
+            'url': 'https://vk.com/video_ext.php?oid=-77521&id=162222515&hash=87b046504ccd8bfa',
+            'md5': '7babad3b85ea2e91948005b1b8b0cb84',
             'info_dict': {
-                'id': '32194266_162925554',
+                'id': '-77521_162222515',
                 'ext': 'mp4',
-                'uploader': 'Vladimir Gavrin',
-                'title': 'Lin Dan',
-                'duration': 101,
-                'upload_date': '20120730',
-                'view_count': int,
+                'uploader': 're:(?:Noize MC|Alexander Ilyashenko).*',
+                'title': 'ProtivoGunz - Хуёвая песня',
+                'duration': 195,
+                'upload_date': '20120212',
+                'timestamp': 1329049880,
+                'uploader_id': '-77521',
             },
-            'skip': 'This video has been removed from public access.',
         },
         {
             # VIDEO NOW REMOVED
@@ -138,18 +149,19 @@ class VKIE(VKBaseIE):
                 'upload_date': '20121218',
                 'view_count': int,
             },
-            'skip': 'Requires vk account credentials',
+            'skip': 'Removed',
         },
         {
             'url': 'http://vk.com/hd_kino_mania?z=video-43215063_168067957%2F15c66b9b533119788d',
-            'md5': '4d7a5ef8cf114dfa09577e57b2993202',
             'info_dict': {
                 'id': '-43215063_168067957',
                 'ext': 'mp4',
-                'uploader': 'Киномания - лучшее из мира кино',
+                'uploader': 'Bro Mazter',
                 'title': ' ',
                 'duration': 7291,
                 'upload_date': '20140328',
+                'uploader_id': '223413403',
+                'timestamp': 1396018030,
             },
             'skip': 'Requires vk account credentials',
         },
@@ -165,7 +177,7 @@ class VKIE(VKBaseIE):
                 'upload_date': '20140626',
                 'view_count': int,
             },
-            'skip': 'Only works from Russia',
+            'skip': 'Removed',
         },
         {
             # video (removed?) only available with list id
@@ -247,6 +259,9 @@ class VKIE(VKBaseIE):
                 'uploader_id': '-387766',
                 'timestamp': 1475137527,
             },
+            'params': {
+                'skip_download': True,
+            },
         },
         {
             # live stream, hls and rtmp links, most likely already finished live
@@ -282,100 +297,100 @@ class VKIE(VKBaseIE):
             # The video is not available in your region.
             'url': 'https://vk.com/video-51812607_171445436',
             'only_matching': True,
-        },
-        {
-            # Video %s is not available.
-            'url': 'https://vk.com/video-173478245_456239188',
-            'only_matching': True,
-        },
-    ]
+        }]
 
     def _real_extract(self, url):
         mobj = re.match(self._VALID_URL, url)
         video_id = mobj.group('videoid')
 
+        mv_data = {}
         if video_id:
-            info_url = 'https://vk.com/al_video.php?act=show_inline&al=1&video=' + video_id
+            data = {
+                'act': 'show_inline',
+                'video': video_id,
+            }
             # Some videos (removed?) can only be downloaded with list id specified
             list_id = mobj.group('list_id')
             if list_id:
-                info_url += '&list=%s' % list_id
+                data['list'] = list_id
+
+            payload = self._download_payload('al_video', video_id, data)
+            info_page = payload[1]
+            opts = payload[-1]
+            mv_data = opts.get('mvData') or {}
+            player = opts.get('player') or {}
         else:
-            info_url = 'http://vk.com/video_ext.php?' + mobj.group('embed_query')
             video_id = '%s_%s' % (mobj.group('oid'), mobj.group('id'))
 
-        info_page = self._download_webpage(info_url, video_id)
-        url_page = self._download_webpage(url, video_id)
+            info_page = self._download_webpage(
+                'http://vk.com/video_ext.php?' + mobj.group('embed_query'), video_id)
 
-        error_message = self._html_search_regex(
-            [r'(?s)<!><div[^>]+class="video_layer_message"[^>]*>(.+?)</div>',
-                r'(?s)<div[^>]+id="video_ext_msg"[^>]*>(.+?)</div>'],
-            info_page, 'error message', default=None)
-        if error_message:
-            raise ExtractorError(error_message, expected=True)
+            error_message = self._html_search_regex(
+                [r'(?s)<!><div[^>]+class="video_layer_message"[^>]*>(.+?)</div>',
+                    r'(?s)<div[^>]+id="video_ext_msg"[^>]*>(.+?)</div>'],
+                info_page, 'error message', default=None)
+            if error_message:
+                raise ExtractorError(error_message, expected=True)
 
-        if re.search(r'<!>/login\.php\?.*\bact=security_check', info_page):
-            raise ExtractorError(
-                'You are trying to log in from an unusual location. You should confirm ownership at vk.com to log in with this IP.',
-                expected=True)
-
-        ERROR_COPYRIGHT = 'Video %s has been removed from public access due to rightholder complaint.'
-
-        ERRORS = {
-            r'Видеозапись .*? была изъята из публичного доступа в связи с обращением правообладателя.<':
-            ERROR_COPYRIGHT,
+            if re.search(r'<!>/login\.php\?.*\bact=security_check', info_page):
+                raise ExtractorError(
+                    'You are trying to log in from an unusual location. You should confirm ownership at vk.com to log in with this IP.',
+                    expected=True)
 
-            r'The video .*? was removed from public access by request of the copyright holder.<':
-            ERROR_COPYRIGHT,
+            ERROR_COPYRIGHT = 'Video %s has been removed from public access due to rightholder complaint.'
 
-            r'Please log in or <':
-            'Video %s is only available for registered users, '
-            'use --username and --password options to provide account credentials.',
+            ERRORS = {
+                r'>Видеозапись .*? была изъята из публичного доступа в связи с обращением правообладателя.<':
+                ERROR_COPYRIGHT,
 
-            r'Unknown error':
-            'Video %s does not exist.',
+                r'>The video .*? was removed from public access by request of the copyright holder.<':
+                ERROR_COPYRIGHT,
 
-            r'<!>Видео временно недоступно':
-            'Video %s is temporarily unavailable.',
+                r'<!>Please log in or <':
+                'Video %s is only available for registered users, '
+                'use --username and --password options to provide account credentials.',
 
-            r'Access denied':
-            'Access denied to video %s.',
+                r'<!>Unknown error':
+                'Video %s does not exist.',
 
-            r'Видеозапись недоступна, так как её автор был заблокирован.':
-            'Video %s is no longer available, because its author has been blocked.',
+                r'<!>Видео временно недоступно':
+                'Video %s is temporarily unavailable.',
 
-            r'This video is no longer available, because its author has been blocked.':
-            'Video %s is no longer available, because its author has been blocked.',
+                r'<!>Access denied':
+                'Access denied to video %s.',
 
-            r'This video is no longer available, because it has been deleted.':
-            'Video %s is no longer available, because it has been deleted.',
+                r'<!>Видеозапись недоступна, так как её автор был заблокирован.':
+                'Video %s is no longer available, because its author has been blocked.',
 
-            r'The video .+? is not available in your region.':
-            'Video %s is not available in your region.',
+                r'<!>This video is no longer available, because its author has been blocked.':
+                'Video %s is no longer available, because its author has been blocked.',
 
-            r'The video .+? is unavailable':
-                'Video %s is not available.',
+                r'<!>This video is no longer available, because it has been deleted.':
+                'Video %s is no longer available, because it has been deleted.',
 
-            r'You need to be a member of this group to view':
-                'Video %s is for group members only.',
-        }
+                r'<!>The video .+? is not available in your region.':
+                'Video %s is not available in your region.',
+            }
 
-        for error_re, error_msg in ERRORS.items():
-            for page in [info_page, url_page]:
-                if re.search(error_re, page):
+            for error_re, error_msg in ERRORS.items():
+                if re.search(error_re, info_page):
                     raise ExtractorError(error_msg % video_id, expected=True)
 
+            player = self._parse_json(self._search_regex(
+                r'var\s+playerParams\s*=\s*({.+?})\s*;\s*\n',
+                info_page, 'player params'), video_id)
+
         youtube_url = YoutubeIE._extract_url(info_page)
         if youtube_url:
-            return self.url_result(youtube_url, ie=YoutubeIE.ie_key())
+            return self.url_result(youtube_url, YoutubeIE.ie_key())
 
         vimeo_url = VimeoIE._extract_url(url, info_page)
         if vimeo_url is not None:
-            return self.url_result(vimeo_url)
+            return self.url_result(vimeo_url, VimeoIE.ie_key())
 
         pladform_url = PladformIE._extract_url(info_page)
         if pladform_url:
-            return self.url_result(pladform_url)
+            return self.url_result(pladform_url, PladformIE.ie_key())
 
         m_rutube = re.search(
             r'\ssrc="((?:https?:)?//rutube\.ru\\?/(?:video|play)\\?/embed(?:.*?))\\?"', info_page)
@@ -388,6 +403,10 @@ class VKIE(VKBaseIE):
         if dailymotion_urls:
             return self.url_result(dailymotion_urls[0], DailymotionIE.ie_key())
 
+        odnoklassniki_url = OdnoklassnikiIE._extract_url(info_page)
+        if odnoklassniki_url:
+            return self.url_result(odnoklassniki_url, OdnoklassnikiIE.ie_key())
+
         m_opts = re.search(r'(?s)var\s+opts\s*=\s*({.+?});', info_page)
         if m_opts:
             m_opts_url = re.search(r"url\s*:\s*'((?!/\b)[^']+)", m_opts.group(1))
@@ -397,38 +416,7 @@ class VKIE(VKBaseIE):
                     opts_url = 'http:' + opts_url
                 return self.url_result(opts_url)
 
-        # vars does not look to be served anymore since 24.10.2016
-        data = self._parse_json(
-            self._search_regex(
-                r'var\s+vars\s*=\s*({.+?});', info_page, 'vars', default='{}'),
-            video_id, fatal=False)
-
-        # <!json> is served instead
-        if not data:
-            data = self._parse_json(
-                self._search_regex(
-                    [r'<!json>\s*({.+?})\s*<!>', r'<!json>\s*({.+})'],
-                    info_page, 'json', default='{}'),
-                video_id)
-            if data:
-                data = data['player']['params'][0]
-
-        if not data:
-            data = self._parse_json(
-                self._search_regex(
-                    r'var\s+playerParams\s*=\s*({.+?})\s*;\s*\n', info_page,
-                    'player params', default='{}'),
-                video_id)
-            if data:
-                data = data['params'][0]
-
-        # <!--{...}
-        if not data:
-            data = self._parse_json(
-                self._search_regex(
-                    r'<!--\s*({.+})', info_page, 'payload'),
-                video_id)['payload'][-1][-1]['player']['params'][0]
-
+        data = player['params'][0]
         title = unescapeHTML(data['md_title'])
 
         # 2 = live
@@ -477,12 +465,12 @@ class VKIE(VKBaseIE):
             'title': title,
             'thumbnail': data.get('jpg'),
             'uploader': data.get('md_author'),
-            'uploader_id': str_or_none(data.get('author_id')),
-            'duration': data.get('duration'),
+            'uploader_id': str_or_none(data.get('author_id') or mv_data.get('authorId')),
+            'duration': int_or_none(data.get('duration') or mv_data.get('duration')),
             'timestamp': timestamp,
             'view_count': view_count,
-            'like_count': int_or_none(data.get('liked')),
-            'dislike_count': int_or_none(data.get('nolikes')),
+            'like_count': int_or_none(mv_data.get('likes')),
+            'comment_count': int_or_none(mv_data.get('commcount')),
             'is_live': is_live,
         }
 
@@ -496,7 +484,6 @@ class VKUserVideosIE(VKBaseIE):
         'url': 'http://vk.com/videos205387401',
         'info_dict': {
             'id': '205387401',
-            'title': "Tom Cruise's Videos",
         },
         'playlist_mincount': 4,
     }, {
@@ -512,22 +499,25 @@ class VKUserVideosIE(VKBaseIE):
         'url': 'http://new.vk.com/videos205387401',
         'only_matching': True,
     }]
+    _VIDEO = collections.namedtuple(
+        'Video', ['owner_id', 'id', 'thumb', 'title', 'flags', 'duration', 'hash', 'moder_acts', 'owner', 'date', 'views', 'platform', 'blocked', 'music_video_meta'])
 
     def _real_extract(self, url):
         page_id = self._match_id(url)
 
-        webpage = self._download_webpage(url, page_id)
-
-        entries = [
-            self.url_result(
-                'http://vk.com/video' + video_id, 'VK', video_id=video_id)
-            for video_id in orderedSet(re.findall(r'href="/video(-?[0-9_]+)"', webpage))]
+        videos = self._download_payload('al_video', page_id, {
+            'act': 'load_videos_silent',
+            'oid': page_id,
+        })[0]['']['list']
 
-        title = unescapeHTML(self._search_regex(
-            r'<title>\s*([^<]+?)\s+\|\s+\d+\s+videos',
-            webpage, 'title', default=page_id))
+        entries = []
+        for video in videos:
+            # _make() needs exact-length rows, so drop any extra trailing fields
+            v = self._VIDEO._make(video[:len(self._VIDEO._fields)])
+            video_id = '%d_%d' % (v.owner_id, v.id)
+            entries.append(self.url_result('http://vk.com/video' + video_id, 'VK', video_id=video_id))
 
-        return self.playlist_result(entries, page_id, title)
+        return self.playlist_result(entries, page_id)
 
 
 class VKWallPostIE(VKBaseIE):
@@ -537,15 +527,15 @@ class VKWallPostIE(VKBaseIE):
         # public page URL, audio playlist
         'url': 'https://vk.com/bs.official?w=wall-23538238_35',
         'info_dict': {
-            'id': '23538238_35',
-            'title': 'Black Shadow - Wall post 23538238_35',
+            'id': '-23538238_35',
+            'title': 'Black Shadow - Wall post -23538238_35',
             'description': 'md5:3f84b9c4f9ef499731cf1ced9998cc0c',
         },
         'playlist': [{
             'md5': '5ba93864ec5b85f7ce19a9af4af080f6',
             'info_dict': {
                 'id': '135220665_111806521',
-                'ext': 'mp3',
+                'ext': 'mp4',
                 'title': 'Black Shadow - Слепое Верование',
                 'duration': 370,
                 'uploader': 'Black Shadow',
@@ -556,18 +546,16 @@ class VKWallPostIE(VKBaseIE):
             'md5': '4cc7e804579122b17ea95af7834c9233',
             'info_dict': {
                 'id': '135220665_111802303',
-                'ext': 'mp3',
+                'ext': 'mp4',
                 'title': 'Black Shadow - Война - Негасимое Бездны Пламя!',
                 'duration': 423,
                 'uploader': 'Black Shadow',
                 'artist': 'Black Shadow',
                 'track': 'Война - Негасимое Бездны Пламя!',
             },
-            'params': {
-                'skip_download': True,
-            },
         }],
         'params': {
+            'skip_download': True,
             'usenetrc': True,
         },
         'skip': 'Requires vk account credentials',
@@ -576,7 +564,7 @@ class VKWallPostIE(VKBaseIE):
         'url': 'https://vk.com/wall85155021_6319',
         'info_dict': {
             'id': '85155021_6319',
-            'title': 'Sergey Gorbunov - Wall post 85155021_6319',
+            'title': 'Сергей Горбунов - Wall post 85155021_6319',
         },
         'playlist_count': 1,
         'params': {
@@ -592,58 +580,72 @@ class VKWallPostIE(VKBaseIE):
         'url': 'https://m.vk.com/wall-23538238_35',
         'only_matching': True,
     }]
+    _BASE64_CHARS = 'abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMN0PQRSTUVWXYZO123456789+/='
+    _AUDIO = collections.namedtuple(
+        'Audio', ['id', 'owner_id', 'url', 'title', 'performer', 'duration', 'album_id', 'unk', 'author_link', 'lyrics', 'flags', 'context', 'extra', 'hashes', 'cover_url', 'ads', 'subtitle', 'main_artists', 'feat_artists', 'album', 'track_code', 'restriction', 'album_part', 'new_stats', 'access_key'])
+
+    def _decode(self, enc):
+        # Fold 6-bit symbols of _BASE64_CHARS; emit a char on 3 of every 4 symbols.
+        decoded = []
+        acc = 0
+        for pos, symbol in enumerate(enc):
+            value = self._BASE64_CHARS.index(symbol)
+            phase = pos % 4
+            acc = 64 * acc + value if phase else value
+            if phase:
+                decoded.append(chr(255 & acc >> (-2 * (pos + 1) & 6)))
+        return ''.join(decoded)
+
+    def _unmask_url(self, mask_url, vk_id):
+        # URLs without the 'audio_api_unavailable' marker are returned untouched.
+        if 'audio_api_unavailable' not in mask_url:
+            return mask_url
+        extra = mask_url.split('?extra=')[1].split('#')
+        func, base = self._decode(extra[1]).split(chr(11))
+        chars = list(self._decode(extra[0]))
+        size = len(chars)
+        swaps = [None] * size
+        seed = int(base) ^ vk_id
+        for pos in reversed(range(size)):
+            seed = (size * (pos + 1) ^ seed + pos) % size
+            swaps[pos] = seed
+        # Swap each character (from index 1 on) with its precomputed partner.
+        for pos in range(1, size):
+            other = swaps[size - 1 - pos]
+            chars[pos], chars[other] = chars[other], chars[pos]
+        return ''.join(chars)
 
     def _real_extract(self, url):
         post_id = self._match_id(url)
 
-        wall_url = 'https://vk.com/wall%s' % post_id
-
-        post_id = remove_start(post_id, '-')
-
-        webpage = self._download_webpage(wall_url, post_id)
-
-        error = self._html_search_regex(
-            r'>Error</div>\s*<div[^>]+class=["\']body["\'][^>]*>([^<]+)',
-            webpage, 'error', default=None)
-        if error:
-            raise ExtractorError('VK said: %s' % error, expected=True)
+        webpage = self._download_payload('wkview', post_id, {
+            'act': 'show',
+            'w': 'wall' + post_id,
+        })[1]
 
         description = clean_html(get_element_by_class('wall_post_text', webpage))
         uploader = clean_html(get_element_by_class('author', webpage))
-        thumbnail = self._og_search_thumbnail(webpage)
 
         entries = []
 
-        audio_ids = re.findall(r'data-full-id=["\'](\d+_\d+)', webpage)
-        if audio_ids:
-            al_audio = self._download_webpage(
-                'https://vk.com/al_audio.php', post_id,
-                note='Downloading audio info', fatal=False,
-                data=urlencode_postdata({
-                    'act': 'reload_audio',
-                    'al': '1',
-                    'ids': ','.join(audio_ids)
-                }))
-            if al_audio:
-                Audio = collections.namedtuple(
-                    'Audio', ['id', 'user_id', 'url', 'track', 'artist', 'duration'])
-                audios = self._parse_json(
-                    self._search_regex(
-                        r'<!json>(.+?)<!>', al_audio, 'audios', default='[]'),
-                    post_id, fatal=False, transform_source=unescapeHTML)
-                if isinstance(audios, list):
-                    for audio in audios:
-                        a = Audio._make(audio[:6])
-                        entries.append({
-                            'id': '%s_%s' % (a.user_id, a.id),
-                            'url': a.url,
-                            'title': '%s - %s' % (a.artist, a.track) if a.artist and a.track else a.id,
-                            'thumbnail': thumbnail,
-                            'duration': a.duration,
-                            'uploader': uploader,
-                            'artist': a.artist,
-                            'track': a.track,
-                        })
+        for audio in re.findall(r'data-audio="([^"]+)', webpage):
+            audio = self._parse_json(unescapeHTML(audio), post_id)
+            a = self._AUDIO._make(audio)
+            if not a.url:
+                continue
+            title = unescapeHTML(a.title)
+            entries.append({
+                'id': '%s_%s' % (a.owner_id, a.id),
+                'url': self._unmask_url(a.url, a.ads['vk_id']),
+                'title': '%s - %s' % (a.performer, title) if a.performer else title,
+                'thumbnail': a.cover_url.split(',') if a.cover_url else None,
+                'duration': a.duration,
+                'uploader': uploader,
+                'artist': a.performer,
+                'track': title,
+                'ext': 'mp4',
+                'protocol': 'm3u8',
+            })
 
         for video in re.finditer(
                 r'<a[^>]+href=(["\'])(?P<url>/video(?:-?[\d_]+).*?)\1', webpage):

From a8320b35b27755b8de4e323ce7a2527d0ff8f19e Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Sun, 27 Oct 2019 14:39:11 +0200
Subject: [PATCH 03/46] refix prints.

---
 youtube_dl/extractor/vk.py | 27 ++++++++++++++-------------
 1 file changed, 14 insertions(+), 13 deletions(-)

diff --git a/youtube_dl/extractor/vk.py b/youtube_dl/extractor/vk.py
index 4c8ca4f41..acd809389 100644
--- a/youtube_dl/extractor/vk.py
+++ b/youtube_dl/extractor/vk.py
@@ -324,7 +324,7 @@ class VKIE(VKBaseIE):
 
             info_page = self._download_webpage(
                 'http://vk.com/video_ext.php?' + mobj.group('embed_query'), video_id)
-
+            url_page = self._download_webpage(url, video_id)
             error_message = self._html_search_regex(
                 [r'(?s)<!><div[^>]+class="video_layer_message"[^>]*>(.+?)</div>',
                     r'(?s)<div[^>]+id="video_ext_msg"[^>]*>(.+?)</div>'],
@@ -340,41 +340,42 @@ class VKIE(VKBaseIE):
             ERROR_COPYRIGHT = 'Video %s has been removed from public access due to rightholder complaint.'
 
             ERRORS = {
-                r'>Видеозапись .*? была изъята из публичного доступа в связи с обращением правообладателя.<':
+                r'Видеозапись .*? была изъята из публичного доступа в связи с обращением правообладателя.<':
                 ERROR_COPYRIGHT,
 
-                r'>The video .*? was removed from public access by request of the copyright holder.<':
+                r'The video .*? was removed from public access by request of the copyright holder.<':
                 ERROR_COPYRIGHT,
 
-                r'<!>Please log in or <':
+                r'Please log in or <':
                 'Video %s is only available for registered users, '
                 'use --username and --password options to provide account credentials.',
 
-                r'<!>Unknown error':
+                r'Unknown error':
                 'Video %s does not exist.',
 
-                r'<!>Видео временно недоступно':
+                r'Видео временно недоступно':
                 'Video %s is temporarily unavailable.',
 
-                r'<!>Access denied':
+                r'Access denied':
                 'Access denied to video %s.',
 
-                r'<!>Видеозапись недоступна, так как её автор был заблокирован.':
+                r'Видеозапись недоступна, так как её автор был заблокирован.':
                 'Video %s is no longer available, because its author has been blocked.',
 
-                r'<!>This video is no longer available, because its author has been blocked.':
+                r'This video is no longer available, because its author has been blocked.':
                 'Video %s is no longer available, because its author has been blocked.',
 
-                r'<!>This video is no longer available, because it has been deleted.':
+                r'This video is no longer available, because it has been deleted.':
                 'Video %s is no longer available, because it has been deleted.',
 
-                r'<!>The video .+? is not available in your region.':
+                r'The video .+? is not available in your region.':
                 'Video %s is not available in your region.',
             }
 
             for error_re, error_msg in ERRORS.items():
-                if re.search(error_re, info_page):
-                    raise ExtractorError(error_msg % video_id, expected=True)
+                for page in [info_page, url_page]:
+                    if re.search(error_re, page):
+                        raise ExtractorError(error_msg % video_id, expected=True)
 
             player = self._parse_json(self._search_regex(
                 r'var\s+playerParams\s*=\s*({.+?})\s*;\s*\n',

From c63550346fd17053f6e739409fa9b58a6243747a Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Thu, 7 Nov 2019 15:34:05 +0200
Subject: [PATCH 04/46] fix timestamp extraction.

---
 youtube_dl/extractor/odnoklassniki.py | 103 ++++++++++++++++----------
 1 file changed, 63 insertions(+), 40 deletions(-)

diff --git a/youtube_dl/extractor/odnoklassniki.py b/youtube_dl/extractor/odnoklassniki.py
index 0eb79e250..ef951672a 100644
--- a/youtube_dl/extractor/odnoklassniki.py
+++ b/youtube_dl/extractor/odnoklassniki.py
@@ -1,6 +1,6 @@
 # coding: utf-8
 from __future__ import unicode_literals
-
+from datetime import datetime, timedelta
 import re
 
 from .common import InfoExtractor
@@ -17,6 +17,7 @@ from ..utils import (
     qualities,
     unescapeHTML,
     urlencode_postdata,
+    unified_timestamp
 )
 
 
@@ -199,45 +200,7 @@ class OdnoklassnikiIE(InfoExtractor):
 
         upload_date = unified_strdate(self._html_search_meta(
             'ya:ovs:upload_date', webpage, 'upload date', default=None))
-
-        if upload_date is None:
-            upload_date_str = self._search_regex(
-                r'vp-layer-info_date">(?P<date>.*?)<\/span>',
-                webpage, 'upload date', group='date')
-            if upload_date_str:
-                upload_date_str = upload_date_str.replace('Sept', 'Sep')
-                from datetime import datetime, timedelta
-                upload_date_time = None
-                try:
-                    upload_date_time = datetime.strptime(upload_date_str, '%d %b %Y')
-                except:
-                    pass
-                try:
-                    upload_date_time = datetime.strptime(upload_date_str, '%d %b')
-                    upload_date_time = upload_date_time.replace(year=datetime.utcnow().year)
-                except:
-                    pass
-                try:
-                    upload_date_time = datetime.strptime(upload_date_str, '%d %B')
-                    upload_date_time = upload_date_time.replace(year=datetime.utcnow().year)
-                except:
-                    pass
-
-                try:
-                    if upload_date_str.find(':') >=0:
-                        hour_and_minutes = upload_date_str.split(' ')[-1]
-                    else:
-                        hour_and_minutes = upload_date_str
-                    upload_date_time = datetime.strptime(hour_and_minutes, '%H:%M')
-                    upload_date_time = upload_date_time.replace(year=datetime.utcnow().year)
-                    upload_date_time = upload_date_time.replace(day=datetime.utcnow().day)
-                    if upload_date_str.find('yesterday') ==0:
-                        upload_date_time = upload_date_time - timedelta(days=1)
-                except:
-                    pass
-
-                if upload_date_time:
-                    upload_date = upload_date_time.strftime('%Y%m%d')
+        upload_date, timestamp = self.resolve_timestamp_and_upload_date(upload_date, webpage)
 
         age_limit = None
         adult = self._html_search_meta(
@@ -253,6 +216,7 @@ class OdnoklassnikiIE(InfoExtractor):
             'thumbnail': thumbnail,
             'duration': duration,
             'upload_date': upload_date,
+            'timestamp': timestamp,
             'uploader': uploader,
             'uploader_id': uploader_id,
             'like_count': like_count,
@@ -322,3 +286,62 @@ class OdnoklassnikiIE(InfoExtractor):
 
         info['formats'] = formats
         return info
+
+    def resolve_timestamp_and_upload_date(self, upload_date, webpage):
+        """Return (upload_date, timestamp) based on the date text shown on the video page.
+
+        A None upload_date is derived from that text; otherwise its HH:MM is combined with upload_date.
+        """
+        timestamp = None
+        upload_date_str = self._search_regex(
+            r'vp-layer-info_date">(?P<date>.*?)<\/span>',
+            webpage, 'upload date', group='date')
+        if upload_date_str:
+            if upload_date is None:
+                upload_date_time = None
+                upload_date_str = upload_date_str.replace('Sept', 'Sep')
+                today = datetime.utcnow()
+                # Formats without a year are taken to be in the current (UTC) year.
+                for date_format in ('%d %b %Y', '%d %b', '%d %B'):
+                    try:
+                        upload_date_time = datetime.strptime(upload_date_str, date_format)
+                    except ValueError:
+                        continue
+                    if '%Y' not in date_format:
+                        upload_date_time = upload_date_time.replace(year=today.year)
+                    break
+                # Use a separate name so a missing HH:MM cannot clobber a date parsed above.
+                clock = self._extract_hours_and_minutes(upload_date_str)
+                if clock:
+                    # A bare time ('14:30', 'yesterday 14:30') is relative to today.
+                    upload_date_time = clock.replace(
+                        year=today.year, month=today.month, day=today.day)
+                    if upload_date_str.find('yesterday') == 0:
+                        upload_date_time = upload_date_time - timedelta(days=1)
+
+                if upload_date_time:
+                    upload_date = upload_date_time.strftime('%Y%m%d')
+            else:
+                upload_date_time = datetime.strptime(upload_date, '%Y%m%d')
+                upload_date_hours_and_minutes = self._extract_hours_and_minutes(upload_date_str)
+                if upload_date_hours_and_minutes:
+                    upload_date_time = upload_date_time + timedelta(
+                        hours=upload_date_hours_and_minutes.hour, minutes=upload_date_hours_and_minutes.minute
+                    )
+                    timestamp = unified_timestamp(upload_date_time.isoformat())
+                if upload_date_time:
+                    upload_date = upload_date_time.strftime('%Y%m%d')
+
+        return upload_date, timestamp
+
+    @staticmethod
+    def _extract_hours_and_minutes(upload_date_str):
+        """Parse the trailing HH:MM of upload_date_str into a datetime, or return None if absent."""
+        try:
+            if upload_date_str.find(':') >= 0:
+                hour_and_minutes = upload_date_str.split(' ')[-1]
+            else:
+                hour_and_minutes = upload_date_str
+            return datetime.strptime(hour_and_minutes, '%H:%M')
+        except (AttributeError, TypeError, ValueError):
+            return None
\ No newline at end of file

From 608dd9524cb913798ba6c39afaf10493e87b40a6 Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Thu, 7 Nov 2019 15:46:35 +0200
Subject: [PATCH 05/46] fix timezone.

---
 youtube_dl/extractor/odnoklassniki.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/youtube_dl/extractor/odnoklassniki.py b/youtube_dl/extractor/odnoklassniki.py
index ef951672a..4b46117a7 100644
--- a/youtube_dl/extractor/odnoklassniki.py
+++ b/youtube_dl/extractor/odnoklassniki.py
@@ -326,7 +326,7 @@ class OdnoklassnikiIE(InfoExtractor):
                 upload_date_hours_and_minutes = self._extract_hours_and_minutes(upload_date_str)
                 if upload_date_hours_and_minutes:
                     upload_date_time = upload_date_time + timedelta(
-                        hours=upload_date_hours_and_minutes.hour, minutes=upload_date_hours_and_minutes.minute
+                        hours=upload_date_hours_and_minutes.hour - 3, minutes=upload_date_hours_and_minutes.minute
                     )
                     timestamp = unified_timestamp(upload_date_time.isoformat())
                 if upload_date_time:

From 638d00d852ecec80072250f47759a1a6d39ded73 Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Sun, 10 Nov 2019 13:42:48 +0200
Subject: [PATCH 06/46] add support for facebook watch

---
 youtube_dl/extractor/facebook.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index b205fa276..ac05b580f 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -40,7 +40,8 @@ class FacebookIE(InfoExtractor):
                                 photo\.php|
                                 video\.php|
                                 video/embed|
-                                story\.php
+                                story\.php|
+                                watch
                             )\?(?:.*?)(?:v|video_id|story_fbid)=|
                             [^/]+/videos/(?:[^/]+/)?|
                             [^/]+/posts/|

From 6bb25bb1d4d8504752b496033ef70c127ccd9c45 Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Mon, 11 Nov 2019 16:34:57 +0200
Subject: [PATCH 07/46] lowercase escape channel name.

---
 youtube_dl/extractor/facebook.py | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index ac05b580f..ea4bd6d8d 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -24,7 +24,8 @@ from ..utils import (
     sanitized_Request,
     try_get,
     urlencode_postdata,
-    update_url_query
+    update_url_query,
+    lowercase_escape
 )
 
 
@@ -455,9 +456,9 @@ class FacebookIE(InfoExtractor):
         uploader = clean_html(get_element_by_id(
             'fbPhotoPageAuthorName', webpage)) or self._search_regex(
             r'ownerName\s*:\s*"([^"]+)"', webpage, 'uploader',default=None) or \
-                   self._search_regex(
+                   lowercase_escape(self._search_regex(
                         r'\"ownerName\":"(.+?)"', tahoe_data.secondary,
-                        'uploader_id', fatal=False) or self._og_search_title(webpage, default=None)
+                        'uploader_id', default='')) or self._og_search_title(webpage, default=None)
 
 
         timestamp = int_or_none(self._search_regex(

From 3e1144a71d2dfb5ae68962ba1d69cdbf49623600 Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Thu, 14 Nov 2019 16:41:25 +0200
Subject: [PATCH 08/46] add twitter views back.

---
 youtube_dl/extractor/twitter.py | 29 +++++++++++++++++++++++++----
 1 file changed, 25 insertions(+), 4 deletions(-)

diff --git a/youtube_dl/extractor/twitter.py b/youtube_dl/extractor/twitter.py
index 5f8d90fb4..dd9498dfd 100644
--- a/youtube_dl/extractor/twitter.py
+++ b/youtube_dl/extractor/twitter.py
@@ -2,6 +2,8 @@
 from __future__ import unicode_literals
 
 import re
+import time
+
 
 from .common import InfoExtractor
 from ..compat import (
@@ -20,6 +22,7 @@ from ..utils import (
     unified_timestamp,
     update_url_query,
     xpath_text,
+    parse_count
 )
 
 from .periscope import (
@@ -79,11 +82,20 @@ class TwitterBaseIE(InfoExtractor):
         headers = {
             'Authorization': 'Bearer AAAAAAAAAAAAAAAAAAAAAPYXBAAAAAAACLXUNDekMxqa8h%2F40K4moUkGsoc%3DTYfbDKbT3jJPCEVnMYqilB28NHfOPqkca3qaAxGfsyKCs0wRbw',
         }
+        ct0 = self._get_cookies(self._API_BASE).get('ct0')
+        if ct0:
+            headers['x-csrf-token'] = ct0.value
         if not self._GUEST_TOKEN:
-            self._GUEST_TOKEN = self._download_json(
-                self._API_BASE + 'guest/activate.json', video_id,
-                'Downloading guest token', data=b'',
-                headers=headers)['guest_token']
+            guest_token_c = self._get_cookies('http://api.twitter.com/').get('gt')
+            if guest_token_c:
+                self._GUEST_TOKEN = guest_token_c.value  # cookie Morsel -> token string
+            else:
+                self._GUEST_TOKEN = self._download_json(
+                    self._API_BASE + 'guest/activate.json', video_id,
+                    'Downloading guest token', data=b'',
+                    headers=headers)['guest_token']
+                self._set_cookie('api.twitter.com', 'gt', self._GUEST_TOKEN, expire_time=time.time() + 3000)
+
         headers['x-guest-token'] = self._GUEST_TOKEN
         try:
             return self._download_json(
@@ -380,6 +392,12 @@ class TwitterIE(TwitterBaseIE):
 
     def _real_extract(self, url):
         twid = self._match_id(url)
+        # Download page to fetch cookies
+        self._download_webpage(url, twid)
+        config = self._call_api(
+            'videos/tweet/config/%s.json' % twid, twid
+        )
+
         status = self._call_api(
             'statuses/show/%s.json' % twid, twid, {
                 'cards_platform': 'Web-12',
@@ -389,6 +407,8 @@ class TwitterIE(TwitterBaseIE):
                 'tweet_mode': 'extended',
             })
 
+
+
         title = description = status['full_text'].replace('\n', ' ')
         # strip  'https -_t.co_BJYgOjSeGA' junk from filenames
         title = re.sub(r'\s+(https?://[^ ]+)', '', title)
@@ -447,6 +467,7 @@ class TwitterIE(TwitterBaseIE):
                 'formats': formats,
                 'thumbnails': thumbnails,
                 'duration': float_or_none(video_info.get('duration_millis'), 1000),
+                'view_count': parse_count(config.get('track', {}).get('viewCount'))
             })
         else:
             card = status.get('card')

From d9cb3c379cabd69ff9ea2e17d6690c9898322d9c Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Thu, 28 Nov 2019 11:58:41 +0200
Subject: [PATCH 09/46] support comment count for facebook.

---
 youtube_dl/extractor/facebook.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index 41f000771..234ff3e9f 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -485,6 +485,7 @@ class FacebookIE(InfoExtractor):
 
         likes_count = parse_count(self._extract_likes(webpage, tahoe_data))
         shares_count = parse_count(self._extract_meta_count(['sharecount'], webpage, tahoe_data, 'shares'))
+        comment_count = parse_count(self._extract_meta_count(['commentCount'], webpage, tahoe_data, 'shares'))
 
         info_dict = {
             'id': video_id,
@@ -500,6 +501,7 @@ class FacebookIE(InfoExtractor):
             'like_count': likes_count,
             'share_count': shares_count,
             'subtitles': subtitles,
+            'comment_count': comment_count
         }
         if uploader_id:
             info_dict['uploader_like_count'] = FacebookAjax(self, webpage, uploader_id).page_likes

From 0fb420e8b8cc5fdc8312b2cec123b63b0c6501dd Mon Sep 17 00:00:00 2001
From: Avichai Cohen <cavichai@videocites.com>
Date: Sun, 8 Dec 2019 16:17:58 +0200
Subject: [PATCH 10/46] adding another situation when login is required: when
 we see just the title in incognito. Example:
 https://www.facebook.com/thegrahamnortonshow/videos/1225192167632369

---
 youtube_dl/extractor/facebook.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index 234ff3e9f..a870eb881 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -382,7 +382,9 @@ class FacebookIE(InfoExtractor):
 
             video_data = extract_from_jsmods_instances(tahoe_js_data)
 
-        if not video_data:
+        if not video_data :
+            if self._search_regex(r'newsFeedStream.*?<h1><span class.*?>(.*?)<\/span><\/h1>', webpage, "video_title", default=None) is not None:
+                self.raise_login_required()
             raise ExtractorError('Cannot parse data')
 
         is_scheduled = '"isScheduledLive":true' in tahoe_data.secondary

From a056c99272f990c2f8f011ade1418b51ca9209a9 Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Mon, 9 Dec 2019 08:40:21 +0200
Subject: [PATCH 11/46] optimize tahoe data.

---
 youtube_dl/extractor/facebook.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index a870eb881..780308339 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -582,6 +582,7 @@ class FacebookTahoeData:
                 data=req_data,
                 headers=headers
             )
+            self._data[data_type] = data
         return '' if not data else data
 
     @property

From 31858ba37a9c31fd17ebf5ec844a5712c3e30bbf Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Fri, 13 Dec 2019 11:41:41 +0200
Subject: [PATCH 12/46] add dash manifest indication

---
 youtube_dl/extractor/youtube.py | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/youtube_dl/extractor/youtube.py b/youtube_dl/extractor/youtube.py
index b913d07a6..3228fa92c 100644
--- a/youtube_dl/extractor/youtube.py
+++ b/youtube_dl/extractor/youtube.py
@@ -1723,6 +1723,7 @@ class YoutubeIE(YoutubeBaseInfoExtractor):
 
         # Get video info
         embed_webpage = None
+        used_dash_manifest = False
         if re.search(r'player-age-gate-content">', video_webpage) is not None:
             age_gate = True
             # We simulate the access to the video from www.youtube.com/v/{video_id}
@@ -1768,7 +1769,10 @@ class YoutubeIE(YoutubeBaseInfoExtractor):
                 sts = ytplayer_config.get('sts')
                 if not player_response:
                     player_response = extract_player_response(args.get('player_response'), video_id)
+
+
             if not video_info or self._downloader.params.get('youtube_include_dash_manifest', True):
+                used_dash_manifest = True
                 add_dash_mpd_pr(player_response)
                 # We also try looking in get_video_info since it may contain different dashmpd
                 # URL that points to a DASH manifest with possibly different itag set (some itags
@@ -2459,6 +2463,7 @@ class YoutubeIE(YoutubeBaseInfoExtractor):
             'album': album,
             'release_date': release_date,
             'release_year': release_year,
+            'used_dash_manifest': used_dash_manifest
         }
 
 

From 5ebc2884c80ef9c6100af95b7933e5cbe04296a7 Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Tue, 31 Dec 2019 14:08:52 +0200
Subject: [PATCH 13/46] Add message.

---
 youtube_dl/extractor/vk.py | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/youtube_dl/extractor/vk.py b/youtube_dl/extractor/vk.py
index 880a76e24..5f8b51d51 100644
--- a/youtube_dl/extractor/vk.py
+++ b/youtube_dl/extractor/vk.py
@@ -360,6 +360,9 @@ class VKIE(VKBaseIE):
                 r'Access denied':
                 'Access denied to video %s.',
 
+                r'You need to be a member':
+                    'Access denied to video %s.',
+
                 r'Видеозапись недоступна, так как её автор был заблокирован.':
                 'Video %s is no longer available, because its author has been blocked.',
 

From c1440b8a1b2ae7ad8caa36209a89238813ff00bf Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Fri, 10 Jan 2020 15:33:20 +0200
Subject: [PATCH 14/46] add other posts views.

---
 youtube_dl/extractor/facebook.py | 330 ++++++++++++++++++++++++++++++-
 1 file changed, 329 insertions(+), 1 deletion(-)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index 780308339..ca966b150 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -485,6 +485,7 @@ class FacebookIE(InfoExtractor):
         else:
             view_count = parse_count(self._extract_meta_count(['postViewCount', 'viewCount'], webpage, tahoe_data, 'likes'))
 
+        other_posts_view_count = parse_count(self._extract_meta_count(['otherPostsViewCount'], webpage, tahoe_data, 'other_post_views'))
         likes_count = parse_count(self._extract_likes(webpage, tahoe_data))
         shares_count = parse_count(self._extract_meta_count(['sharecount'], webpage, tahoe_data, 'shares'))
         comment_count = parse_count(self._extract_meta_count(['commentCount'], webpage, tahoe_data, 'shares'))
@@ -503,7 +504,8 @@ class FacebookIE(InfoExtractor):
             'like_count': likes_count,
             'share_count': shares_count,
             'subtitles': subtitles,
-            'comment_count': comment_count
+            'comment_count': comment_count,
+            'other_posts_view_count': other_posts_view_count
         }
         if uploader_id:
             info_dict['uploader_like_count'] = FacebookAjax(self, webpage, uploader_id).page_likes
@@ -691,3 +693,329 @@ class FacebookPluginsVideoIE(InfoExtractor):
         return self.url_result(
             compat_urllib_parse_unquote(self._match_id(url)),
             FacebookIE.ie_key())
+
+
+class FacebookPhotosIE(InfoExtractor):
+    # NOTE(review): _LOGIN_URL, _CHECKPOINT_URL and _VIDEO_PAGE_TEMPLATE are read below but not defined here.
+    # The video id must be the named group 'id' because _real_extract() calls _match_id().
+    _VALID_URL = r'^https?:\/\/(?:www\.|)facebook\.com\/(.*?)\/videos\/(?P<id>[^?&\/]*)'
+    IE_NAME = 'facebook_photos'
+    _CHROME_USER_AGENT = 'Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/48.0.2564.97 Safari/537.36'
+
+    @staticmethod
+    def _extract_urls(webpage):
+        urls = []
+        for mobj in re.finditer(
+                r'<iframe[^>]+?src=(["\'])(?P<url>https?://www\.facebook\.com/(?:video/embed|plugins/video\.php).+?)\1',
+                webpage):
+            urls.append(mobj.group('url'))
+        # Facebook API embed
+        # see https://developers.facebook.com/docs/plugins/embedded-video-player
+        for mobj in re.finditer(r'''(?x)<div[^>]+
+                class=(?P<q1>[\'"])[^\'"]*\bfb-(?:video|post)\b[^\'"]*(?P=q1)[^>]+
+                data-href=(?P<q2>[\'"])(?P<url>(?:https?:)?//(?:www\.)?facebook.com/.+?)(?P=q2)''', webpage):
+            urls.append(mobj.group('url'))
+        return urls
+
+    def _login(self):
+        useremail, password = self._get_login_info()
+        if useremail is None:
+            return
+
+        login_page_req = sanitized_Request(self._LOGIN_URL)
+        self._set_cookie('facebook.com', 'locale', 'en_US')
+        login_page = self._download_webpage(login_page_req, None,
+                                            note='Downloading login page',
+                                            errnote='Unable to download login page')
+        lsd = self._search_regex(
+            r'<input type="hidden" name="lsd" value="([^"]*)"',
+            login_page, 'lsd')
+        lgnrnd = self._search_regex(r'name="lgnrnd" value="([^"]*?)"', login_page, 'lgnrnd')
+
+        login_form = {
+            'email': useremail,
+            'pass': password,
+            'lsd': lsd,
+            'lgnrnd': lgnrnd,
+            'next': 'http://facebook.com/home.php',
+            'default_persistent': '0',
+            'legacy_return': '1',
+            'timezone': '-60',
+            'trynum': '1',
+        }
+        request = sanitized_Request(self._LOGIN_URL, urlencode_postdata(login_form))
+        request.add_header('Content-Type', 'application/x-www-form-urlencoded')
+        try:
+            login_results = self._download_webpage(request, None,
+                                                   note='Logging in', errnote='unable to fetch login page')
+            if re.search(r'<form(.*)name="login"(.*)</form>', login_results) is not None:
+                error = self._html_search_regex(
+                    r'(?s)<div[^>]+class=(["\']).*?login_error_box.*?\1[^>]*><div[^>]*>.*?</div><div[^>]*>(?P<error>.+?)</div>',
+                    login_results, 'login error', default=None, group='error')
+                if error:
+                    raise ExtractorError('Unable to login: %s' % error, expected=True)
+                self._downloader.report_warning('unable to log in: bad username/password, or exceeded login rate limit (~3/min). Check credentials or wait.')
+                return
+
+            fb_dtsg = self._search_regex(
+                r'name="fb_dtsg" value="(.+?)"', login_results, 'fb_dtsg', default=None)
+            h = self._search_regex(
+                r'name="h"\s+(?:\w+="[^"]+"\s+)*?value="([^"]+)"', login_results, 'h', default=None)
+
+            if not fb_dtsg or not h:
+                return
+
+            check_form = {
+                'fb_dtsg': fb_dtsg,
+                'h': h,
+                'name_action_selected': 'dont_save',
+            }
+            check_req = sanitized_Request(self._CHECKPOINT_URL, urlencode_postdata(check_form))
+            check_req.add_header('Content-Type', 'application/x-www-form-urlencoded')
+            check_response = self._download_webpage(check_req, None,
+                                                    note='Confirming login')
+            if re.search(r'id="checkpointSubmitButton"', check_response) is not None:
+                self._downloader.report_warning('Unable to confirm login, you have to login in your browser and authorize the login.')
+        except (compat_urllib_error.URLError, compat_http_client.HTTPException, socket.error) as err:
+            self._downloader.report_warning('unable to log in: %s' % error_to_compat_str(err))
+            return
+
+    def _real_initialize(self):
+        self._login()
+
+    def _extract_from_url(self, url, video_id, fatal_if_no_video=True):
+        req = sanitized_Request(url)
+        req.add_header('User-Agent', self._CHROME_USER_AGENT)
+        webpage = self._download_webpage(req, video_id)
+
+        video_data = None
+
+        def extract_video_data(instances):
+            for item in instances:
+                if item[1][0] == 'VideoConfig':
+                    video_item = item[2][0]
+                    if video_item.get('video_id'):
+                        return video_item['videoData']
+
+        server_js_data = self._parse_json(self._search_regex(
+            r'handleServerJS\(({.+})(?:\);|,")', webpage,
+            'server js data', default='{}'), video_id, fatal=False)
+
+        if server_js_data:
+            video_data = extract_video_data(server_js_data.get('instances', []))
+
+        def extract_from_jsmods_instances(js_data):
+            if js_data:
+                return extract_video_data(try_get(
+                    js_data, lambda x: x['jsmods']['instances'], list) or [])
+
+        if not video_data:
+            server_js_data = self._parse_json(
+                self._search_regex(
+                    r'bigPipe\.onPageletArrive\(({.+?})\)\s*;\s*}\s*\)\s*,\s*["\']onPageletArrive\s+(?:pagelet_group_mall|permalink_video_pagelet|hyperfeed_story_id_\d+)',
+                    webpage, 'js data', default='{}'),
+                video_id, transform_source=js_to_json, fatal=False)
+            video_data = extract_from_jsmods_instances(server_js_data)
+
+        tahoe_data = FacebookTahoeData(self, webpage, video_id)
+        if not video_data:
+            if not fatal_if_no_video:
+                return webpage, False
+            m_msg = re.search(r'class="[^"]*uiInterstitialContent[^"]*"><div>(.*?)</div>', webpage)
+            if m_msg is not None:
+                raise ExtractorError(
+                    'The video is not available, Facebook said: "%s"' % m_msg.group(1),
+                    expected=True)
+            elif '>You must log in to continue' in webpage:
+                self.raise_login_required()
+            # Video info not in first request, do a secondary request using
+            # tahoe player specific URL
+            tahoe_js_data = self._parse_json(
+                self._search_regex(
+                    r'for\s+\(\s*;\s*;\s*\)\s*;(.+)', tahoe_data.primary,
+                    'tahoe js data', default='{}'),
+                video_id, fatal=False)
+
+            video_data = extract_from_jsmods_instances(tahoe_js_data)
+
+        if not video_data :
+            if self._search_regex(r'newsFeedStream.*?<h1><span class.*?>(.*?)<\/span><\/h1>', webpage, "video_title") is not None:
+                self.raise_login_required()
+            raise ExtractorError('Cannot parse data')
+
+        is_scheduled = '"isScheduledLive":true' in tahoe_data.secondary
+        is_live_stream = video_data[0].get('is_live_stream', False)
+        is_broadcast = video_data[0].get('is_broadcast', False)
+
+        live_status = 'not_live'
+        if is_broadcast:
+            live_status = 'completed'
+            if is_live_stream:
+                live_status = 'live'
+                if is_scheduled:
+                    live_status = 'upcoming'
+
+        is_live = live_status == 'live'
+
+        subtitles = {}
+        formats = []
+        for f in video_data:
+            format_id = f['stream_type']
+            if f and isinstance(f, dict):
+                f = [f]
+            if not f or not isinstance(f, list):
+                continue
+            for quality in ('sd', 'hd'):
+                for src_type in ('src', 'src_no_ratelimit'):
+                    src = f[0].get('%s_%s' % (quality, src_type))
+                    if src:
+                        preference = -10 if format_id == 'progressive' else 0
+                        if quality == 'hd':
+                            preference += 5
+                        formats.append({
+                            'format_id': '%s_%s_%s' % (format_id, quality, src_type),
+                            'url': src,
+                            'preference': preference,
+                        })
+            dash_manifest = f[0].get('dash_manifest')
+            if dash_manifest:
+                formats.extend(self._parse_mpd_formats(
+                    compat_etree_fromstring(compat_urllib_parse_unquote_plus(dash_manifest))))
+            subtitles_src = f[0].get('subtitles_src')
+            if subtitles_src:
+                subtitles.setdefault('en', []).append({'url': subtitles_src})
+        if not formats:
+            raise ExtractorError('Cannot find video formats')
+
+        # Downloads with browser's User-Agent are rate limited. Working around
+        # with non-browser User-Agent.
+        for f in formats:
+            f.setdefault('http_headers', {})['User-Agent'] = 'facebookexternalhit/1.1'
+
+        self._sort_formats(formats)
+
+        video_title = self._html_search_regex(
+            r'<h2\s+[^>]*class="uiHeaderTitle"[^>]*>([^<]*)</h2>', webpage,
+            'title', default=None)
+        if not video_title:
+            video_title = self._html_search_regex(
+                r'(?s)<span class="fbPhotosPhotoCaption".*?id="fbPhotoPageCaption"><span class="hasCaption">(.*?)</span>',
+                webpage, 'alternative title', default=None)
+        if not video_title:
+            video_title = self._og_search_title(webpage, default=None)
+        if not video_title:
+            video_title = self._html_search_meta(
+                'description', webpage, 'title', default=None)
+        if video_title:
+            video_title = limit_length(video_title, 80)
+        else:
+            video_title = 'Facebook video #%s' % video_id
+
+        uploader = clean_html(get_element_by_id(
+            'fbPhotoPageAuthorName', webpage)) or self._search_regex(
+            r'ownerName\s*:\s*"([^"]+)"', webpage, 'uploader',default=None) or \
+                   lowercase_escape(self._search_regex(
+                        r'\"ownerName\":"(.+?)"', tahoe_data.secondary,
+                        'uploader_id', fatal=False)) or self._og_search_title(webpage, default=None)
+
+
+        timestamp = int_or_none(self._search_regex(
+            r'data-utime=\\\"(\d+)\\\"', tahoe_data.secondary,
+            'timestamp', default=None) or self._search_regex(
+            r'<abbr[^>]+data-utime=["\'](\d+)', webpage,
+            'timestamp', default=None))
+
+        uploader_id = self._search_regex(
+            r'ownerid:"([\d]+)', webpage,
+            'uploader_id', default=None) or self._search_regex(
+            r'[\'\"]ownerid[\'\"]\s*:\s*[\'\"](\d+)[\'\"]', tahoe_data.secondary,
+            'uploader_id', fatal=False)
+
+
+        thumbnail = self._html_search_meta(['og:image', 'twitter:image'], webpage)
+        if is_live:
+            view_count = parse_count(
+                self._search_regex(r'viewerCount:([\d]+)', webpage, 'views', fatal=False) or \
+                self._search_regex(r'[\'\"]viewerCount[\'\"]\s*:\s*(\d+)', tahoe_data.primary, 'views', fatal=False)
+            )
+        else:
+            view_count = parse_count(self._extract_meta_count(['postViewCount', 'viewCount'], webpage, tahoe_data, 'likes'))
+
+        likes_count = parse_count(self._extract_likes(webpage, tahoe_data))
+        shares_count = parse_count(self._extract_meta_count(['sharecount'], webpage, tahoe_data, 'shares'))
+        comment_count = parse_count(self._extract_meta_count(['commentCount'], webpage, tahoe_data, 'shares'))
+
+        info_dict = {
+            'id': video_id,
+            'title': video_title,
+            'formats': formats,
+            'uploader': uploader,
+            'timestamp': timestamp,
+            'thumbnail': thumbnail,
+            'view_count': view_count,
+            'uploader_id': uploader_id,
+            'is_live': is_live,
+            'live_status': live_status,
+            'like_count': likes_count,
+            'share_count': shares_count,
+            'subtitles': subtitles,
+            'comment_count': comment_count
+        }
+        if uploader_id:
+            info_dict['uploader_like_count'] = FacebookAjax(self, webpage, uploader_id).page_likes
+
+        return webpage, info_dict
+
+    def _extract_meta_count(self, fields, webpage, tahoe_data, name, ):
+        value = None
+
+        for f in fields:
+            if value:
+                break
+            value = self._search_regex(
+                    r'\b%s\s*:\s*["\']([\d,.]+)' % f, webpage, name,
+                    default=None
+            )
+            if value:
+                break
+
+            value = self._search_regex(
+                r'[\'\"]%s[\'\"]\s*:\s*(\d+)' % f, tahoe_data.secondary, name,
+                default=None)
+
+        return value
+
+    def _extract_likes(self, webpage, tahoe_data):
+        values = re.findall(r'\blikecount\s*:\s*["\']([\d,.]+)', webpage)
+        if values:
+            return values[-1]
+
+
+        values = re.findall(r'[\'\"]\blikecount[\'\"]\s*:\s*(\d+)', tahoe_data.secondary)
+        if values:
+            return values[-1]
+
+    def _real_extract(self, url):
+        video_id = self._match_id(url)
+
+        real_url = self._VIDEO_PAGE_TEMPLATE % video_id if url.startswith('facebook:') else url
+        webpage, info_dict = self._extract_from_url(real_url, video_id, fatal_if_no_video=False)
+
+        if info_dict:
+            return info_dict
+
+        if '/posts/' in url:
+            entries = [
+                self.url_result('facebook:%s' % vid, FacebookIE.ie_key())
+                for vid in self._parse_json(
+                    self._search_regex(
+                        r'(["\'])video_ids\1\s*:\s*(?P<ids>\[.+?\])',
+                        webpage, 'video ids', group='ids'),
+                    video_id)]
+
+            return self.playlist_result(entries, video_id)
+        else:
+            _, info_dict = self._extract_from_url(
+                self._VIDEO_PAGE_TEMPLATE % video_id,
+                video_id, fatal_if_no_video=True)
+            return info_dict
\ No newline at end of file

From b996efcb11d4fb0181c06d3fe53b61c484f0914c Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Wed, 22 Jan 2020 23:41:49 +0200
Subject: [PATCH 15/46] .

---
 youtube_dl/extractor/youtube.py | 91 +++++++++++++++++----------------
 1 file changed, 47 insertions(+), 44 deletions(-)

diff --git a/youtube_dl/extractor/youtube.py b/youtube_dl/extractor/youtube.py
index 3228fa92c..6df7ad01f 100644
--- a/youtube_dl/extractor/youtube.py
+++ b/youtube_dl/extractor/youtube.py
@@ -2,7 +2,7 @@
 
 from __future__ import unicode_literals
 
-
+import requests
 import itertools
 import json
 import os.path
@@ -1780,50 +1780,53 @@ class YoutubeIE(YoutubeBaseInfoExtractor):
                 # manifest pointed by get_video_info's dashmpd).
                 # The general idea is to take a union of itags of both DASH manifests (for example
                 # video with such 'manifest behavior' see https://github.com/ytdl-org/youtube-dl/issues/6093)
-                self.report_video_info_webpage_download(video_id)
-                for el in ('embedded', 'detailpage', 'vevo', ''):
-                    query = {
-                        'video_id': video_id,
-                        'ps': 'default',
-                        'eurl': '',
-                        'gl': 'US',
-                        'hl': 'en',
-                    }
-                    if el:
-                        query['el'] = el
-                    if sts:
-                        query['sts'] = sts
-                    video_info_webpage = self._download_webpage(
-                        '%s://www.youtube.com/get_video_info' % proto,
-                        video_id, note=False,
-                        errnote='unable to download video info webpage',
-                        fatal=False, query=query)
-                    if not video_info_webpage:
-                        continue
-                    get_video_info = compat_parse_qs(video_info_webpage)
-                    if not player_response:
-                        pl_response = get_video_info.get('player_response', [None])[0]
-                        player_response = extract_player_response(pl_response, video_id)
-                    add_dash_mpd(get_video_info)
-                    if view_count is None:
-                        view_count = extract_view_count(get_video_info)
-                    if not video_info:
-                        video_info = get_video_info
-                    get_token = extract_token(get_video_info)
-                    if get_token:
-                        # Different get_video_info requests may report different results, e.g.
-                        # some may report video unavailability, but some may serve it without
-                        # any complaint (see https://github.com/ytdl-org/youtube-dl/issues/7362,
-                        # the original webpage as well as el=info and el=embedded get_video_info
-                        # requests report video unavailability due to geo restriction while
-                        # el=detailpage succeeds and returns valid data). This is probably
-                        # due to YouTube measures against IP ranges of hosting providers.
-                        # Working around by preferring the first succeeded video_info containing
-                        # the token if no such video_info yet was found.
-                        token = extract_token(video_info)
-                        if not token:
+                if self._downloader.params.get('youtube_extend_dash_manifest', False):
+                    self.report_video_info_webpage_download(video_id)
+                    for el in ('embedded', 'detailpage', 'vevo', ''):
+                        query = {
+                            'video_id': video_id,
+                            'ps': 'default',
+                            'eurl': '',
+                            'gl': 'US',
+                            'hl': 'en',
+                        }
+                        if el:
+                            query['el'] = el
+                        if sts:
+                            query['sts'] = sts
+                        video_info_webpage = self._download_webpage(
+                            '%s://www.youtube.com/get_video_info' % proto,
+                            video_id, note=False,
+                            errnote='unable to download video info webpage',
+                            fatal=False, query=query)
+                        if not video_info_webpage:
+                            continue
+                        get_video_info = compat_parse_qs(video_info_webpage)
+                        if not player_response:
+                            pl_response = get_video_info.get('player_response', [None])[0]
+                            player_response = extract_player_response(pl_response, video_id)
+                        add_dash_mpd(get_video_info)
+                        if view_count is None:
+                            view_count = extract_view_count(get_video_info)
+                        if not video_info:
                             video_info = get_video_info
-                        break
+                        get_token = extract_token(get_video_info)
+                        if get_token:
+                            # Different get_video_info requests may report different results, e.g.
+                            # some may report video unavailability, but some may serve it without
+                            # any complaint (see https://github.com/ytdl-org/youtube-dl/issues/7362,
+                            # the original webpage as well as el=info and el=embedded get_video_info
+                            # requests report video unavailability due to geo restriction while
+                            # el=detailpage succeeds and returns valid data). This is probably
+                            # due to YouTube measures against IP ranges of hosting providers.
+                            # Working around by preferring the first succeeded video_info containing
+                            # the token if no such video_info yet was found.
+                            token = extract_token(video_info)
+                            if not token:
+                                video_info = get_video_info
+                            break
+                else:
+                    video_info = {'title': 'Unknown'}
 
         def extract_unavailable_message():
             messages = []

From 36584f85e69ee794d5b38d8d07737516cf94662b Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Thu, 23 Jan 2020 00:02:41 +0200
Subject: [PATCH 16/46] [youtube] Check dash manifest flag with 'is True'

---
 youtube_dl/extractor/youtube.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/youtube_dl/extractor/youtube.py b/youtube_dl/extractor/youtube.py
index 6df7ad01f..c109d7310 100644
--- a/youtube_dl/extractor/youtube.py
+++ b/youtube_dl/extractor/youtube.py
@@ -1780,7 +1780,7 @@ class YoutubeIE(YoutubeBaseInfoExtractor):
                 # manifest pointed by get_video_info's dashmpd).
                 # The general idea is to take a union of itags of both DASH manifests (for example
                 # video with such 'manifest behavior' see https://github.com/ytdl-org/youtube-dl/issues/6093)
-                if self._downloader.params.get('youtube_extend_dash_manifest', False):
+                if self._downloader.params.get('youtube_extend_dash_manifest', False) is True:
                     self.report_video_info_webpage_download(video_id)
                     for el in ('embedded', 'detailpage', 'vevo', ''):
                         query = {

From 2b4552357a804e16701ca28d7790e5934cfae3db Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Thu, 23 Jan 2020 00:12:01 +0200
Subject: [PATCH 17/46] [youtube] Remove get_video_info loop

---
 youtube_dl/extractor/youtube.py | 47 +--------------------------------
 1 file changed, 1 insertion(+), 46 deletions(-)

diff --git a/youtube_dl/extractor/youtube.py b/youtube_dl/extractor/youtube.py
index c109d7310..0200cb1b8 100644
--- a/youtube_dl/extractor/youtube.py
+++ b/youtube_dl/extractor/youtube.py
@@ -1780,52 +1780,7 @@ class YoutubeIE(YoutubeBaseInfoExtractor):
                 # manifest pointed by get_video_info's dashmpd).
                 # The general idea is to take a union of itags of both DASH manifests (for example
                 # video with such 'manifest behavior' see https://github.com/ytdl-org/youtube-dl/issues/6093)
-                if self._downloader.params.get('youtube_extend_dash_manifest', False) is True:
-                    self.report_video_info_webpage_download(video_id)
-                    for el in ('embedded', 'detailpage', 'vevo', ''):
-                        query = {
-                            'video_id': video_id,
-                            'ps': 'default',
-                            'eurl': '',
-                            'gl': 'US',
-                            'hl': 'en',
-                        }
-                        if el:
-                            query['el'] = el
-                        if sts:
-                            query['sts'] = sts
-                        video_info_webpage = self._download_webpage(
-                            '%s://www.youtube.com/get_video_info' % proto,
-                            video_id, note=False,
-                            errnote='unable to download video info webpage',
-                            fatal=False, query=query)
-                        if not video_info_webpage:
-                            continue
-                        get_video_info = compat_parse_qs(video_info_webpage)
-                        if not player_response:
-                            pl_response = get_video_info.get('player_response', [None])[0]
-                            player_response = extract_player_response(pl_response, video_id)
-                        add_dash_mpd(get_video_info)
-                        if view_count is None:
-                            view_count = extract_view_count(get_video_info)
-                        if not video_info:
-                            video_info = get_video_info
-                        get_token = extract_token(get_video_info)
-                        if get_token:
-                            # Different get_video_info requests may report different results, e.g.
-                            # some may report video unavailability, but some may serve it without
-                            # any complaint (see https://github.com/ytdl-org/youtube-dl/issues/7362,
-                            # the original webpage as well as el=info and el=embedded get_video_info
-                            # requests report video unavailability due to geo restriction while
-                            # el=detailpage succeeds and returns valid data). This is probably
-                            # due to YouTube measures against IP ranges of hosting providers.
-                            # Working around by preferring the first succeeded video_info containing
-                            # the token if no such video_info yet was found.
-                            token = extract_token(video_info)
-                            if not token:
-                                video_info = get_video_info
-                            break
-                else:
+                if not video_info:
                     video_info = {'title': 'Unknown'}
 
         def extract_unavailable_message():

From 659cad81165a303f596f412328a76c28843ac61b Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Thu, 23 Jan 2020 08:25:54 +0200
Subject: [PATCH 18/46] [youtube] Re-add get_video_info loop behind flag

---
 youtube_dl/extractor/youtube.py | 47 ++++++++++++++++++++++++++++++++-
 1 file changed, 46 insertions(+), 1 deletion(-)

diff --git a/youtube_dl/extractor/youtube.py b/youtube_dl/extractor/youtube.py
index 0200cb1b8..b999b3fa5 100644
--- a/youtube_dl/extractor/youtube.py
+++ b/youtube_dl/extractor/youtube.py
@@ -1780,7 +1780,52 @@ class YoutubeIE(YoutubeBaseInfoExtractor):
                 # manifest pointed by get_video_info's dashmpd).
                 # The general idea is to take a union of itags of both DASH manifests (for example
                 # video with such 'manifest behavior' see https://github.com/ytdl-org/youtube-dl/issues/6093)
-                if not video_info:
+                if self._downloader.params.get('youtube_extend_dash_manifest', True) is True:
+                    self.report_video_info_webpage_download(video_id)
+                    for el in ('embedded', 'detailpage', 'vevo', ''):
+                        query = {
+                            'video_id': video_id,
+                            'ps': 'default',
+                            'eurl': '',
+                            'gl': 'US',
+                            'hl': 'en',
+                        }
+                        if el:
+                            query['el'] = el
+                        if sts:
+                            query['sts'] = sts
+                        video_info_webpage = self._download_webpage(
+                            '%s://www.youtube.com/get_video_info' % proto,
+                            video_id, note=False,
+                            errnote='unable to download video info webpage',
+                            fatal=False, query=query)
+                        if not video_info_webpage:
+                            continue
+                        get_video_info = compat_parse_qs(video_info_webpage)
+                        if not player_response:
+                            pl_response = get_video_info.get('player_response', [None])[0]
+                            player_response = extract_player_response(pl_response, video_id)
+                        add_dash_mpd(get_video_info)
+                        if view_count is None:
+                            view_count = extract_view_count(get_video_info)
+                        if not video_info:
+                            video_info = get_video_info
+                        get_token = extract_token(get_video_info)
+                        if get_token:
+                            # Different get_video_info requests may report different results, e.g.
+                            # some may report video unavailability, but some may serve it without
+                            # any complaint (see https://github.com/ytdl-org/youtube-dl/issues/7362,
+                            # the original webpage as well as el=info and el=embedded get_video_info
+                            # requests report video unavailability due to geo restriction while
+                            # el=detailpage succeeds and returns valid data). This is probably
+                            # due to YouTube measures against IP ranges of hosting providers.
+                            # Working around by preferring the first succeeded video_info containing
+                            # the token if no such video_info yet was found.
+                            token = extract_token(video_info)
+                            if not token:
+                                video_info = get_video_info
+                            break
+                else:
                     video_info = {'title': 'Unknown'}
 
         def extract_unavailable_message():

From 2593d5fb7b789056d927b1628ee063133076ad68 Mon Sep 17 00:00:00 2001
From: jhalvors-school <jhalvors-school@users.noreply.github.com>
Date: Sat, 22 Feb 2020 11:03:57 -0800
Subject: [PATCH 19/46] [imdb] Relax _VALID_URL (closes #23443) (#24040)

---
 youtube_dl/extractor/imdb.py | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/youtube_dl/extractor/imdb.py b/youtube_dl/extractor/imdb.py
index 436759da5..e286d5ba6 100644
--- a/youtube_dl/extractor/imdb.py
+++ b/youtube_dl/extractor/imdb.py
@@ -15,7 +15,7 @@ from ..utils import (
 class ImdbIE(InfoExtractor):
     IE_NAME = 'imdb'
     IE_DESC = 'Internet Movie Database trailers'
-    _VALID_URL = r'https?://(?:www|m)\.imdb\.com/(?:video|title|list).+?[/-]vi(?P<id>\d+)'
+    _VALID_URL = r'https?://(?:www|m)\.imdb\.com/(?:video|title|list).*?[/-]vi(?P<id>\d+)'
 
     _TESTS = [{
         'url': 'http://www.imdb.com/video/imdb/vi2524815897',
@@ -43,6 +43,9 @@ class ImdbIE(InfoExtractor):
     }, {
         'url': 'https://www.imdb.com/list/ls009921623/videoplayer/vi260482329',
         'only_matching': True,
+    }, {
+        'url': 'https://www.imdb.com/video/vi3251092761?ref_=ttvi_vi_imdb_13',
+        'only_matching': True,
     }]
 
     def _real_extract(self, url):

From ccfae40229596473153b07d81e10858528c634fe Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Sun, 1 Mar 2020 08:53:01 +0200
Subject: [PATCH 20/46] extract internal data.

---
 youtube_dl/extractor/facebook.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index ca966b150..abe5fb504 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -505,7 +505,8 @@ class FacebookIE(InfoExtractor):
             'share_count': shares_count,
             'subtitles': subtitles,
             'comment_count': comment_count,
-            'other_posts_view_count': other_posts_view_count
+            'other_posts_view_count': other_posts_view_count,
+            '_internal_data_list': [webpage, tahoe_data.primary, tahoe_data.secondary]
         }
         if uploader_id:
             info_dict['uploader_like_count'] = FacebookAjax(self, webpage, uploader_id).page_likes

From 9d190365ab5ca47ab11cd015b596efeb43420c2e Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Sun, 1 Mar 2020 08:55:54 +0200
Subject: [PATCH 21/46] [facebook] Remove FacebookPhotosIE

---
 youtube_dl/extractor/facebook.py | 326 -------------------------------
 1 file changed, 326 deletions(-)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index abe5fb504..7b30e5d52 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -694,329 +694,3 @@ class FacebookPluginsVideoIE(InfoExtractor):
         return self.url_result(
             compat_urllib_parse_unquote(self._match_id(url)),
             FacebookIE.ie_key())
-
-
-class FacebookPhotosIE(InfoExtractor):
-    _VALID_URL = r'^https?:\/\/(?:www\.|)facebook\.com\/(.*?)\/videos\/([^?&\/]*)'
-    IE_NAME = 'facebook_photos'
-
-    _CHROME_USER_AGENT = 'Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/48.0.2564.97 Safari/537.36'
-
-
-    @staticmethod
-    def _extract_urls(webpage):
-        urls = []
-        for mobj in re.finditer(
-                r'<iframe[^>]+?src=(["\'])(?P<url>https?://www\.facebook\.com/(?:video/embed|plugins/video\.php).+?)\1',
-                webpage):
-            urls.append(mobj.group('url'))
-        # Facebook API embed
-        # see https://developers.facebook.com/docs/plugins/embedded-video-player
-        for mobj in re.finditer(r'''(?x)<div[^>]+
-                class=(?P<q1>[\'"])[^\'"]*\bfb-(?:video|post)\b[^\'"]*(?P=q1)[^>]+
-                data-href=(?P<q2>[\'"])(?P<url>(?:https?:)?//(?:www\.)?facebook.com/.+?)(?P=q2)''', webpage):
-            urls.append(mobj.group('url'))
-        return urls
-
-    def _login(self):
-        useremail, password = self._get_login_info()
-        if useremail is None:
-            return
-
-        login_page_req = sanitized_Request(self._LOGIN_URL)
-        self._set_cookie('facebook.com', 'locale', 'en_US')
-        login_page = self._download_webpage(login_page_req, None,
-                                            note='Downloading login page',
-                                            errnote='Unable to download login page')
-        lsd = self._search_regex(
-            r'<input type="hidden" name="lsd" value="([^"]*)"',
-            login_page, 'lsd')
-        lgnrnd = self._search_regex(r'name="lgnrnd" value="([^"]*?)"', login_page, 'lgnrnd')
-
-        login_form = {
-            'email': useremail,
-            'pass': password,
-            'lsd': lsd,
-            'lgnrnd': lgnrnd,
-            'next': 'http://facebook.com/home.php',
-            'default_persistent': '0',
-            'legacy_return': '1',
-            'timezone': '-60',
-            'trynum': '1',
-        }
-        request = sanitized_Request(self._LOGIN_URL, urlencode_postdata(login_form))
-        request.add_header('Content-Type', 'application/x-www-form-urlencoded')
-        try:
-            login_results = self._download_webpage(request, None,
-                                                   note='Logging in', errnote='unable to fetch login page')
-            if re.search(r'<form(.*)name="login"(.*)</form>', login_results) is not None:
-                error = self._html_search_regex(
-                    r'(?s)<div[^>]+class=(["\']).*?login_error_box.*?\1[^>]*><div[^>]*>.*?</div><div[^>]*>(?P<error>.+?)</div>',
-                    login_results, 'login error', default=None, group='error')
-                if error:
-                    raise ExtractorError('Unable to login: %s' % error, expected=True)
-                self._downloader.report_warning('unable to log in: bad username/password, or exceeded login rate limit (~3/min). Check credentials or wait.')
-                return
-
-            fb_dtsg = self._search_regex(
-                r'name="fb_dtsg" value="(.+?)"', login_results, 'fb_dtsg', default=None)
-            h = self._search_regex(
-                r'name="h"\s+(?:\w+="[^"]+"\s+)*?value="([^"]+)"', login_results, 'h', default=None)
-
-            if not fb_dtsg or not h:
-                return
-
-            check_form = {
-                'fb_dtsg': fb_dtsg,
-                'h': h,
-                'name_action_selected': 'dont_save',
-            }
-            check_req = sanitized_Request(self._CHECKPOINT_URL, urlencode_postdata(check_form))
-            check_req.add_header('Content-Type', 'application/x-www-form-urlencoded')
-            check_response = self._download_webpage(check_req, None,
-                                                    note='Confirming login')
-            if re.search(r'id="checkpointSubmitButton"', check_response) is not None:
-                self._downloader.report_warning('Unable to confirm login, you have to login in your browser and authorize the login.')
-        except (compat_urllib_error.URLError, compat_http_client.HTTPException, socket.error) as err:
-            self._downloader.report_warning('unable to log in: %s' % error_to_compat_str(err))
-            return
-
-    def _real_initialize(self):
-        self._login()
-
-    def _extract_from_url(self, url, video_id, fatal_if_no_video=True):
-        req = sanitized_Request(url)
-        req.add_header('User-Agent', self._CHROME_USER_AGENT)
-        webpage = self._download_webpage(req, video_id)
-
-        video_data = None
-
-        def extract_video_data(instances):
-            for item in instances:
-                if item[1][0] == 'VideoConfig':
-                    video_item = item[2][0]
-                    if video_item.get('video_id'):
-                        return video_item['videoData']
-
-        server_js_data = self._parse_json(self._search_regex(
-            r'handleServerJS\(({.+})(?:\);|,")', webpage,
-            'server js data', default='{}'), video_id, fatal=False)
-
-        if server_js_data:
-            video_data = extract_video_data(server_js_data.get('instances', []))
-
-        def extract_from_jsmods_instances(js_data):
-            if js_data:
-                return extract_video_data(try_get(
-                    js_data, lambda x: x['jsmods']['instances'], list) or [])
-
-        if not video_data:
-            server_js_data = self._parse_json(
-                self._search_regex(
-                    r'bigPipe\.onPageletArrive\(({.+?})\)\s*;\s*}\s*\)\s*,\s*["\']onPageletArrive\s+(?:pagelet_group_mall|permalink_video_pagelet|hyperfeed_story_id_\d+)',
-                    webpage, 'js data', default='{}'),
-                video_id, transform_source=js_to_json, fatal=False)
-            video_data = extract_from_jsmods_instances(server_js_data)
-
-        tahoe_data = FacebookTahoeData(self, webpage, video_id)
-        if not video_data:
-            if not fatal_if_no_video:
-                return webpage, False
-            m_msg = re.search(r'class="[^"]*uiInterstitialContent[^"]*"><div>(.*?)</div>', webpage)
-            if m_msg is not None:
-                raise ExtractorError(
-                    'The video is not available, Facebook said: "%s"' % m_msg.group(1),
-                    expected=True)
-            elif '>You must log in to continue' in webpage:
-                self.raise_login_required()
-            # Video info not in first request, do a secondary request using
-            # tahoe player specific URL
-            tahoe_js_data = self._parse_json(
-                self._search_regex(
-                    r'for\s+\(\s*;\s*;\s*\)\s*;(.+)', tahoe_data.primary,
-                    'tahoe js data', default='{}'),
-                video_id, fatal=False)
-
-            video_data = extract_from_jsmods_instances(tahoe_js_data)
-
-        if not video_data :
-            if self._search_regex(r'newsFeedStream.*?<h1><span class.*?>(.*?)<\/span><\/h1>', webpage, "video_title") is not None:
-                self.raise_login_required()
-            raise ExtractorError('Cannot parse data')
-
-        is_scheduled = '"isScheduledLive":true' in tahoe_data.secondary
-        is_live_stream = video_data[0].get('is_live_stream', False)
-        is_broadcast = video_data[0].get('is_broadcast', False)
-
-        live_status = 'not_live'
-        if is_broadcast:
-            live_status = 'completed'
-            if is_live_stream:
-                live_status = 'live'
-                if is_scheduled:
-                    live_status = 'upcoming'
-
-        is_live = live_status == 'live'
-
-        subtitles = {}
-        formats = []
-        for f in video_data:
-            format_id = f['stream_type']
-            if f and isinstance(f, dict):
-                f = [f]
-            if not f or not isinstance(f, list):
-                continue
-            for quality in ('sd', 'hd'):
-                for src_type in ('src', 'src_no_ratelimit'):
-                    src = f[0].get('%s_%s' % (quality, src_type))
-                    if src:
-                        preference = -10 if format_id == 'progressive' else 0
-                        if quality == 'hd':
-                            preference += 5
-                        formats.append({
-                            'format_id': '%s_%s_%s' % (format_id, quality, src_type),
-                            'url': src,
-                            'preference': preference,
-                        })
-            dash_manifest = f[0].get('dash_manifest')
-            if dash_manifest:
-                formats.extend(self._parse_mpd_formats(
-                    compat_etree_fromstring(compat_urllib_parse_unquote_plus(dash_manifest))))
-            subtitles_src = f[0].get('subtitles_src')
-            if subtitles_src:
-                subtitles.setdefault('en', []).append({'url': subtitles_src})
-        if not formats:
-            raise ExtractorError('Cannot find video formats')
-
-        # Downloads with browser's User-Agent are rate limited. Working around
-        # with non-browser User-Agent.
-        for f in formats:
-            f.setdefault('http_headers', {})['User-Agent'] = 'facebookexternalhit/1.1'
-
-        self._sort_formats(formats)
-
-        video_title = self._html_search_regex(
-            r'<h2\s+[^>]*class="uiHeaderTitle"[^>]*>([^<]*)</h2>', webpage,
-            'title', default=None)
-        if not video_title:
-            video_title = self._html_search_regex(
-                r'(?s)<span class="fbPhotosPhotoCaption".*?id="fbPhotoPageCaption"><span class="hasCaption">(.*?)</span>',
-                webpage, 'alternative title', default=None)
-        if not video_title:
-            video_title = self._og_search_title(webpage, default=None)
-        if not video_title:
-            video_title = self._html_search_meta(
-                'description', webpage, 'title', default=None)
-        if video_title:
-            video_title = limit_length(video_title, 80)
-        else:
-            video_title = 'Facebook video #%s' % video_id
-
-        uploader = clean_html(get_element_by_id(
-            'fbPhotoPageAuthorName', webpage)) or self._search_regex(
-            r'ownerName\s*:\s*"([^"]+)"', webpage, 'uploader',default=None) or \
-                   lowercase_escape(self._search_regex(
-                        r'\"ownerName\":"(.+?)"', tahoe_data.secondary,
-                        'uploader_id', fatal=False)) or self._og_search_title(webpage, default=None)
-
-
-        timestamp = int_or_none(self._search_regex(
-            r'data-utime=\\\"(\d+)\\\"', tahoe_data.secondary,
-            'timestamp', default=None) or self._search_regex(
-            r'<abbr[^>]+data-utime=["\'](\d+)', webpage,
-            'timestamp', default=None))
-
-        uploader_id = self._search_regex(
-            r'ownerid:"([\d]+)', webpage,
-            'uploader_id', default=None) or self._search_regex(
-            r'[\'\"]ownerid[\'\"]\s*:\s*[\'\"](\d+)[\'\"]', tahoe_data.secondary,
-            'uploader_id', fatal=False)
-
-
-        thumbnail = self._html_search_meta(['og:image', 'twitter:image'], webpage)
-        if is_live:
-            view_count = parse_count(
-                self._search_regex(r'viewerCount:([\d]+)', webpage, 'views', fatal=False) or \
-                self._search_regex(r'[\'\"]viewerCount[\'\"]\s*:\s*(\d+)', tahoe_data.primary, 'views', fatal=False)
-            )
-        else:
-            view_count = parse_count(self._extract_meta_count(['postViewCount', 'viewCount'], webpage, tahoe_data, 'likes'))
-
-        likes_count = parse_count(self._extract_likes(webpage, tahoe_data))
-        shares_count = parse_count(self._extract_meta_count(['sharecount'], webpage, tahoe_data, 'shares'))
-        comment_count = parse_count(self._extract_meta_count(['commentCount'], webpage, tahoe_data, 'shares'))
-
-        info_dict = {
-            'id': video_id,
-            'title': video_title,
-            'formats': formats,
-            'uploader': uploader,
-            'timestamp': timestamp,
-            'thumbnail': thumbnail,
-            'view_count': view_count,
-            'uploader_id': uploader_id,
-            'is_live': is_live,
-            'live_status': live_status,
-            'like_count': likes_count,
-            'share_count': shares_count,
-            'subtitles': subtitles,
-            'comment_count': comment_count
-        }
-        if uploader_id:
-            info_dict['uploader_like_count'] = FacebookAjax(self, webpage, uploader_id).page_likes
-
-        return webpage, info_dict
-
-    def _extract_meta_count(self, fields, webpage, tahoe_data, name, ):
-        value = None
-
-        for f in fields:
-            if value:
-                break
-            value = self._search_regex(
-                    r'\b%s\s*:\s*["\']([\d,.]+)' % f, webpage, name,
-                    default=None
-            )
-            if value:
-                break
-
-            value = self._search_regex(
-                r'[\'\"]%s[\'\"]\s*:\s*(\d+)' % f, tahoe_data.secondary, name,
-                default=None)
-
-        return value
-
-    def _extract_likes(self, webpage, tahoe_data):
-        values = re.findall(r'\blikecount\s*:\s*["\']([\d,.]+)', webpage)
-        if values:
-            return values[-1]
-
-
-        values = re.findall(r'[\'\"]\blikecount[\'\"]\s*:\s*(\d+)', tahoe_data.secondary)
-        if values:
-            return values[-1]
-
-    def _real_extract(self, url):
-        video_id = self._match_id(url)
-
-        real_url = self._VIDEO_PAGE_TEMPLATE % video_id if url.startswith('facebook:') else url
-        webpage, info_dict = self._extract_from_url(real_url, video_id, fatal_if_no_video=False)
-
-        if info_dict:
-            return info_dict
-
-        if '/posts/' in url:
-            entries = [
-                self.url_result('facebook:%s' % vid, FacebookIE.ie_key())
-                for vid in self._parse_json(
-                    self._search_regex(
-                        r'(["\'])video_ids\1\s*:\s*(?P<ids>\[.+?\])',
-                        webpage, 'video ids', group='ids'),
-                    video_id)]
-
-            return self.playlist_result(entries, video_id)
-        else:
-            _, info_dict = self._extract_from_url(
-                self._VIDEO_PAGE_TEMPLATE % video_id,
-                video_id, fatal_if_no_video=True)
-            return info_dict
\ No newline at end of file

From cac71916f76100513ce80b1772ace692711604c4 Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Sun, 1 Mar 2020 09:01:39 +0200
Subject: [PATCH 22/46] [facebook] Turn _internal_data_list into a dict

---
 youtube_dl/extractor/facebook.py | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index 7b30e5d52..96e303c00 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -506,7 +506,10 @@ class FacebookIE(InfoExtractor):
             'subtitles': subtitles,
             'comment_count': comment_count,
             'other_posts_view_count': other_posts_view_count,
-            '_internal_data_list': [webpage, tahoe_data.primary, tahoe_data.secondary]
+            '_internal_data': {
+                'page': webpage,
+                'api_response_list': [tahoe_data.primary, tahoe_data.secondary]
+            }
         }
         if uploader_id:
             info_dict['uploader_like_count'] = FacebookAjax(self, webpage, uploader_id).page_likes

From 68e71dfc24a2e316def073dce0b7928e183cefd2 Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Tue, 10 Mar 2020 15:41:17 +0200
Subject: [PATCH 23/46] [facebook] Skip lowercase_escape on missing ownerName

---
 youtube_dl/extractor/facebook.py | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index 96e303c00..0160b5a9d 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -455,10 +455,14 @@ class FacebookIE(InfoExtractor):
         else:
             video_title = 'Facebook video #%s' % video_id
 
+        def _lowercase_escape(s):
+            if s:
+                return lowercase_escape(s)
+
         uploader = clean_html(get_element_by_id(
             'fbPhotoPageAuthorName', webpage)) or self._search_regex(
             r'ownerName\s*:\s*"([^"]+)"', webpage, 'uploader',default=None) or \
-                   lowercase_escape(self._search_regex(
+                   _lowercase_escape(self._search_regex(
                         r'\"ownerName\":"(.+?)"', tahoe_data.secondary,
                         'uploader_id', fatal=False)) or self._og_search_title(webpage, default=None)
 

From b8c508587817ac1f22a3af57036244ed03a2938e Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Tue, 10 Mar 2020 17:23:21 +0200
Subject: [PATCH 24/46] [facebook] Remove uploader extraction

---
 youtube_dl/extractor/facebook.py | 11 -----------
 1 file changed, 11 deletions(-)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index 0160b5a9d..49b586cf6 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -455,17 +455,6 @@ class FacebookIE(InfoExtractor):
         else:
             video_title = 'Facebook video #%s' % video_id
 
-        def _lowercase_escape(s):
-            if s:
-                return lowercase_escape(s)
-
-        uploader = clean_html(get_element_by_id(
-            'fbPhotoPageAuthorName', webpage)) or self._search_regex(
-            r'ownerName\s*:\s*"([^"]+)"', webpage, 'uploader',default=None) or \
-                   _lowercase_escape(self._search_regex(
-                        r'\"ownerName\":"(.+?)"', tahoe_data.secondary,
-                        'uploader_id', fatal=False)) or self._og_search_title(webpage, default=None)
-
 
         timestamp = int_or_none(self._search_regex(
             r'data-utime=\\\"(\d+)\\\"', tahoe_data.secondary,

From 75f904e579ba04a03199499800eb6d1b31832621 Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Tue, 10 Mar 2020 17:23:40 +0200
Subject: [PATCH 25/46] [facebook] Restore uploader extraction

---
 youtube_dl/extractor/facebook.py | 13 ++++++++++++-
 1 file changed, 12 insertions(+), 1 deletion(-)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index 49b586cf6..8df46ff54 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -455,7 +455,18 @@ class FacebookIE(InfoExtractor):
         else:
             video_title = 'Facebook video #%s' % video_id
 
-
+        def _lowercase_escape(s):
+            if s:
+                return lowercase_escape(s)
+
+
+        uploader = clean_html(get_element_by_id(
+            'fbPhotoPageAuthorName', webpage)) or self._search_regex(
+            r'ownerName\s*:\s*"([^"]+)"', webpage, 'uploader',default=None) or \
+                   _lowercase_escape(self._search_regex(
+                        r'\"ownerName\":"(.+?)"', tahoe_data.secondary,
+                        'uploader_id', fatal=False)) or self._og_search_title(webpage, default=None)
+        
         timestamp = int_or_none(self._search_regex(
             r'data-utime=\\\"(\d+)\\\"', tahoe_data.secondary,
             'timestamp', default=None) or self._search_regex(

From 5dadd9c357f252689cd0d8fe2454776ed3474d22 Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Tue, 10 Mar 2020 23:52:01 +0200
Subject: [PATCH 26/46] add page id.

---
 youtube_dl/extractor/facebook.py | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index 8df46ff54..996711ab4 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -466,7 +466,7 @@ class FacebookIE(InfoExtractor):
                    _lowercase_escape(self._search_regex(
                         r'\"ownerName\":"(.+?)"', tahoe_data.secondary,
                         'uploader_id', fatal=False)) or self._og_search_title(webpage, default=None)
-        
+
         timestamp = int_or_none(self._search_regex(
             r'data-utime=\\\"(\d+)\\\"', tahoe_data.secondary,
             'timestamp', default=None) or self._search_regex(
@@ -477,7 +477,8 @@ class FacebookIE(InfoExtractor):
             r'ownerid:"([\d]+)', webpage,
             'uploader_id', default=None) or self._search_regex(
             r'[\'\"]ownerid[\'\"]\s*:\s*[\'\"](\d+)[\'\"]', tahoe_data.secondary,
-            'uploader_id', fatal=False)
+            'uploader_id', default=None) or \
+            self._search_regex(r'\\\"page_id\\\"\s*:\s*\\\"(\d+)\\\"', tahoe_data.secondary, 'uploader_id', fatal=False)
 
 
         thumbnail = self._html_search_meta(['og:image', 'twitter:image'], webpage)

From 7c9a677d98dbabc928647ea2f2c7cab2c7087223 Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Wed, 11 Mar 2020 00:18:08 +0200
Subject: [PATCH 27/46] fix timestamp.

---
 youtube_dl/extractor/facebook.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index 996711ab4..078f4f3dc 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -468,6 +468,8 @@ class FacebookIE(InfoExtractor):
                         'uploader_id', fatal=False)) or self._og_search_title(webpage, default=None)
 
         timestamp = int_or_none(self._search_regex(
+            r'\\\"timestamp\\\":([\d]+)', tahoe_data.secondary,
+            'timestamp', default=None)) or int_or_none(self._search_regex(
             r'data-utime=\\\"(\d+)\\\"', tahoe_data.secondary,
             'timestamp', default=None) or self._search_regex(
             r'<abbr[^>]+data-utime=["\'](\d+)', webpage,

From 9549c3a016f0f55ef57ebf644c17facad23eda8b Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Wed, 11 Mar 2020 08:42:31 +0200
Subject: [PATCH 28/46] fix date

---
 youtube_dl/extractor/facebook.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index 078f4f3dc..f88795ba2 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -468,11 +468,11 @@ class FacebookIE(InfoExtractor):
                         'uploader_id', fatal=False)) or self._og_search_title(webpage, default=None)
 
         timestamp = int_or_none(self._search_regex(
-            r'\\\"timestamp\\\":([\d]+)', tahoe_data.secondary,
-            'timestamp', default=None)) or int_or_none(self._search_regex(
             r'data-utime=\\\"(\d+)\\\"', tahoe_data.secondary,
             'timestamp', default=None) or self._search_regex(
             r'<abbr[^>]+data-utime=["\'](\d+)', webpage,
+            'timestamp', default=None)) or int_or_none(self._search_regex(
+            r'publish_time&quot;:([\d]+)', webpage,
             'timestamp', default=None))
 
         uploader_id = self._search_regex(

From 1f52df87c3e6d668385652a32070a07cd4075153 Mon Sep 17 00:00:00 2001
From: Avichai <cavichai@videocites.com>
Date: Wed, 11 Mar 2020 18:46:58 +0200
Subject: [PATCH 29/46] adding another option for extracting uploader

---
 youtube_dl/extractor/facebook.py | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index f88795ba2..00b899c73 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -460,12 +460,12 @@ class FacebookIE(InfoExtractor):
                 return lowercase_escape(s)
 
 
-        uploader = clean_html(get_element_by_id(
-            'fbPhotoPageAuthorName', webpage)) or self._search_regex(
-            r'ownerName\s*:\s*"([^"]+)"', webpage, 'uploader',default=None) or \
-                   _lowercase_escape(self._search_regex(
-                        r'\"ownerName\":"(.+?)"', tahoe_data.secondary,
-                        'uploader_id', fatal=False)) or self._og_search_title(webpage, default=None)
+        uploader = clean_html(get_element_by_id('fbPhotoPageAuthorName', webpage)) or \
+                   self._search_regex(r'ownerName\s*:\s*"([^"]+)"', webpage, 'uploader',default=None) or \
+                   _lowercase_escape(self._search_regex(r'\"ownerName\":"(.+?)"', tahoe_data.secondary, 'uploader_id', fatal=False)) or \
+                   self._search_regex(r'ownerName"\s*:\s*"([^"]+)"', webpage, 'uploader', default=None) or \
+                   self._og_search_title(webpage, default=None)
+
 
         timestamp = int_or_none(self._search_regex(
             r'data-utime=\\\"(\d+)\\\"', tahoe_data.secondary,

From 2b594af6f02b9ec7bdd00b61322557f27ee3a67d Mon Sep 17 00:00:00 2001
From: Avichai <cavichai@videocites.com>
Date: Wed, 11 Mar 2020 18:48:24 +0200
Subject: [PATCH 30/46] adding option for views extraction

---
 youtube_dl/extractor/facebook.py | 11 ++++++++++-
 1 file changed, 10 insertions(+), 1 deletion(-)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index 00b899c73..228e96690 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -490,7 +490,7 @@ class FacebookIE(InfoExtractor):
                 self._search_regex(r'[\'\"]viewerCount[\'\"]\s*:\s*(\d+)', tahoe_data.primary, 'views', fatal=False)
             )
         else:
-            view_count = parse_count(self._extract_meta_count(['postViewCount', 'viewCount'], webpage, tahoe_data, 'likes'))
+            view_count = parse_count(self._extract_views(webpage, tahoe_data))
 
         other_posts_view_count = parse_count(self._extract_meta_count(['otherPostsViewCount'], webpage, tahoe_data, 'other_post_views'))
         likes_count = parse_count(self._extract_likes(webpage, tahoe_data))
@@ -552,6 +552,15 @@ class FacebookIE(InfoExtractor):
         if values:
             return values[-1]
 
+    def _extract_views(self, webpage, tahoe_data):
+        value = self._extract_meta_count(['postViewCount', 'viewCount'], webpage, tahoe_data, 'likes')
+        if value:
+            return value
+
+        values = re.findall(r'(\d+\w?) Views', tahoe_data.secondary)
+        if values:
+            return values[-1]
+
     def _real_extract(self, url):
         video_id = self._match_id(url)
 

From e23f867b398022db44f1c30da394332e4b6435bd Mon Sep 17 00:00:00 2001
From: Avichai <cavichai@videocites.com>
Date: Wed, 11 Mar 2020 18:49:08 +0200
Subject: [PATCH 31/46] adding option for likes extraction

---
 youtube_dl/extractor/facebook.py | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index 228e96690..b41c040dc 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -552,6 +552,10 @@ class FacebookIE(InfoExtractor):
         if values:
             return values[-1]
 
+        values = re.findall(r'"reaction_count"\s*:\s*{\s*"count"\s*:\s*(\d+)', tahoe_data.secondary)
+        if values:
+            return values[-1]
+
     def _extract_views(self, webpage, tahoe_data):
         value = self._extract_meta_count(['postViewCount', 'viewCount'], webpage, tahoe_data, 'likes')
         if value:

From 056baf9e9fa0f3d1fa5631415873cfacf6b49a7e Mon Sep 17 00:00:00 2001
From: Avichai <cavichai@videocites.com>
Date: Wed, 11 Mar 2020 18:50:13 +0200
Subject: [PATCH 32/46] adding option to shares extraction

---
 youtube_dl/extractor/facebook.py | 11 ++++++++++-
 1 file changed, 10 insertions(+), 1 deletion(-)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index b41c040dc..4fe9bd01a 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -494,8 +494,8 @@ class FacebookIE(InfoExtractor):
 
         other_posts_view_count = parse_count(self._extract_meta_count(['otherPostsViewCount'], webpage, tahoe_data, 'other_post_views'))
         likes_count = parse_count(self._extract_likes(webpage, tahoe_data))
-        shares_count = parse_count(self._extract_meta_count(['sharecount'], webpage, tahoe_data, 'shares'))
         comment_count = parse_count(self._extract_meta_count(['commentCount'], webpage, tahoe_data, 'shares'))
+        shares_count = parse_count(self._extract_shares(webpage, tahoe_data))
 
         info_dict = {
             'id': video_id,
@@ -556,6 +556,15 @@ class FacebookIE(InfoExtractor):
         if values:
             return values[-1]
 
+    def _extract_shares(self, webpage, tahoe_data):
+        value = self._extract_meta_count(['sharecount'], webpage, tahoe_data, 'shares')
+        if value:
+            return value
+        a = r'(\d+\w) Views'
+        values = re.findall(r'"share_count"\s*:\s*{\s*"count"\s*:\s*(\d+)', tahoe_data.secondary)
+        if values:
+            return values[-1]
+
     def _extract_views(self, webpage, tahoe_data):
         value = self._extract_meta_count(['postViewCount', 'viewCount'], webpage, tahoe_data, 'likes')
         if value:

From d003505adc94f3fb4101baecd3d1a87128437ba7 Mon Sep 17 00:00:00 2001
From: Avichai <cavichai@videocites.com>
Date: Wed, 11 Mar 2020 18:50:42 +0200
Subject: [PATCH 33/46] adding option to extract comments count

---
 youtube_dl/extractor/facebook.py | 13 ++++++++++---
 1 file changed, 10 insertions(+), 3 deletions(-)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index 4fe9bd01a..2eb43fa65 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -494,8 +494,8 @@ class FacebookIE(InfoExtractor):
 
         other_posts_view_count = parse_count(self._extract_meta_count(['otherPostsViewCount'], webpage, tahoe_data, 'other_post_views'))
         likes_count = parse_count(self._extract_likes(webpage, tahoe_data))
-        comment_count = parse_count(self._extract_meta_count(['commentCount'], webpage, tahoe_data, 'shares'))
         shares_count = parse_count(self._extract_shares(webpage, tahoe_data))
+        comment_count = parse_count(self._extract_comments_count(webpage, tahoe_data))
 
         info_dict = {
             'id': video_id,
@@ -547,7 +547,6 @@ class FacebookIE(InfoExtractor):
         if values:
             return values[-1]
 
-
         values = re.findall(r'[\'\"]\blikecount[\'\"]\s*:\s*(\d+)', tahoe_data.secondary)
         if values:
             return values[-1]
@@ -565,6 +564,15 @@ class FacebookIE(InfoExtractor):
         if values:
             return values[-1]
 
+    def _extract_comments_count(self, webpage, tahoe_data):
+        value = self._extract_meta_count(['commentCount'], webpage, tahoe_data, 'comment_count')
+        if value:
+            return value
+
+        values = re.findall(r'Comments\s\((\d+)', tahoe_data.secondary)
+        if values:
+            return values[-1]
+
     def _extract_views(self, webpage, tahoe_data):
         value = self._extract_meta_count(['postViewCount', 'viewCount'], webpage, tahoe_data, 'likes')
         if value:
@@ -599,7 +607,6 @@ class FacebookIE(InfoExtractor):
                 video_id, fatal_if_no_video=True)
             return info_dict
 
-
 class FacebookTahoeData:
     def __init__(self, extractor, page, video_id):
         self._page = page

From 3a3645e6f271c96a3b70683d8a4d31547b85594c Mon Sep 17 00:00:00 2001
From: Avichai <cavichai@videocites.com>
Date: Wed, 18 Mar 2020 12:14:42 +0200
Subject: [PATCH 34/46] fixing missing video-title

---
 youtube_dl/extractor/facebook.py | 41 +++++++++++++++++++-------------
 1 file changed, 25 insertions(+), 16 deletions(-)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index 2eb43fa65..3fc7bd563 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -438,22 +438,7 @@ class FacebookIE(InfoExtractor):
 
         self._sort_formats(formats)
 
-        video_title = self._html_search_regex(
-            r'<h2\s+[^>]*class="uiHeaderTitle"[^>]*>([^<]*)</h2>', webpage,
-            'title', default=None)
-        if not video_title:
-            video_title = self._html_search_regex(
-                r'(?s)<span class="fbPhotosPhotoCaption".*?id="fbPhotoPageCaption"><span class="hasCaption">(.*?)</span>',
-                webpage, 'alternative title', default=None)
-        if not video_title:
-            video_title = self._og_search_title(webpage, default=None)
-        if not video_title:
-            video_title = self._html_search_meta(
-                'description', webpage, 'title', default=None)
-        if video_title:
-            video_title = limit_length(video_title, 80)
-        else:
-            video_title = 'Facebook video #%s' % video_id
+        video_title = self._extract_video_title(webpage, tahoe_data, video_id)
 
         def _lowercase_escape(s):
             if s:
@@ -607,6 +592,30 @@ class FacebookIE(InfoExtractor):
                 video_id, fatal_if_no_video=True)
             return info_dict
 
+    def _extract_video_title(self, webpage, tahoe_data, video_id):
+        video_title = self._html_search_regex(
+            r'<h2\s+[^>]*class="uiHeaderTitle"[^>]*>([^<]*)</h2>', webpage,
+            'title', default=None)
+        if not video_title:
+            video_title = self._html_search_regex(
+                r'(?s)<span class="fbPhotosPhotoCaption".*?id="fbPhotoPageCaption"><span class="hasCaption">(.*?)</span>',
+                webpage, 'alternative title', default=None)
+        if not video_title:
+            video_title = self._og_search_title(webpage, default=None)
+        if not video_title:
+            video_title = self._html_search_meta(
+                'description', webpage, 'title', default=None)
+        if not video_title:
+            values = re.findall(r'videoTitle"\s*:\s*"(.*?)"', tahoe_data.secondary)
+            if values:
+                video_title = values[-1]
+        if video_title:
+            video_title = limit_length(video_title, 80)
+        else:
+            video_title = 'Facebook video #%s' % video_id
+        return video_title
+
+
 class FacebookTahoeData:
     def __init__(self, extractor, page, video_id):
         self._page = page

From 615f63bb83891a1b31b73447db907a0ad6752b19 Mon Sep 17 00:00:00 2001
From: Avichai <cavichai@videocites.com>
Date: Wed, 18 Mar 2020 13:20:29 +0200
Subject: [PATCH 35/46] fix twitch thumbnail bug

---
 youtube_dl/extractor/twitch.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/youtube_dl/extractor/twitch.py b/youtube_dl/extractor/twitch.py
index 0db2dca41..1452df419 100644
--- a/youtube_dl/extractor/twitch.py
+++ b/youtube_dl/extractor/twitch.py
@@ -617,7 +617,7 @@ class TwitchStreamIE(TwitchBaseIE):
 
         thumbnails = []
         for thumbnail_key, thumbnail_url in stream['preview'].items():
-            m = re.search(r'(?P<width>\d+)x(?P<height>\d+)\.jpg$', thumbnail_key)
+            m = re.search(r'(?P<width>\d+)x(?P<height>\d+)\.jpg$', thumbnail_url)
             if not m:
                 continue
             thumbnails.append({

From 079235e6d9b0a571b0ccdbd13fb9d4393bf03a96 Mon Sep 17 00:00:00 2001
From: Avichai <cavichai@videocites.com>
Date: Thu, 19 Mar 2020 13:28:38 +0200
Subject: [PATCH 36/46] adding uploader_like_count to twitch

---
 youtube_dl/extractor/twitch.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/youtube_dl/extractor/twitch.py b/youtube_dl/extractor/twitch.py
index 1452df419..d3833fbc7 100644
--- a/youtube_dl/extractor/twitch.py
+++ b/youtube_dl/extractor/twitch.py
@@ -638,6 +638,7 @@ class TwitchStreamIE(TwitchBaseIE):
             'view_count': view_count,
             'formats': formats,
             'is_live': True,
+            'uploader_like_count': stream.get('channel',{}).get('followers')
         }
 
 

From 37df22f24a4e2744ec178e95e6880042ba071326 Mon Sep 17 00:00:00 2001
From: Avichai <cavichai@videocites.com>
Date: Thu, 19 Mar 2020 19:31:18 +0200
Subject: [PATCH 37/46] adding uploader_like_count and description to VOD
 twitch video

---
 youtube_dl/extractor/twitch.py | 11 +++++++++++
 1 file changed, 11 insertions(+)

diff --git a/youtube_dl/extractor/twitch.py b/youtube_dl/extractor/twitch.py
index d3833fbc7..f933cdcea 100644
--- a/youtube_dl/extractor/twitch.py
+++ b/youtube_dl/extractor/twitch.py
@@ -349,6 +349,17 @@ class TwitchVodIE(TwitchItemBaseIE):
                     'ext': 'json',
                 }],
             }
+        channel_id = info['uploader_id']
+        channel = self._call_api(
+            'kraken/channels/%s' % channel_id,
+            channel_id, 'Downloading channel info JSON')
+
+        info['uploader_like_count'] = channel.get('followers')
+
+        description = info['description']
+        if description is None:
+            description = channel.get('status')
+        info['description'] = description
 
         return info
 

From a965e5a0417a4b49a66d9f9deeed9734271f743e Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Sun, 22 Mar 2020 18:21:34 +0200
Subject: [PATCH 38/46] update facebook user agent.

---
 youtube_dl/extractor/facebook.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index 3fc7bd563..4234e7a1a 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -57,7 +57,7 @@ class FacebookIE(InfoExtractor):
     _NETRC_MACHINE = 'facebook'
     IE_NAME = 'facebook'
 
-    _CHROME_USER_AGENT = 'Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/48.0.2564.97 Safari/537.36'
+    _CHROME_USER_AGENT = 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/80.0.3987.132 Safari/537.36'
 
     _VIDEO_PAGE_TEMPLATE = 'https://www.facebook.com/video/video.php?v=%s'
     _VIDEO_PAGE_TAHOE_TEMPLATE = 'https://www.facebook.com/video/tahoe/async/%s/?chain=true&isvideo=true&payloadtype=%s'

From 0c0cab39e9793850ed105bb89ae4942f0f76ab58 Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Tue, 31 Mar 2020 17:32:15 +0300
Subject: [PATCH 39/46] add uploader handle.

---
 youtube_dl/extractor/facebook.py | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index 4234e7a1a..802547337 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -482,6 +482,9 @@ class FacebookIE(InfoExtractor):
         shares_count = parse_count(self._extract_shares(webpage, tahoe_data))
         comment_count = parse_count(self._extract_comments_count(webpage, tahoe_data))
 
+        uploader_handle = self._search_regex(r'"video_path":"\\\/([^\/]+)\\\/', tahoe_data.primary, 'uploader_handle', fatal=False)
+        if uploader_handle:
+            uploader_handle = uploader_handle.lower()
         info_dict = {
             'id': video_id,
             'title': video_title,
@@ -498,6 +501,7 @@ class FacebookIE(InfoExtractor):
             'subtitles': subtitles,
             'comment_count': comment_count,
             'other_posts_view_count': other_posts_view_count,
+            'uploader_handle': uploader_handle,
             '_internal_data': {
                 'page': webpage,
                 'api_response_list': [tahoe_data.primary, tahoe_data.secondary]

From 6d29af9b1a0800d8489b1d7d9cb997106fbb7e6c Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Sergey=20M=E2=80=A4?= <dstftw@gmail.com>
Date: Sun, 5 Apr 2020 21:27:36 +0700
Subject: [PATCH 40/46] [mofosex] Add support for generic embeds (closes
 #24633)

---
 youtube_dl/extractor/extractors.py |  5 ++++-
 youtube_dl/extractor/generic.py    |  6 ++++++
 youtube_dl/extractor/mofosex.py    | 24 ++++++++++++++++++++++++
 3 files changed, 34 insertions(+), 1 deletion(-)

diff --git a/youtube_dl/extractor/extractors.py b/youtube_dl/extractor/extractors.py
index ef803b8a7..e407ab3d9 100644
--- a/youtube_dl/extractor/extractors.py
+++ b/youtube_dl/extractor/extractors.py
@@ -636,7 +636,10 @@ from .mixcloud import (
 from .mlb import MLBIE
 from .mnet import MnetIE
 from .moevideo import MoeVideoIE
-from .mofosex import MofosexIE
+from .mofosex import (
+    MofosexIE,
+    MofosexEmbedIE,
+)
 from .mojvideo import MojvideoIE
 from .morningstar import MorningstarIE
 from .motherless import (
diff --git a/youtube_dl/extractor/generic.py b/youtube_dl/extractor/generic.py
index 0ada6354e..ce8252f6a 100644
--- a/youtube_dl/extractor/generic.py
+++ b/youtube_dl/extractor/generic.py
@@ -60,6 +60,7 @@ from .tnaflix import TNAFlixNetworkEmbedIE
 from .drtuber import DrTuberIE
 from .redtube import RedTubeIE
 from .tube8 import Tube8IE
+from .mofosex import MofosexEmbedIE
 from .spankwire import SpankwireIE
 from .youporn import YouPornIE
 from .vimeo import VimeoIE
@@ -2717,6 +2718,11 @@ class GenericIE(InfoExtractor):
         if tube8_urls:
             return self.playlist_from_matches(tube8_urls, video_id, video_title, ie=Tube8IE.ie_key())
 
+        # Look for embedded Mofosex player
+        mofosex_urls = MofosexEmbedIE._extract_urls(webpage)
+        if mofosex_urls:
+            return self.playlist_from_matches(mofosex_urls, video_id, video_title, ie=MofosexEmbedIE.ie_key())
+
         # Look for embedded Spankwire player
         spankwire_urls = SpankwireIE._extract_urls(webpage)
         if spankwire_urls:
diff --git a/youtube_dl/extractor/mofosex.py b/youtube_dl/extractor/mofosex.py
index 1c652813a..3f2b87c42 100644
--- a/youtube_dl/extractor/mofosex.py
+++ b/youtube_dl/extractor/mofosex.py
@@ -1,5 +1,8 @@
 from __future__ import unicode_literals
 
+import re
+
+from .common import InfoExtractor
 from ..utils import (
     int_or_none,
     str_to_int,
@@ -54,3 +57,24 @@ class MofosexIE(KeezMoviesIE):
         })
 
         return info
+
+
+class MofosexEmbedIE(InfoExtractor):
+    _VALID_URL = r'https?://(?:www\.)?mofosex\.com/embed/?\?.*?\bvideoid=(?P<id>\d+)'
+    _TESTS = [{
+        'url': 'https://www.mofosex.com/embed/?videoid=318131&referrer=KM',
+        'only_matching': True,
+    }]
+
+    @staticmethod
+    def _extract_urls(webpage):
+        return re.findall(
+            r'<iframe[^>]+\bsrc=["\']((?:https?:)?//(?:www\.)?mofosex\.com/embed/?\?.*?\bvideoid=\d+)',
+            webpage)
+
+    def _real_extract(self, url):
+        video_id = self._match_id(url)
+        return self.url_result(
+            'http://www.mofosex.com/videos/{0}/{0}.html'.format(video_id),
+            ie=MofosexIE.ie_key(), video_id=video_id)
+

From 88081b0795d4f222bfe612a47fad83e8fecc06c3 Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Sun, 5 Apr 2020 17:39:33 +0300
Subject: [PATCH 41/46] fix facebook channel handle.

---
 youtube_dl/extractor/facebook.py | 14 +++++++++++---
 1 file changed, 11 insertions(+), 3 deletions(-)

diff --git a/youtube_dl/extractor/facebook.py b/youtube_dl/extractor/facebook.py
index 802547337..a85005caa 100644
--- a/youtube_dl/extractor/facebook.py
+++ b/youtube_dl/extractor/facebook.py
@@ -482,9 +482,7 @@ class FacebookIE(InfoExtractor):
         shares_count = parse_count(self._extract_shares(webpage, tahoe_data))
         comment_count = parse_count(self._extract_comments_count(webpage, tahoe_data))
 
-        uploader_handle = self._search_regex(r'"video_path":"\\\/([^\/]+)\\\/', tahoe_data.primary, 'uploader_handle', fatal=False)
-        if uploader_handle:
-            uploader_handle = uploader_handle.lower()
+        uploader_handle = self._resolve_uploader_handle(tahoe_data, uploader_id)
         info_dict = {
             'id': video_id,
             'title': video_title,
@@ -512,6 +510,16 @@ class FacebookIE(InfoExtractor):
 
         return webpage, info_dict
 
+    def _resolve_uploader_handle(self, tahoe_data, uploader_id):
+        uploader_handle = self._search_regex(r'"video_path":"\\\/([^\/]+)\\\/', tahoe_data.primary, 'uploader_handle',
+                                             fatal=False)
+        if uploader_handle == uploader_id:
+            uploader_handle = self._search_regex(r'href=\\"https:\\\/\\\/www.facebook.com\\\/(.+?)\\\/\\', tahoe_data.secondary,
+                                               'uploader_handle',
+                                                 fatal=False)
+
+        return uploader_handle
+
     def _extract_meta_count(self, fields, webpage, tahoe_data, name, ):
         value = None
 

From 50c7aa32a5f567eeded3b87f285cfe0af6f5697f Mon Sep 17 00:00:00 2001
From: hashark <18191362+hashark@users.noreply.github.com>
Date: Sun, 12 Apr 2020 16:42:29 +0300
Subject: [PATCH 42/46] added Hodaya as a reviewer

---
 .github/pull.yml | 1 +
 1 file changed, 1 insertion(+)

diff --git a/.github/pull.yml b/.github/pull.yml
index cb259a99c..b3a5dbf88 100644
--- a/.github/pull.yml
+++ b/.github/pull.yml
@@ -6,3 +6,4 @@ rules:
     reviewers:
       - aviperes
       - hashark
+      - hodayabu

From 9a6068fdf3ab4652204a9e3edfd325203b710a9b Mon Sep 17 00:00:00 2001
From: Avi Peretz <pavi@videocites.com>
Date: Tue, 14 Apr 2020 11:33:21 +0300
Subject: [PATCH 43/46] add processing error handling.

---
 youtube_dl/extractor/odnoklassniki.py | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/youtube_dl/extractor/odnoklassniki.py b/youtube_dl/extractor/odnoklassniki.py
index 4b46117a7..2c8cc7c59 100644
--- a/youtube_dl/extractor/odnoklassniki.py
+++ b/youtube_dl/extractor/odnoklassniki.py
@@ -184,6 +184,9 @@ class OdnoklassnikiIE(InfoExtractor):
 
         movie = metadata['movie']
 
+        if movie.get('status') == 'PROCESSING':
+            raise ExtractorError('Video is still processing', video_id=video_id)
+
         # Some embedded videos may not contain title in movie dict (e.g.
         # http://ok.ru/video/62036049272859-0) thus we allow missing title
         # here and it's going to be extracted later by an extractor that

From 469c1dc4e3575203d388c6317b1b528bc1b9ba6c Mon Sep 17 00:00:00 2001
From: hodayabu <bhodaya@videocites.com>
Date: Mon, 20 Apr 2020 13:40:18 +0300
Subject: [PATCH 44/46] tiktok youtube-dl

---
 test/ci/test_tiktok.py         | 15 ++++++++
 youtube_dl/extractor/tiktok.py | 63 ++++++++++++++++++++++++++++++----
 2 files changed, 71 insertions(+), 7 deletions(-)
 create mode 100644 test/ci/test_tiktok.py

diff --git a/test/ci/test_tiktok.py b/test/ci/test_tiktok.py
new file mode 100644
index 000000000..130097688
--- /dev/null
+++ b/test/ci/test_tiktok.py
@@ -0,0 +1,15 @@
+import unittest
+import youtube_dl
+
+
+class MyTestCase(unittest.TestCase):
+    def test_something(self):
+        url = 'https://www.tiktok.com/@danieltbraun/video/6817099671043853574'
+        params = {}
+        ydl = youtube_dl.YoutubeDL(params)
+        info = ydl.extract_info(url, download=False)
+        self.assertEquals(info['title'], "She got a face full of DUSTBIN #foryou")
+
+
+if __name__ == '__main__':
+    unittest.main()
diff --git a/youtube_dl/extractor/tiktok.py b/youtube_dl/extractor/tiktok.py
index 66088b9ab..24ed25557 100644
--- a/youtube_dl/extractor/tiktok.py
+++ b/youtube_dl/extractor/tiktok.py
@@ -1,6 +1,10 @@
 # coding: utf-8
 from __future__ import unicode_literals
 
+from newspaper import Article
+from bs4 import BeautifulSoup
+import requests
+import json
 from .common import InfoExtractor
 from ..utils import (
     compat_str,
@@ -69,7 +73,8 @@ class TikTokIE(TikTokBaseIE):
                         https?://
                             (?:
                                 (?:m\.)?tiktok\.com/v|
-                                (?:www\.)?tiktok\.com/share/video
+                                (?:www\.)?tiktok\.com/share/video|
+                                (?:www\.|)tiktok\.com\/@(?:.*?)\/video
                             )
                             /(?P<id>\d+)
                     '''
@@ -94,12 +99,56 @@ class TikTokIE(TikTokBaseIE):
     }]
 
     def _real_extract(self, url):
-        video_id = self._match_id(url)
-        webpage = self._download_webpage(
-            'https://m.tiktok.com/v/%s.html' % video_id, video_id)
-        data = self._parse_json(self._search_regex(
-            r'\bdata\s*=\s*({.+?})\s*;', webpage, 'data'), video_id)
-        return self._extract_aweme(data)
+        #extract meta data using the official api
+        res = requests.get('https://www.tiktok.com/oembed?url='+url)
+        #json contains: provider url, titile, html, author_namee, height, thumbnail_width, width, version,
+        #author_url, thumbnail_height, thumbnail_url, type, provider_name (tiktok)
+        json= res.json()
+
+        #extract metadata with beautifulSoup
+        #class - jsx-1038045583 jsx-3192540912 jsx-2150087249 video-meta-count conatins likes and comments
+        result = requests.get(url)
+        src = result.content
+        soup = BeautifulSoup(result.text, 'html.parser')
+
+        meta_data= soup.find_all("div",{ "class": "jsx-1715470091.desktop-container"})
+        print (meta_data)
+
+        #
+        #
+        # video_id = self._match_id(url)
+        # webpage = self._download_webpage(url, video_id)
+        # s_rejex=self._search_regex(r'\bdata\s*=\s*({.+?})\s*;', webpage, 'data')
+        # data = self._parse_json(s_rejex, video_id)
+        # #return self.info_dict()
+        #return self._extract_aweme(data)
+        return None
+
+    # def info_dict(self,video_id,video_title,formats,uploader, timestamp, thumbnail, view_count, uploader_id, is_live, live_status
+    #               , likes_count, shares_count, subtitles, comment_count, ):
+    #     info_dict = {
+    #         'id': video_id,
+    #         'title': video_title,
+    #         'formats': formats,
+    #         'uploader': uploader,
+    #         'timestamp': timestamp,
+    #         'thumbnail': thumbnail,
+    #         'view_count': view_count,
+    #         'uploader_id': uploader_id,
+    #         'is_live': is_live,
+    #         'live_status': live_status,
+    #         'like_count': likes_count,
+    #         'share_count': shares_count,
+    #         'subtitles': subtitles,
+    #         'comment_count': comment_count,
+    #         'other_posts_view_count': other_posts_view_count,
+    #         'uploader_handle': uploader_handle,
+    #         '_internal_data': {
+    #             'page': webpage,
+    #             'api_response_list': [tahoe_data.primary, tahoe_data.secondary]
+    #         }
+    #     }
+    #     return info_dict
 
 
 class TikTokUserIE(TikTokBaseIE):

From 82381d8dd4bd97e51aef2cda2c05b0ed684dbd7e Mon Sep 17 00:00:00 2001
From: hodayabu <bhodaya@videocites.com>
Date: Mon, 20 Apr 2020 15:27:31 +0300
Subject: [PATCH 45/46] tiktok youtube-dl

---
 test/ci/test_tiktok.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/test/ci/test_tiktok.py b/test/ci/test_tiktok.py
index 130097688..7d2f87047 100644
--- a/test/ci/test_tiktok.py
+++ b/test/ci/test_tiktok.py
@@ -2,8 +2,8 @@ import unittest
 import youtube_dl
 
 
-class MyTestCase(unittest.TestCase):
-    def test_something(self):
+class TikTokTestYoutubeDl(unittest.TestCase):
+    def test_meta_data(self):
         url = 'https://www.tiktok.com/@danieltbraun/video/6817099671043853574'
         params = {}
         ydl = youtube_dl.YoutubeDL(params)

From 817be403ebd45c8f20049b00a4f414a17f1270f1 Mon Sep 17 00:00:00 2001
From: hodayabu <bhodaya@videocites.com>
Date: Mon, 20 Apr 2020 20:54:18 +0300
Subject: [PATCH 46/46] tiktok extractor

---
 test/ci/__init__.py            |   0
 test/ci/test_tiktok.py         |   3 +-
 youtube_dl/extractor/tiktok.py | 125 +++++++++++++++++++--------------
 3 files changed, 75 insertions(+), 53 deletions(-)
 create mode 100644 test/ci/__init__.py

diff --git a/test/ci/__init__.py b/test/ci/__init__.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/test/ci/test_tiktok.py b/test/ci/test_tiktok.py
index 7d2f87047..7f0294c2a 100644
--- a/test/ci/test_tiktok.py
+++ b/test/ci/test_tiktok.py
@@ -8,7 +8,8 @@ class TikTokTestYoutubeDl(unittest.TestCase):
         params = {}
         ydl = youtube_dl.YoutubeDL(params)
         info = ydl.extract_info(url, download=False)
-        self.assertEquals(info['title'], "She got a face full of DUSTBIN #foryou")
+        # NOTE(review): share_count is live data, so this exact value may drift.
+        self.assertEqual(info['share_count'], 110)
 
 
 if __name__ == '__main__':
diff --git a/youtube_dl/extractor/tiktok.py b/youtube_dl/extractor/tiktok.py
index 24ed25557..140db07bc 100644
--- a/youtube_dl/extractor/tiktok.py
+++ b/youtube_dl/extractor/tiktok.py
@@ -1,7 +1,6 @@
 # coding: utf-8
 from __future__ import unicode_literals
-
-from newspaper import Article
+import ast
 from bs4 import BeautifulSoup
 import requests
 import json
@@ -16,6 +15,9 @@ from ..utils import (
 )
 
 
+# TODO: add bs4 and requests to requirements.txt (newspaper is no longer imported here)
+
+
 class TikTokBaseIE(InfoExtractor):
     def _extract_aweme(self, data):
         video = data['video']
@@ -68,6 +70,8 @@ class TikTokBaseIE(InfoExtractor):
         }
 
 
+
+
 class TikTokIE(TikTokBaseIE):
     _VALID_URL = r'''(?x)
                         https?://
@@ -99,57 +103,74 @@ class TikTokIE(TikTokBaseIE):
     }]
 
     def _real_extract(self, url):
-        #extract meta data using the official api
-        res = requests.get('https://www.tiktok.com/oembed?url='+url)
-        #json contains: provider url, titile, html, author_namee, height, thumbnail_width, width, version,
-        #author_url, thumbnail_height, thumbnail_url, type, provider_name (tiktok)
-        json= res.json()
-
-        #extract metadata with beautifulSoup
-        #class - jsx-1038045583 jsx-3192540912 jsx-2150087249 video-meta-count conatins likes and comments
-        result = requests.get(url)
-        src = result.content
-        soup = BeautifulSoup(result.text, 'html.parser')
-
-        meta_data= soup.find_all("div",{ "class": "jsx-1715470091.desktop-container"})
-        print (meta_data)
-
-        #
-        #
-        # video_id = self._match_id(url)
-        # webpage = self._download_webpage(url, video_id)
-        # s_rejex=self._search_regex(r'\bdata\s*=\s*({.+?})\s*;', webpage, 'data')
-        # data = self._parse_json(s_rejex, video_id)
-        # #return self.info_dict()
-        #return self._extract_aweme(data)
-        return None
-
-    # def info_dict(self,video_id,video_title,formats,uploader, timestamp, thumbnail, view_count, uploader_id, is_live, live_status
-    #               , likes_count, shares_count, subtitles, comment_count, ):
-    #     info_dict = {
-    #         'id': video_id,
-    #         'title': video_title,
-    #         'formats': formats,
-    #         'uploader': uploader,
-    #         'timestamp': timestamp,
-    #         'thumbnail': thumbnail,
-    #         'view_count': view_count,
-    #         'uploader_id': uploader_id,
-    #         'is_live': is_live,
-    #         'live_status': live_status,
-    #         'like_count': likes_count,
-    #         'share_count': shares_count,
-    #         'subtitles': subtitles,
-    #         'comment_count': comment_count,
-    #         'other_posts_view_count': other_posts_view_count,
-    #         'uploader_handle': uploader_handle,
-    #         '_internal_data': {
-    #             'page': webpage,
-    #             'api_response_list': [tahoe_data.primary, tahoe_data.secondary]
-    #         }
-    #     }
-    #     return info_dict
+        """Extract metadata for a single TikTok video page.
+
+        Combines the oEmbed API response (title, author, thumbnail) with
+        counters scraped from the page HTML and its __NEXT_DATA__ JSON.
+        """
+        # Use the id captured by _VALID_URL rather than the last path segment.
+        video_id = self._match_id(url)
+
+        json_api = self._download_json(
+            'https://www.tiktok.com/oembed?url=' + url, video_id)
+
+        webpage = self._download_webpage(url, video_id)
+        soup = BeautifulSoup(webpage, features="html.parser")
+        h2 = soup.find_all("h2", {"class": "jsx-1038045583 jsx-3192540912 jsx-2150087249 video-meta-count"})
+        # Token 0 is used as the like count and token 3 as the comment count.
+        data = h2[0].text.split(' ')
+        likes_count = self.numeric_convert(data[0])
+        comments_count = self.numeric_convert(data[3])
+
+        # The script body is already JSON text; parse it directly, because
+        # json.dumps() rejects the encoded bytes on Python 3.
+        props = soup.find(id='__NEXT_DATA__').contents[0]
+        item_infos = json.loads(props)['props']['pageProps']['videoData']['itemInfos']
+        timestamp = self.numeric_convert(item_infos['createTime'])
+
+        # TODO: extract real media formats; 'url' is currently the page URL.
+        return self.info_dict(
+            video_id, str(url), json_api['title'], json_api['author_name'],
+            timestamp, json_api['thumbnail_url'], item_infos['playCount'],
+            item_infos['authorId'], False, 'not_live', likes_count,
+            item_infos['shareCount'], '', comments_count,
+            item_infos['video']['videoMeta']['duration'])
+
+    def numeric_convert(self, unicode):
+        """Convert a counter string such as '950', '1.5K' or '2M' to an int.
+
+        The 'K'/'M' suffix is assumed to be the last character of the text.
+        """
+        if 'K' in unicode:
+            return int(float(unicode[:-1]) * 1000)
+        if 'M' in unicode:
+            # One million; the earlier factor of 100000 was off by ten.
+            return int(float(unicode[:-1]) * 1000000)
+        return int(unicode)
+
+    def info_dict(self, video_id, url, video_title,
+                  uploader, timestamp, thumbnail,
+                  view_count, uploader_id, is_live, live_status,
+                  likes_count, shares_count, subtitles, comment_count, duration):
+        """Assemble the result dictionary returned by _real_extract."""
+        return {
+            'id': video_id,
+            'url': url,
+            'title': video_title,
+            'uploader': uploader,
+            'timestamp': timestamp,
+            'thumbnail': thumbnail,
+            'view_count': view_count,
+            'uploader_id': uploader_id,
+            'is_live': is_live,
+            'live_status': live_status,
+            'like_count': likes_count,
+            'share_count': shares_count,
+            'subtitles': subtitles,
+            'comment_count': comment_count,
+            'duration': duration,
+        }
 
 
 class TikTokUserIE(TikTokBaseIE):
     _VALID_URL = r'''(?x)