From e28e135d6fd6a430fed3e20dfe1a8c8bbc5f9185 Mon Sep 17 00:00:00 2001
From: marcdumais <420612+marcdumais@users.noreply.github.com>
Date: Sun, 25 Feb 2024 18:21:08 -0500
Subject: [PATCH] [ie/altcensored:channel] Fix playlist extraction (#9297)
Authored by: marcdumais
---
yt_dlp/extractor/altcensored.py | 17 ++++++++++++-----
1 file changed, 12 insertions(+), 5 deletions(-)
diff --git a/yt_dlp/extractor/altcensored.py b/yt_dlp/extractor/altcensored.py
index 0e1627bfd1..a8428ce2ed 100644
--- a/yt_dlp/extractor/altcensored.py
+++ b/yt_dlp/extractor/altcensored.py
@@ -22,7 +22,7 @@ class AltCensoredIE(InfoExtractor):
'title': "QUELLES SONT LES CONSÉQUENCES DE L'HYPERSEXUALISATION DE LA SOCIÉTÉ ?",
'display_id': 'k0srjLSkga8.webm',
'release_date': '20180403',
- 'creator': 'Virginie Vota',
+ 'creators': ['Virginie Vota'],
'release_year': 2018,
'upload_date': '20230318',
'uploader': 'admin@altcensored.com',
@@ -32,7 +32,7 @@ class AltCensoredIE(InfoExtractor):
'duration': 926.09,
'thumbnail': 'https://archive.org/download/youtube-k0srjLSkga8/youtube-k0srjLSkga8.thumbs/k0srjLSkga8_000925.jpg',
'view_count': int,
- 'categories': ['News & Politics'],
+ 'categories': ['News & Politics'], # FIXME
}
}]
@@ -62,14 +62,21 @@ class AltCensoredChannelIE(InfoExtractor):
'title': 'Virginie Vota',
'id': 'UCFPTO55xxHqFqkzRZHu4kcw',
},
- 'playlist_count': 91
+ 'playlist_count': 85,
}, {
'url': 'https://altcensored.com/channel/UC9CcJ96HKMWn0LZlcxlpFTw',
'info_dict': {
'title': 'yukikaze775',
'id': 'UC9CcJ96HKMWn0LZlcxlpFTw',
},
- 'playlist_count': 4
+ 'playlist_count': 4,
+ }, {
+ 'url': 'https://altcensored.com/channel/UCfYbb7nga6-icsFWWgS-kWw',
+ 'info_dict': {
+ 'title': 'Mister Metokur',
+ 'id': 'UCfYbb7nga6-icsFWWgS-kWw',
+ },
+ 'playlist_count': 121,
}]
def _real_extract(self, url):
@@ -78,7 +85,7 @@ class AltCensoredChannelIE(InfoExtractor):
url, channel_id, 'Download channel webpage', 'Unable to get channel webpage')
title = self._html_search_meta('altcen_title', webpage, 'title', fatal=False)
page_count = int_or_none(self._html_search_regex(
- r'<a[^>]+href="/channel/\w+/page/(\d+)">(?:\1)</a>',
+ r'<a[^>]+href="/channel/[\w-]+/page/(\d+)">(?:\1)</a>',
webpage, 'page count', default='1'))
def page_func(page_num):