From 28445dbfbfb28f86f5b92eff3134e7ce0a16a957 Mon Sep 17 00:00:00 2001 From: ajnar Date: Mon, 10 Jun 2024 20:59:18 -0300 Subject: [PATCH] [MercadoLibre] Add extractor --- yt_dlp/extractor/_extractors.py | 1 + yt_dlp/extractor/mercadolibre.py | 113 +++++++++++++++++++++++++++++++ 2 files changed, 114 insertions(+) create mode 100644 yt_dlp/extractor/mercadolibre.py diff --git a/yt_dlp/extractor/_extractors.py b/yt_dlp/extractor/_extractors.py index e9cd38a651..5b849aac11 100644 --- a/yt_dlp/extractor/_extractors.py +++ b/yt_dlp/extractor/_extractors.py @@ -1111,6 +1111,7 @@ ) from .meipai import MeipaiIE from .melonvod import MelonVODIE +from .mercadolibre import MercadoLibreIE from .metacritic import MetacriticIE from .mgtv import MGTVIE from .microsoftembed import MicrosoftEmbedIE diff --git a/yt_dlp/extractor/mercadolibre.py b/yt_dlp/extractor/mercadolibre.py new file mode 100644 index 0000000000..4a43b8b45a --- /dev/null +++ b/yt_dlp/extractor/mercadolibre.py @@ -0,0 +1,113 @@ +from .common import InfoExtractor +from ..utils import ExtractorError, traverse_obj + + +class MercadoLibreIE(InfoExtractor): + + _VALID_URL = r'https?://(?:www\.|.*\.)?mercadolibre\.com\.ar/*.*/(?PMLA-?[0-9]+)' + + _TESTS = [ + { + 'url': 'https://articulo.mercadolibre.com.ar/MLA-780443524-pool-profesional-mesa-de-ping-pong-comedor-accesorios-_JM#position=5&search_layout=stack&type=item&tracking_id=b9180504-37fc-4829-adff-4320ac49464c', + 'info_dict': { + 'id': 'MLA-780443524', + 'title': 'Pool Profesional + Mesa De Ping Pong + Comedor + Accesorios', + 'price': '651.999' + }, + 'playlist': [{ + 'info_dict': { + 'id': 'iUvfyU', + 'ext': 'mp4', + 'formats': 'mincount:2', + 'duration': 49.08, + 'title': 'Pool Profesional + Mesa De Ping Pong + Comedor + Accesorios', + 'view_count': int + } + } + ], + 'params': { + 'skip_download': True, + } + }, + { + 'url': 'https://www.mercadolibre.com.ar/motorola-moto-e22-64gb-azul-4gb-ram/p/MLA25665291?pdp_filters=seller_id%3A225480741#reco_item_pos=20&reco_backend=machinalis-seller-items-pdp&reco_backend_type=low_level&reco_client=vip-seller_items-above&reco_id=08cf53bc-f759-4c39-9253-ae21f5d75ae9', + 'info_dict': { + 'id': 'MLA25665291', + 'title': 'Motorola Moto E22 64GB Azul 4GB RAM', + 'price': '399.999', + }, + 'playlist': [{ + 'info_dict': { + 'id': 'gO27T5', + 'ext': 'mp4', + 'formats': 'mincount:4', + 'duration': 56.21, + 'title': 'Motorola Moto E22 64GB Azul 4GB RAM', + 'view_count': int, + } + } + ], + 'params': { + 'skip_download': True, + } + }, + { + 'url': 'https://www.mercadolibre.com.ar/sony-playstation-5-825gb-digital-edition-color-blanco-y-negro-2020/p/MLA16253015', + 'info_dict': { + 'id': 'MLA16253015', + 'title': 'Sony PlayStation 5 825GB Digital Edition color blanco y negro 2020', + 'price': '1.779.999', + }, + 'playlist_mincount': 2, + 'params': { + 'skip_download': True, + } + }, + ] + + def _real_initialize(self): + self._request_webpage('https://www.mercadolibre.com.ar/', None, 'Setting up session') + + def _real_extract(self, url): + + display_id = self._match_id(url) + + webpage = self._download_webpage(url, display_id) + + title = self._search_regex(r'

(.*?)

', webpage, 'title', fatal=True) + price = self._search_regex(r'', webpage, 'precio', fatal=True) + + data = self._search_json( + r'window\.__PRELOADED_STATE__\s*=', webpage, 'json data', display_id) + + shorts = traverse_obj(data, ( + 'initialState', 'components', 'gallery', 'clips', 'shorts')) + + if len(shorts) == 0: + raise ExtractorError('No videos found at the site') + + entries = [] + for short in shorts: + video_id = short['id'] + video_url = short['video_url'] + + formats = self._extract_m3u8_formats(video_url, video_id) + + entry = { + 'id': video_id, + 'title': title, + 'duration': short['video_duration'], + 'view_count': short['views'], + 'formats': formats + } + entries.append(entry) + + response = { + '_type': 'playlist', + 'id': display_id, + 'title': title, + 'price': price, + 'entries': entries, + } + + return response