# youtube-dl/youtube_dl/extractor/neteasemusic.py

# coding: utf-8
from __future__ import unicode_literals

from base64 import b64encode
from binascii import hexlify
from datetime import datetime
from hashlib import md5
from random import randint
import json
import re
import time

from .common import InfoExtractor
from ..aes import aes_ecb_encrypt, pkcs7_padding
from ..compat import (
    compat_urllib_parse_urlencode,
    compat_str,
    compat_itertools_count,
)
from ..utils import (
    ExtractorError,
    bytes_to_intlist,
    error_to_compat_str,
    float_or_none,
    int_or_none,
    intlist_to_bytes,
    sanitized_Request,
    std_headers,
    try_get,
)


class NetEaseMusicBaseIE(InfoExtractor):
    """Helpers shared by the music.163.com extractors.

    Covers request signing for the player API, building the format list
    for a song-info dict, and a thin wrapper around the plain JSON API.
    """

    # Keys of a song-info dict that extract_formats() probes for details
    _FORMATS = ['bMusic', 'mMusic', 'hMusic']
    _NETEASE_SALT = '3go8&$8*3*3h0k(2)2'
    _API_BASE = 'http://music.163.com/api/'

    @classmethod
    def _encrypt(cls, dfsid):
        """Return the salted, URL-safe base64 MD5 digest of ``dfsid``.

        The ASCII form of ``dfsid`` is XORed byte by byte with the
        repeating salt, hashed with MD5 and base64-encoded; ``/`` and
        ``+`` are then replaced by ``_`` and ``-``.
        """
        salt_bytes = bytearray(cls._NETEASE_SALT.encode('utf-8'))
        salt_len = len(salt_bytes)
        mixed = bytearray(
            byte ^ salt_bytes[i % salt_len]
            for i, byte in enumerate(
                bytearray(compat_str(dfsid).encode('ascii'))))
        digest = md5(bytes(mixed)).digest()
        result = b64encode(digest).decode('ascii')
        return result.replace('/', '_').replace('+', '-')

    @classmethod
    def make_player_api_request_data_and_headers(cls, song_id, bitrate):
        """Build the encrypted POST body and headers for the player API.

        The JSON request text is joined with the API path and an MD5
        digest, PKCS#7 padded, AES-ECB encrypted with a fixed key and
        rendered as upper-case hex.

        Returns a ``(data, headers)`` tuple: ``data`` is the text
        ``params=<HEX>`` and ``headers`` is a dict of request headers.
        """
        KEY = b'e82ckenh8dichen8'
        URL = '/api/song/enhance/player/url'
        now = int(time.time() * 1000)
        rand = randint(0, 1000)
        cookie = {
            'osver': None,
            'deviceId': None,
            'appver': '8.0.0',
            'versioncode': '140',
            'mobilename': None,
            'buildver': '1623435496',
            'resolution': '1920x1080',
            '__csrf': '',
            'os': 'pc',
            'channel': None,
            'requestId': '{0}_{1:04}'.format(now, rand),
        }
        request_text = json.dumps(
            {'ids': '[{0}]'.format(song_id), 'br': bitrate, 'header': cookie},
            separators=(',', ':'))
        message = 'nobody{0}use{1}md5forencrypt'.format(
            URL, request_text).encode('latin1')
        msg_digest = md5(message).hexdigest()

        payload = '{0}-36cd479b6b5-{1}-36cd479b6b5-{2}'.format(
            URL, request_text, msg_digest)
        padded = pkcs7_padding(bytes_to_intlist(payload))
        encrypted = intlist_to_bytes(
            aes_ecb_encrypt(padded, bytes_to_intlist(KEY)))
        encrypted_params = hexlify(encrypted).decode('ascii').upper()

        # The same fields are also sent as a Cookie header; unset values
        # are spelled 'undefined'
        cookie_header = '; '.join(
            '{0}={1}'.format(k, v if v is not None else 'undefined')
            for k, v in cookie.items())

        headers = {
            'User-Agent': std_headers['User-Agent'],
            'Content-Type': 'application/x-www-form-urlencoded',
            'Referer': 'https://music.163.com',
            'Cookie': cookie_header,
        }
        return ('params={0}'.format(encrypted_params), headers)

    def _call_player_api(self, song_id, bitrate):
        """Query the player API for ``song_id`` at ``bitrate``.

        Returns the decoded JSON result. If the call fails or yields an
        empty result, a warning is reported and ``{}`` is returned.

        Raises ExtractorError when its cause is a ValueError or TypeError
        (i.e. the response could not be parsed as JSON).
        """
        url = 'https://interface3.music.163.com/eapi/song/enhance/player/url'
        data, headers = self.make_player_api_request_data_and_headers(song_id, bitrate)
        msg = 'empty result'
        try:
            result = self._download_json(
                url, song_id, data=data.encode('ascii'), headers=headers)
            if result:
                return result
        except ExtractorError as e:
            # isinstance() rather than an exact type match, so that
            # ValueError subclasses such as json.JSONDecodeError count too
            if isinstance(e.cause, (ValueError, TypeError)):
                # JSON load failure
                raise
            msg = error_to_compat_str(e)
        except Exception as e:
            msg = error_to_compat_str(e)
        # Reached for an empty result as well as for any swallowed error
        self.report_warning('%s API call (%s) failed: %s' % (
            song_id, bitrate, msg))
        return {}

    def extract_formats(self, info):
        """Return the list of downloadable formats for a song-info dict.

        For every quality key in ``_FORMATS`` present in ``info`` the
        player API is queried and each returned URL that passes
        ``_is_valid_url`` becomes a format entry.

        Raises ExtractorError (expected) when no format was found and the
        site reported a code outside 200-399; otherwise a geo restriction
        is reported through ``raise_geo_restricted``.
        """
        err = 0
        formats = []
        song_id = info['id']
        for song_format in self._FORMATS:
            details = info.get(song_format)
            if not details:
                continue

            bitrate = int_or_none(details.get('bitrate')) or 999000
            data = self._call_player_api(song_id, bitrate)
            for song in try_get(data, lambda x: x['data'], list) or []:
                song_url = try_get(song, lambda x: x['url'])
                if not song_url:
                    continue
                if self._is_valid_url(song_url, song_id, 'song'):
                    formats.append({
                        'url': song_url,
                        'ext': details.get('extension'),
                        'abr': float_or_none(song.get('br'), scale=1000),
                        'format_id': song_format,
                        'filesize': int_or_none(song.get('size')),
                        'asr': int_or_none(details.get('sr')),
                    })
                elif err == 0:
                    # Keep the first site code seen; a missing or non-int
                    # code must stay 0 so the comparisons below are safe
                    err = try_get(song, lambda x: x['code'], int) or 0

        if not formats:
            msg = 'No media links found'
            if err != 0 and (err < 200 or err >= 400):
                raise ExtractorError(
                    '%s (site code %d)' % (msg, err, ), expected=True)
            else:
                self.raise_geo_restricted(
                    msg + ': probably this video is not available from your location due to geo restriction.',
                    countries=['CN'])

        return formats

    @classmethod
    def convert_milliseconds(cls, ms):
        """Convert milliseconds to whole seconds, rounded to nearest.

        ``None`` is passed through unchanged so that optional API fields
        can be converted without a separate check.
        """
        if ms is None:
            return None
        return int(round(ms / 1000.0))

    def query_api(self, endpoint, video_id, note):
        """Fetch ``endpoint`` below ``_API_BASE`` and return the decoded JSON.

        The request carries ``_API_BASE`` as its Referer header.
        """
        req = sanitized_Request('%s%s' % (self._API_BASE, endpoint))
        req.add_header('Referer', self._API_BASE)
        return self._download_json(req, video_id, note)


class NetEaseMusicIE(NetEaseMusicBaseIE):
    """Extractor for a single song on music.163.com."""
    IE_NAME = 'netease:song'
    IE_DESC = '网易云音乐'
    _VALID_URL = r'https?://(y\.)?music\.163\.com/(?:[#m]/)?song\?.*?\bid=(?P<id>[0-9]+)'
    _TESTS = [{
        'url': 'http://music.163.com/#/song?id=32102397',
        'md5': '3e909614ce09b1ccef4a3eb205441190',
        'info_dict': {
            'id': '32102397',
            'ext': 'mp3',
            'title': 'Bad Blood',
            'creator': 'Taylor Swift / Kendrick Lamar',
            'upload_date': '20150516',
            'timestamp': 1431792000,
            'description': 'md5:25fc5f27e47aad975aa6d36382c7833c',
        },
    }, {
        'note': 'No lyrics.',
        'url': 'http://music.163.com/song?id=17241424',
        'info_dict': {
            'id': '17241424',
            'ext': 'mp3',
            'title': 'Opus 28',
            'creator': 'Dustin O\'Halloran',
            'upload_date': '20080211',
            'description': 'md5:f12945b0f6e0365e3b73c5032e1b0ff4',
            'timestamp': 1202745600,
        },
    }, {
        'note': 'Has translated name.',
        'url': 'http://music.163.com/#/song?id=22735043',
        'info_dict': {
            'id': '22735043',
            'ext': 'mp3',
            'title': '소원을 말해봐 (Genie)',
            'creator': '少女时代',
            'description': 'md5:79d99cc560e4ca97e0c4d86800ee4184',
            'upload_date': '20100127',
            'timestamp': 1264608000,
            'alt_title': '说出愿望吧(Genie)',
        },
    }, {
        'url': 'https://y.music.163.com/m/song?app_version=8.8.45&id=95670&uct2=sKnvS4+0YStsWkqsPhFijw%3D%3D&dlt=0846',
        'md5': '95826c73ea50b1c288b22180ec9e754d',
        'info_dict': {
            'id': '95670',
            'ext': 'mp3',
            'title': '国际歌',
            'creator': '马备',
            'upload_date': '19911130',
            'timestamp': 691516800,
            'description': 'md5:1ba2f911a2b0aa398479f595224f2141',
        },
    }]

    def _process_lyrics(self, lyrics_info):
        """Merge original and translated lyrics into one text.

        Reads ``lrc.lyric`` (original) and ``tlyric.lyric`` (translation)
        from ``lyrics_info``. When either is missing the original is
        returned as is (possibly ``None``). Otherwise every timestamped
        line of the original is emitted as
        ``<timestamp><text> / <translation>``, with an empty translation
        where no line with the same timestamp exists.
        """
        # 'or {}' also covers keys that are present but null
        original = (lyrics_info.get('lrc') or {}).get('lyric')
        translated = (lyrics_info.get('tlyric') or {}).get('lyric')

        # Merging needs both texts; re.findall() would fail on None
        if not original or not translated:
            return original

        lyrics_expr = r'(\[[0-9]{2}:[0-9]{2}\.[0-9]{2,}\])([^\n]+)'
        original_ts_texts = re.findall(lyrics_expr, original)
        # Each match is a (timestamp, text) pair
        translation_ts_dict = dict(re.findall(lyrics_expr, translated))
        return '\n'.join(
            '%s%s / %s' % (time_stamp, text, translation_ts_dict.get(time_stamp, ''))
            for time_stamp, text in original_ts_texts)

    def _real_extract(self, url):
        """Return the info dict for the song addressed by ``url``."""
        song_id = self._match_id(url)

        params = {
            'id': song_id,
            'ids': '[%s]' % song_id
        }
        info = self.query_api(
            'song/detail?' + compat_urllib_parse_urlencode(params),
            song_id, 'Downloading song info')['songs'][0]

        formats = self.extract_formats(info)
        self._sort_formats(formats)

        lyrics_info = self.query_api(
            'song/lyric?id=%s&lv=-1&tv=-1' % song_id,
            song_id, 'Downloading lyrics data')
        lyrics = self._process_lyrics(lyrics_info)

        alt_title = None
        if info.get('transNames'):
            alt_title = '/'.join(info.get('transNames'))

        album = info.get('album') or {}
        # publishTime is optional; only convert it when it is present
        publish_time = album.get('publishTime')
        timestamp = None
        if publish_time is not None:
            timestamp = self.convert_milliseconds(publish_time)

        return {
            'id': song_id,
            'title': info['name'],
            'alt_title': alt_title,
            'creator': ' / '.join([artist['name'] for artist in info.get('artists') or []]),
            'timestamp': timestamp,
            'thumbnail': album.get('picUrl'),
            'duration': self.convert_milliseconds(info.get('duration') or 0),
            'description': lyrics,
            'formats': formats,
        }


class NetEaseMusicAlbumIE(NetEaseMusicBaseIE):
    """Extractor that turns a music.163.com album into a playlist."""
    IE_NAME = 'netease:album'
    IE_DESC = '网易云音乐 - 专辑'
    _VALID_URL = r'https?://music\.163\.com/(#/)?album\?id=(?P<id>[0-9]+)'
    _TEST = {
        'url': 'http://music.163.com/#/album?id=220780',
        'info_dict': {
            'id': '220780',
            'title': 'B\'day',
        },
        'playlist_count': 23,
        'skip': 'Blocked outside Mainland China',
    }

    def _real_extract(self, url):
        """Return a playlist result with one song entry per album track."""
        album_id = self._match_id(url)

        api_path = 'album/%s?id=%s' % (album_id, album_id)
        album = self.query_api(
            api_path, album_id, 'Downloading album data')['album']

        title = album['name']
        description = album.get('description')

        # Each track is delegated to the single-song extractor
        entries = []
        for track in album['songs']:
            entries.append(self.url_result(
                'http://music.163.com/#/song?id=%s' % track['id'],
                'NetEaseMusic', track['id']))

        return self.playlist_result(entries, album_id, title, description)


class NetEaseMusicSingerIE(NetEaseMusicBaseIE):
    """Extractor that lists an artist's hot songs as a playlist."""
    IE_NAME = 'netease:singer'
    IE_DESC = '网易云音乐 - 歌手'
    _VALID_URL = r'https?://music\.163\.com/(#/)?artist\?id=(?P<id>[0-9]+)'
    _TESTS = [{
        'note': 'Singer has aliases.',
        'url': 'http://music.163.com/#/artist?id=10559',
        'info_dict': {
            'id': '10559',
            'title': '张惠妹 - aMEI;阿密特',
        },
        'playlist_count': 50,
        'skip': 'Blocked outside Mainland China',
    }, {
        'note': 'Singer has translated name.',
        'url': 'http://music.163.com/#/artist?id=124098',
        'info_dict': {
            'id': '124098',
            'title': '李昇基 - 이승기',
        },
        'playlist_count': 50,
        'skip': 'Blocked outside Mainland China',
    }]

    def _real_extract(self, url):
        """Return a playlist of the artist's ``hotSongs``.

        The playlist title is the artist name, followed by the translated
        name and the ``;``-joined aliases when those are non-empty.
        """
        singer_id = self._match_id(url)

        api_path = 'artist/%s?id=%s' % (singer_id, singer_id)
        info = self.query_api(api_path, singer_id, 'Downloading singer data')

        artist = info['artist']
        name = artist['name']
        if artist['trans']:
            name = '%s - %s' % (name, artist['trans'])
        if artist['alias']:
            name = '%s - %s' % (name, ';'.join(artist['alias']))

        # Each hot song is delegated to the single-song extractor
        entries = []
        for track in info['hotSongs']:
            entries.append(self.url_result(
                'http://music.163.com/#/song?id=%s' % track['id'],
                'NetEaseMusic', track['id']))

        return self.playlist_result(entries, singer_id, name)


class NetEaseMusicListIE(NetEaseMusicBaseIE):
    """Extractor for music.163.com playlists and toplists."""
    IE_NAME = 'netease:playlist'
    IE_DESC = '网易云音乐 - 歌单'
    _VALID_URL = r'https?://music\.163\.com/(#/)?(playlist|discover/toplist)\?id=(?P<id>[0-9]+)'
    _TESTS = [{
        'url': 'http://music.163.com/#/playlist?id=79177352',
        'info_dict': {
            'id': '79177352',
            'title': 'Billboard 2007 Top 100',
            'description': 'md5:12fd0819cab2965b9583ace0f8b7b022'
        },
        'playlist_count': 99,
        'skip': 'Blocked outside Mainland China',
    }, {
        'note': 'Toplist/Charts sample',
        'url': 'http://music.163.com/#/discover/toplist?id=3733003',
        'info_dict': {
            'id': '3733003',
            'title': 're:韩国Melon排行榜周榜 [0-9]{4}-[0-9]{2}-[0-9]{2}',
            'description': 'md5:73ec782a612711cadc7872d9c1e134fc',
        },
        'playlist_count': 50,
        'skip': 'Blocked outside Mainland China',
    }]

    def _real_extract(self, url):
        """Return a playlist result with one song entry per track.

        For charts/toplists the date of ``updateTime`` (formatted as
        ``YYYY-MM-DD`` by ``datetime.fromtimestamp``) is appended to the
        title.
        """
        list_id = self._match_id(url)

        playlist = self.query_api(
            'playlist/detail?id=%s&lv=-1&tv=-1' % list_id,
            list_id, 'Downloading playlist data')['result']

        title = playlist['name']
        description = playlist.get('description')

        if playlist.get('specialType') == 10:  # is a chart/toplist
            updated = self.convert_milliseconds(playlist['updateTime'])
            datestamp = datetime.fromtimestamp(updated).strftime('%Y-%m-%d')
            title = '%s %s' % (title, datestamp)

        # Each track is delegated to the single-song extractor
        entries = []
        for track in playlist['tracks']:
            entries.append(self.url_result(
                'http://music.163.com/#/song?id=%s' % track['id'],
                'NetEaseMusic', track['id']))

        return self.playlist_result(entries, list_id, title, description)


class NetEaseMusicMvIE(NetEaseMusicBaseIE):
    """Extractor for music videos (MV) on music.163.com."""
    IE_NAME = 'netease:mv'
    IE_DESC = '网易云音乐 - MV'
    _VALID_URL = r'https?://music\.163\.com/(#/)?mv\?id=(?P<id>[0-9]+)'
    _TEST = {
        'url': 'http://music.163.com/#/mv?id=415350',
        'info_dict': {
            'id': '415350',
            'ext': 'mp4',
            'title': '이럴거면 그러지말지',
            'description': '白雅言自作曲唱甜蜜爱情',
            'creator': '白雅言',
            'upload_date': '20150520',
        },
        'skip': 'Blocked outside Mainland China',
    }

    def _real_extract(self, url):
        """Return the info dict for the music video addressed by ``url``."""
        mv_id = self._match_id(url)

        info = self.query_api(
            'mv/detail?id=%s&type=mp4' % mv_id,
            mv_id, 'Downloading mv info')['data']

        # The keys of 'brs' are used as the video height, the values as URLs
        formats = []
        for resolution, mv_url in info['brs'].items():
            formats.append({
                'url': mv_url,
                'ext': 'mp4',
                'format_id': '%sp' % resolution,
                'height': int(resolution),
            })
        self._sort_formats(formats)

        return {
            'id': mv_id,
            'title': info['name'],
            'description': info.get('desc') or info.get('briefDesc'),
            'creator': info['artistName'],
            # Dashes are stripped from publishTime to form the upload date
            'upload_date': info['publishTime'].replace('-', ''),
            'formats': formats,
            'thumbnail': info.get('cover'),
            'duration': self.convert_milliseconds(info.get('duration', 0)),
        }


class NetEaseMusicProgramIE(NetEaseMusicBaseIE):
    """Extractor for radio programs on music.163.com.

    A program yields either its main audio or, when it has accompanying
    songs and --no-playlist is not given, a playlist of the main audio
    followed by those songs.
    """
    IE_NAME = 'netease:program'
    IE_DESC = '网易云音乐 - 电台节目'
    # The '#' or '#/' prefix is optional, as in the sibling extractors;
    # it used to be mandatory, which rejected hash-less program URLs
    _VALID_URL = r'https?://music\.163\.com/(?:#/?)?program\?id=(?P<id>[0-9]+)'
    _TESTS = [{
        'url': 'http://music.163.com/#/program?id=10109055',
        'info_dict': {
            'id': '10109055',
            'ext': 'mp3',
            'title': '不丹足球背后的故事',
            'description': '喜马拉雅人的足球梦 ...',
            'creator': '大话西藏',
            'timestamp': 1434179342,
            'upload_date': '20150613',
            'duration': 900,
        },
        'skip': 'Blocked outside Mainland China',
    }, {
        'note': 'This program has accompanying songs.',
        'url': 'http://music.163.com/#/program?id=10141022',
        'info_dict': {
            'id': '10141022',
            'title': '25岁，你是自在如风的少年<27°C>',
            'description': 'md5:8d594db46cc3e6509107ede70a4aaa3b',
        },
        'playlist_count': 4,
        'skip': 'Blocked outside Mainland China',
    }, {
        'note': 'This program has accompanying songs.',
        'url': 'http://music.163.com/#/program?id=10141022',
        'info_dict': {
            'id': '10141022',
            'ext': 'mp3',
            'title': '25岁，你是自在如风的少年<27°C>',
            'description': 'md5:8d594db46cc3e6509107ede70a4aaa3b',
            'timestamp': 1434450841,
            'upload_date': '20150616',
        },
        'params': {
            'noplaylist': True
        },
        'skip': 'Blocked outside Mainland China',
    }]

    def _real_extract(self, url):
        """Return the program as a single audio or as a playlist.

        The main audio alone is returned when the program has no
        accompanying songs or the ``noplaylist`` option is set; otherwise
        a playlist of song entries (main audio first) is returned.
        """
        program_id = self._match_id(url)

        info = self.query_api(
            'dj/program/detail?id=%s' % program_id,
            program_id, 'Downloading program info')['program']

        name = info['name']
        description = info['description']
        main_song = info['mainSong']
        songs = info['songs']

        if not songs or self._downloader.params.get('noplaylist'):
            if songs:
                # Songs exist, so only --no-playlist brought us here
                self.to_screen(
                    'Downloading just the main audio %s because of --no-playlist'
                    % main_song['id'])

            formats = self.extract_formats(main_song)
            self._sort_formats(formats)

            return {
                'id': program_id,
                'title': name,
                'description': description,
                'creator': info['dj']['brand'],
                'timestamp': self.convert_milliseconds(info['createTime']),
                'thumbnail': info['coverUrl'],
                'duration': self.convert_milliseconds(info.get('duration', 0)),
                'formats': formats,
            }

        self.to_screen(
            'Downloading playlist %s - add --no-playlist to just download the main audio %s'
            % (program_id, main_song['id']))

        # Main audio first, then the accompanying songs in API order
        song_ids = [main_song['id']]
        song_ids.extend(song['id'] for song in songs)
        entries = [
            self.url_result('http://music.163.com/#/song?id=%s' % song_id,
                            'NetEaseMusic', song_id)
            for song_id in song_ids
        ]
        return self.playlist_result(entries, program_id, name, description)


class NetEaseMusicDjRadioIE(NetEaseMusicBaseIE):
    """Extractor that lists all programs of a music.163.com radio."""
    IE_NAME = 'netease:djradio'
    IE_DESC = '网易云音乐 - 电台'
    _VALID_URL = r'https?://music\.163\.com/(#/)?djradio\?id=(?P<id>[0-9]+)'
    _TEST = {
        'url': 'http://music.163.com/#/djradio?id=42',
        'info_dict': {
            'id': '42',
            'title': '声音蔓延',
            'description': 'md5:766220985cbd16fdd552f64c578a6b15'
        },
        'playlist_mincount': 40,
        'skip': 'Blocked outside Mainland China',
    }
    # Number of programs requested per API page
    _PAGE_SIZE = 1000

    def _real_extract(self, url):
        """Return a playlist with one program entry per radio program.

        Pages of ``_PAGE_SIZE`` programs are fetched until the API stops
        reporting ``more`` or returns a page without programs. Title and
        description come from the ``radio`` dict of the first program; both
        stay ``None`` for a radio without programs.
        """
        dj_id = self._match_id(url)

        name = None
        desc = None
        entries = []
        for offset in compat_itertools_count(start=0, step=self._PAGE_SIZE):
            info = self.query_api(
                'dj/program/byradio?asc=false&limit=%d&radioId=%s&offset=%d'
                % (self._PAGE_SIZE, dj_id, offset),
                dj_id, 'Downloading dj programs - %d' % offset)

            programs = info.get('programs') or []
            if not programs:
                # An empty page means there is nothing left to fetch; going
                # on would index an empty list or never terminate
                break

            entries.extend(
                self.url_result(
                    'http://music.163.com/#/program?id=%s' % program['id'],
                    'NetEaseMusicProgram', program['id'])
                for program in programs)

            if name is None:
                radio = programs[0]['radio']
                name = radio['name']
                desc = radio['desc']

            if not info.get('more'):
                break

        return self.playlist_result(entries, dj_id, name, desc)
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								# coding: utf-8
 								from __future__ import unicode_literals
-												[neteasemusic] Changes after review

											
										
										
											2015-07-10 07:29:57 +02:00
+								from base64 import b64encode
-												[netease] Get netease music download url through player api (#31235)

* remove unplayable song from test
* compatible with python 2
* using standard User_Agent, fix imports
* use hash instead of long description
* fix lint
* fix hash
											
										
										
											2022-10-11 14:55:09 +02:00
+								from binascii import hexlify
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								from datetime import datetime
-												[netease] Get netease music download url through player api (#31235)

* remove unplayable song from test
* compatible with python 2
* using standard User_Agent, fix imports
* use hash instead of long description
* fix lint
* fix hash
											
										
										
											2022-10-11 14:55:09 +02:00
+								from hashlib import md5
 								from random import randint
 								import json
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								import re
-												[netease] Get netease music download url through player api (#31235)

* remove unplayable song from test
* compatible with python 2
* using standard User_Agent, fix imports
* use hash instead of long description
* fix lint
* fix hash
											
										
										
											2022-10-11 14:55:09 +02:00
+								import time
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
 								from .common import InfoExtractor
-												[netease] Get netease music download url through player api (#31235)

* remove unplayable song from test
* compatible with python 2
* using standard User_Agent, fix imports
* use hash instead of long description
* fix lint
* fix hash
											
										
										
											2022-10-11 14:55:09 +02:00
+								from ..aes import aes_ecb_encrypt, pkcs7_padding
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								from ..compat import (
-												[compat] Add compat_urllib_parse_urlencode and eliminate encode_dict

encode_dict functionality has been improved and moved directly into compat_urllib_parse_urlencode
All occurrences of compat_urllib_parse.urlencode throughout the codebase have been replaced by compat_urllib_parse_urlencode

Closes #8974

											
										
										
											2016-03-25 20:46:57 +01:00
+								    compat_urllib_parse_urlencode,
-												[neteasemusic] Encoding fixes for Python 2.6 and 3.x

											
										
										
											2015-07-10 12:43:38 +02:00
+								    compat_str,
-												[netease:djradio] Use compat_itertools_count

											
										
										
											2015-07-10 12:59:12 +02:00
+								    compat_itertools_count,
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								)
-												[neteasemusic] Use float_or_none

											
										
										
											2016-01-19 21:21:51 +01:00
+								from ..utils import (
-												[netease] Get netease music download url through player api (#31235)

* remove unplayable song from test
* compatible with python 2
* using standard User_Agent, fix imports
* use hash instead of long description
* fix lint
* fix hash
											
										
										
											2022-10-11 14:55:09 +02:00
+								    ExtractorError,
 								    bytes_to_intlist,
-												[netease] Impove error handling (#31303)

* add warnings for users outside of China
* skip empty song urls

Co-authored-by: dirkf <fieldhouse@gmx.net>
											
										
										
											2022-10-30 12:46:46 +01:00
+								    error_to_compat_str,
-												[neteasemusic] Use float_or_none

											
										
										
											2016-01-19 21:21:51 +01:00
+								    float_or_none,
-												[netease] Get netease music download url through player api (#31235)

* remove unplayable song from test
* compatible with python 2
* using standard User_Agent, fix imports
* use hash instead of long description
* fix lint
* fix hash
											
										
										
											2022-10-11 14:55:09 +02:00
+								    int_or_none,
 								    intlist_to_bytes,
 								    sanitized_Request,
 								    std_headers,
 								    try_get,
-												[neteasemusic] Use float_or_none

											
										
										
											2016-01-19 21:21:51 +01:00
+								)
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
 								class NetEaseMusicBaseIE(InfoExtractor):
 								    _FORMATS = ['bMusic', 'mMusic', 'hMusic']
 								    _NETEASE_SALT = '3go8&$8*3*3h0k(2)2'
 								    _API_BASE = 'http://music.163.com/api/'
 								    @classmethod
 								    def _encrypt(cls, dfsid):
-												[neteasemusic] Encoding fixes for Python 2.6 and 3.x

											
										
										
											2015-07-10 12:43:38 +02:00
+								        salt_bytes = bytearray(cls._NETEASE_SALT.encode('utf-8'))
 								        string_bytes = bytearray(compat_str(dfsid).encode('ascii'))
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								        salt_len = len(salt_bytes)
-												[neteasemusic] Changes after review

											
										
										
											2015-07-10 07:29:57 +02:00
+								        for i in range(len(string_bytes)):
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								            string_bytes[i] = string_bytes[i] ^ salt_bytes[i % salt_len]
 								        m = md5()
-												[neteasemusic] Encoding fixes for Python 2.6 and 3.x

											
										
										
											2015-07-10 12:43:38 +02:00
+								        m.update(bytes(string_bytes))
 								        result = b64encode(m.digest()).decode('ascii')
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								        return result.replace('/', '_').replace('+', '-')
-												[netease] Get netease music download url through player api (#31235)

* remove unplayable song from test
* compatible with python 2
* using standard User_Agent, fix imports
* use hash instead of long description
* fix lint
* fix hash
											
										
										
											2022-10-11 14:55:09 +02:00
+								    @classmethod
 								    def make_player_api_request_data_and_headers(cls, song_id, bitrate):
 								        KEY = b'e82ckenh8dichen8'
 								        URL = '/api/song/enhance/player/url'
 								        now = int(time.time() * 1000)
 								        rand = randint(0, 1000)
 								        cookie = {
 								            'osver': None,
 								            'deviceId': None,
 								            'appver': '8.0.0',
 								            'versioncode': '140',
 								            'mobilename': None,
 								            'buildver': '1623435496',
 								            'resolution': '1920x1080',
 								            '__csrf': '',
 								            'os': 'pc',
 								            'channel': None,
 								            'requestId': '{0}_{1:04}'.format(now, rand),
 								        }
 								        request_text = json.dumps(
 								            {'ids': '[{0}]'.format(song_id), 'br': bitrate, 'header': cookie},
 								            separators=(',', ':'))
 								        message = 'nobody{0}use{1}md5forencrypt'.format(
 								            URL, request_text).encode('latin1')
 								        msg_digest = md5(message).hexdigest()
 								        data = '{0}-36cd479b6b5-{1}-36cd479b6b5-{2}'.format(
 								            URL, request_text, msg_digest)
 								        data = pkcs7_padding(bytes_to_intlist(data))
 								        encrypted = intlist_to_bytes(aes_ecb_encrypt(data, bytes_to_intlist(KEY)))
 								        encrypted_params = hexlify(encrypted).decode('ascii').upper()
 								        cookie = '; '.join(
 								            ['{0}={1}'.format(k, v if v is not None else 'undefined')
 								             for [k, v] in cookie.items()])
 								        headers = {
 								            'User-Agent': std_headers['User-Agent'],
 								            'Content-Type': 'application/x-www-form-urlencoded',
 								            'Referer': 'https://music.163.com',
 								            'Cookie': cookie,
 								        }
 								        return ('params={0}'.format(encrypted_params), headers)
 								    def _call_player_api(self, song_id, bitrate):
 								        url = 'https://interface3.music.163.com/eapi/song/enhance/player/url'
 								        data, headers = self.make_player_api_request_data_and_headers(song_id, bitrate)
 								        try:
-												[netease] Impove error handling (#31303)

* add warnings for users outside of China
* skip empty song urls

Co-authored-by: dirkf <fieldhouse@gmx.net>
											
										
										
											2022-10-30 12:46:46 +01:00
+								            msg = 'empty result'
 								            result = self._download_json(
-												[netease] Get netease music download url through player api (#31235)

* remove unplayable song from test
* compatible with python 2
* using standard User_Agent, fix imports
* use hash instead of long description
* fix lint
* fix hash
											
										
										
											2022-10-11 14:55:09 +02:00
+								                url, song_id, data=data.encode('ascii'), headers=headers)
-												[netease] Impove error handling (#31303)

* add warnings for users outside of China
* skip empty song urls

Co-authored-by: dirkf <fieldhouse@gmx.net>
											
										
										
											2022-10-30 12:46:46 +01:00
+								            if result:
 								                return result
-												[netease] Get netease music download url through player api (#31235)

* remove unplayable song from test
* compatible with python 2
* using standard User_Agent, fix imports
* use hash instead of long description
* fix lint
* fix hash
											
										
										
											2022-10-11 14:55:09 +02:00
+								        except ExtractorError as e:
 								            if type(e.cause) in (ValueError, TypeError):
 								                # JSON load failure
 								                raise
-												[netease] Impove error handling (#31303)

* add warnings for users outside of China
* skip empty song urls

Co-authored-by: dirkf <fieldhouse@gmx.net>
											
										
										
											2022-10-30 12:46:46 +01:00
+								        except Exception as e:
 								            msg = error_to_compat_str(e)
 								            self.report_warning('%s API call (%s) failed: %s' % (
 								                song_id, bitrate, msg))
-												[netease] Get netease music download url through player api (#31235)

* remove unplayable song from test
* compatible with python 2
* using standard User_Agent, fix imports
* use hash instead of long description
* fix lint
* fix hash
											
										
										
											2022-10-11 14:55:09 +02:00
+								        return {}
-												[neteasemusic] Fallback to alt hosts if m5.music.126.net doesn't work

											
										
										
											2016-01-17 00:48:46 +01:00
+								    def extract_formats(self, info):
-												[netease] Impove error handling (#31303)

* add warnings for users outside of China
* skip empty song urls

Co-authored-by: dirkf <fieldhouse@gmx.net>
											
										
										
											2022-10-30 12:46:46 +01:00
+								        err = 0
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								        formats = []
-												[netease] Get netease music download url through player api (#31235)

* remove unplayable song from test
* compatible with python 2
* using standard User_Agent, fix imports
* use hash instead of long description
* fix lint
* fix hash
											
										
										
											2022-10-11 14:55:09 +02:00
+								        song_id = info['id']
-												[neteasemusic] Fallback to alt hosts if m5.music.126.net doesn't work

											
										
										
											2016-01-17 00:48:46 +01:00
+								        for song_format in self._FORMATS:
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								            details = info.get(song_format)
 								            if not details:
 								                continue
-												[netease] Get netease music download url through player api (#31235)

* remove unplayable song from test
* compatible with python 2
* using standard User_Agent, fix imports
* use hash instead of long description
* fix lint
* fix hash
											
										
										
											2022-10-11 14:55:09 +02:00
 								            bitrate = int_or_none(details.get('bitrate')) or 999000
 								            data = self._call_player_api(song_id, bitrate)
 								            for song in try_get(data, lambda x: x['data'], list) or []:
 								                song_url = try_get(song, lambda x: x['url'])
-												[netease] Impove error handling (#31303)

* add warnings for users outside of China
* skip empty song urls

Co-authored-by: dirkf <fieldhouse@gmx.net>
											
										
										
											2022-10-30 12:46:46 +01:00
+								                if not song_url:
 								                    continue
-												[neteasemusic] Fallback to alt hosts if m5.music.126.net doesn't work

											
										
										
											2016-01-17 00:48:46 +01:00
+								                if self._is_valid_url(song_url, info['id'], 'song'):
 								                    formats.append({
 								                        'url': song_url,
 								                        'ext': details.get('extension'),
-												[netease] Get netease music download url through player api (#31235)

* remove unplayable song from test
* compatible with python 2
* using standard User_Agent, fix imports
* use hash instead of long description
* fix lint
* fix hash
											
										
										
											2022-10-11 14:55:09 +02:00
+								                        'abr': float_or_none(song.get('br'), scale=1000),
-												[neteasemusic] Fallback to alt hosts if m5.music.126.net doesn't work

											
										
										
											2016-01-17 00:48:46 +01:00
+								                        'format_id': song_format,
-												[netease] Get netease music download url through player api (#31235)

* remove unplayable song from test
* compatible with python 2
* using standard User_Agent, fix imports
* use hash instead of long description
* fix lint
* fix hash
											
										
										
											2022-10-11 14:55:09 +02:00
+								                        'filesize': int_or_none(song.get('size')),
 								                        'asr': int_or_none(details.get('sr')),
-												[neteasemusic] Fallback to alt hosts if m5.music.126.net doesn't work

											
										
										
											2016-01-17 00:48:46 +01:00
+								                    })
-												[netease] Impove error handling (#31303)

* add warnings for users outside of China
* skip empty song urls

Co-authored-by: dirkf <fieldhouse@gmx.net>
											
										
										
											2022-10-30 12:46:46 +01:00
+								                elif err == 0:
 								                    err = try_get(song, lambda x: x['code'], int)
 								        if not formats:
 								            msg = 'No media links found'
 								            if err != 0 and (err < 200 or err >= 400):
 								                raise ExtractorError(
 								                    '%s (site code %d)' % (msg, err, ), expected=True)
 								            else:
 								                self.raise_geo_restricted(
 								                    msg + ': probably this video is not available from your location due to geo restriction.',
 								                    countries=['CN'])
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								        return formats
-												[neteasemusic] Do proper rounding conversion of millisecond timestamps/durations

											
										
										
											2015-06-21 05:44:50 +02:00
+								    @classmethod
 								    def convert_milliseconds(cls, ms):
-												[neteasemusic] PEP8

											
										
										
											2015-07-10 12:30:23 +02:00
+								        return int(round(ms / 1000.0))
-												[neteasemusic] Do proper rounding conversion of millisecond timestamps/durations

											
										
										
											2015-06-21 05:44:50 +02:00
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								    def query_api(self, endpoint, video_id, note):
-												Switch codebase to use sanitized_Request instead of
compat_urllib_request.Request

[downloader/dash] Use sanitized_Request

[downloader/http] Use sanitized_Request

[atresplayer] Use sanitized_Request

[bambuser] Use sanitized_Request

[bliptv] Use sanitized_Request

[brightcove] Use sanitized_Request

[cbs] Use sanitized_Request

[ceskatelevize] Use sanitized_Request

[collegerama] Use sanitized_Request

[extractor/common] Use sanitized_Request

[crunchyroll] Use sanitized_Request

[dailymotion] Use sanitized_Request

[dcn] Use sanitized_Request

[dramafever] Use sanitized_Request

[dumpert] Use sanitized_Request

[eitb] Use sanitized_Request

[escapist] Use sanitized_Request

[everyonesmixtape] Use sanitized_Request

[extremetube] Use sanitized_Request

[facebook] Use sanitized_Request

[fc2] Use sanitized_Request

[flickr] Use sanitized_Request

[4tube] Use sanitized_Request

[gdcvault] Use sanitized_Request

[extractor/generic] Use sanitized_Request

[hearthisat] Use sanitized_Request

[hotnewhiphop] Use sanitized_Request

[hypem] Use sanitized_Request

[iprima] Use sanitized_Request

[ivi] Use sanitized_Request

[keezmovies] Use sanitized_Request

[letv] Use sanitized_Request

[lynda] Use sanitized_Request

[metacafe] Use sanitized_Request

[minhateca] Use sanitized_Request

[miomio] Use sanitized_Request

[meovideo] Use sanitized_Request

[mofosex] Use sanitized_Request

[moniker] Use sanitized_Request

[mooshare] Use sanitized_Request

[movieclips] Use sanitized_Request

[mtv] Use sanitized_Request

[myvideo] Use sanitized_Request

[neteasemusic] Use sanitized_Request

[nfb] Use sanitized_Request

[niconico] Use sanitized_Request

[noco] Use sanitized_Request

[nosvideo] Use sanitized_Request

[novamov] Use sanitized_Request

[nowness] Use sanitized_Request

[nuvid] Use sanitized_Request

[played] Use sanitized_Request

[pluralsight] Use sanitized_Request

[pornhub] Use sanitized_Request

[pornotube] Use sanitized_Request

[primesharetv] Use sanitized_Request

[promptfile] Use sanitized_Request

[qqmusic] Use sanitized_Request

[rtve] Use sanitized_Request

[safari] Use sanitized_Request

[sandia] Use sanitized_Request

[shared] Use sanitized_Request

[sharesix] Use sanitized_Request

[sina] Use sanitized_Request

[smotri] Use sanitized_Request

[sohu] Use sanitized_Request

[spankwire] Use sanitized_Request

[sportdeutschland] Use sanitized_Request

[streamcloud] Use sanitized_Request

[streamcz] Use sanitized_Request

[tapely] Use sanitized_Request

[tube8] Use sanitized_Request

[tubitv] Use sanitized_Request

[twitch] Use sanitized_Request

[twitter] Use sanitized_Request

[udemy] Use sanitized_Request

[vbox7] Use sanitized_Request

[veoh] Use sanitized_Request

[vessel] Use sanitized_Request

[vevo] Use sanitized_Request

[viddler] Use sanitized_Request

[videomega] Use sanitized_Request

[viewvster] Use sanitized_Request

[viki] Use sanitized_Request

[vk] Use sanitized_Request

[vodlocker] Use sanitized_Request

[voicerepublic] Use sanitized_Request

[wistia] Use sanitized_Request

[xfileshare] Use sanitized_Request

[xtube] Use sanitized_Request

[xvideos] Use sanitized_Request

[yandexmusic] Use sanitized_Request

[youku] Use sanitized_Request

[youporn] Use sanitized_Request

[youtube] Use sanitized_Request

[patreon] Use sanitized_Request

[extractor/common] Remove unused import

[nfb] PEP 8

											
										
										
											2015-11-21 17:18:17 +01:00
+								        req = sanitized_Request('%s%s' % (self._API_BASE, endpoint))
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								        req.add_header('Referer', self._API_BASE)
 								        return self._download_json(req, video_id, note)
 								class NetEaseMusicIE(NetEaseMusicBaseIE):
 								    IE_NAME = 'netease:song'
-												[neteasemusic] Add localized name

											
										
										
											2015-07-10 18:51:35 +02:00
+								    IE_DESC = '网易云音乐'
-												[netease] Support urls shared from mobile app (#31304)

Co-authored-by: dirkf <fieldhouse@gmx.net>
											
										
										
											2022-10-30 12:48:44 +01:00
+								    _VALID_URL = r'https?://(y\.)?music\.163\.com/(?:[#m]/)?song\?.*?\bid=(?P<id>[0-9]+)'
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								    _TESTS = [{
 								        'url': 'http://music.163.com/#/song?id=32102397',
-												[netease] Get netease music download url through player api (#31235)

* remove unplayable song from test
* compatible with python 2
* using standard User_Agent, fix imports
* use hash instead of long description
* fix lint
* fix hash
											
										
										
											2022-10-11 14:55:09 +02:00
+								        'md5': '3e909614ce09b1ccef4a3eb205441190',
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								        'info_dict': {
 								            'id': '32102397',
 								            'ext': 'mp3',
-												[netease] Get netease music download url through player api (#31235)

* remove unplayable song from test
* compatible with python 2
* using standard User_Agent, fix imports
* use hash instead of long description
* fix lint
* fix hash
											
										
										
											2022-10-11 14:55:09 +02:00
+								            'title': 'Bad Blood',
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								            'creator': 'Taylor Swift / Kendrick Lamar',
-												[netease] Get netease music download url through player api (#31235)

* remove unplayable song from test
* compatible with python 2
* using standard User_Agent, fix imports
* use hash instead of long description
* fix lint
* fix hash
											
										
										
											2022-10-11 14:55:09 +02:00
+								            'upload_date': '20150516',
 								            'timestamp': 1431792000,
 								            'description': 'md5:25fc5f27e47aad975aa6d36382c7833c',
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								        },
 								    }, {
 								        'note': 'No lyrics.',
 								        'url': 'http://music.163.com/song?id=17241424',
 								        'info_dict': {
 								            'id': '17241424',
 								            'ext': 'mp3',
 								            'title': 'Opus 28',
 								            'creator': 'Dustin O\'Halloran',
 								            'upload_date': '20080211',
-												[netease] Get netease music download url through player api (#31235)

* remove unplayable song from test
* compatible with python 2
* using standard User_Agent, fix imports
* use hash instead of long description
* fix lint
* fix hash
											
										
										
											2022-10-11 14:55:09 +02:00
+								            'description': 'md5:f12945b0f6e0365e3b73c5032e1b0ff4',
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								            'timestamp': 1202745600,
 								        },
-												[neteasemusic] Changes after review

											
										
										
											2015-07-10 07:29:57 +02:00
+								    }, {
 								        'note': 'Has translated name.',
 								        'url': 'http://music.163.com/#/song?id=22735043',
 								        'info_dict': {
 								            'id': '22735043',
 								            'ext': 'mp3',
 								            'title': '소원을 말해봐 (Genie)',
 								            'creator': '少女时代',
 								            'description': 'md5:79d99cc560e4ca97e0c4d86800ee4184',
 								            'upload_date': '20100127',
 								            'timestamp': 1264608000,
 								            'alt_title': '说出愿望吧(Genie)',
-												[netease] Skip all tests: completely georestricted

											
										
										
											2016-04-12 22:50:44 +02:00
+								        },
-												[netease] Support urls shared from mobile app (#31304)

Co-authored-by: dirkf <fieldhouse@gmx.net>
											
										
										
											2022-10-30 12:48:44 +01:00
+								    }, {
 								        'url': 'https://y.music.163.com/m/song?app_version=8.8.45&id=95670&uct2=sKnvS4+0YStsWkqsPhFijw%3D%3D&dlt=0846',
 								        'md5': '95826c73ea50b1c288b22180ec9e754d',
 								        'info_dict': {
 								            'id': '95670',
 								            'ext': 'mp3',
 								            'title': '国际歌',
 								            'creator': '马备',
 								            'upload_date': '19911130',
 								            'timestamp': 691516800,
 								            'description': 'md5:1ba2f911a2b0aa398479f595224f2141',
 								        },
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								    }]
 								    def _process_lyrics(self, lyrics_info):
 								        original = lyrics_info.get('lrc', {}).get('lyric')
 								        translated = lyrics_info.get('tlyric', {}).get('lyric')
 								        if not translated:
 								            return original
 								        lyrics_expr = r'(\[[0-9]{2}:[0-9]{2}\.[0-9]{2,}\])([^\n]+)'
 								        original_ts_texts = re.findall(lyrics_expr, original)
-												[neteasemusic] Changes after review

											
										
										
											2015-07-10 07:29:57 +02:00
+								        translation_ts_dict = dict(
 								            (time_stamp, text) for time_stamp, text in re.findall(lyrics_expr, translated)
 								        )
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								        lyrics = '\n'.join([
 								            '%s%s / %s' % (time_stamp, text, translation_ts_dict.get(time_stamp, ''))
 								            for time_stamp, text in original_ts_texts
 								        ])
 								        return lyrics
 								    def _real_extract(self, url):
 								        song_id = self._match_id(url)
 								        params = {
 								            'id': song_id,
 								            'ids': '[%s]' % song_id
 								        }
 								        info = self.query_api(
-												[compat] Add compat_urllib_parse_urlencode and eliminate encode_dict

encode_dict functionality has been improved and moved directly into compat_urllib_parse_urlencode
All occurrences of compat_urllib_parse.urlencode throughout the codebase have been replaced by compat_urllib_parse_urlencode

Closes #8974

											
										
										
											2016-03-25 20:46:57 +01:00
+								            'song/detail?' + compat_urllib_parse_urlencode(params),
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								            song_id, 'Downloading song info')['songs'][0]
 								        formats = self.extract_formats(info)
 								        self._sort_formats(formats)
 								        lyrics_info = self.query_api(
-												[neteasemusic] PEP8

											
										
										
											2015-07-10 12:30:23 +02:00
+								            'song/lyric?id=%s&lv=-1&tv=-1' % song_id,
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								            song_id, 'Downloading lyrics data')
 								        lyrics = self._process_lyrics(lyrics_info)
 								        alt_title = None
-												[neteasemusic] Changes after review

											
										
										
											2015-07-10 07:29:57 +02:00
+								        if info.get('transNames'):
 								            alt_title = '/'.join(info.get('transNames'))
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
 								        return {
 								            'id': song_id,
 								            'title': info['name'],
 								            'alt_title': alt_title,
 								            'creator': ' / '.join([artist['name'] for artist in info.get('artists', [])]),
-												[neteasemusic] Do proper rounding conversion of millisecond timestamps/durations

											
										
										
											2015-06-21 05:44:50 +02:00
+								            'timestamp': self.convert_milliseconds(info.get('album', {}).get('publishTime')),
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								            'thumbnail': info.get('album', {}).get('picUrl'),
-												[neteasemusic] Do proper rounding conversion of millisecond timestamps/durations

											
										
										
											2015-06-21 05:44:50 +02:00
+								            'duration': self.convert_milliseconds(info.get('duration', 0)),
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								            'description': lyrics,
 								            'formats': formats,
 								        }
 								class NetEaseMusicAlbumIE(NetEaseMusicBaseIE):
 								    IE_NAME = 'netease:album'
-												[neteasemusic] Add more localized names

											
										
										
											2015-07-10 19:21:18 +02:00
+								    IE_DESC = '网易云音乐 - 专辑'
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								    _VALID_URL = r'https?://music\.163\.com/(#/)?album\?id=(?P<id>[0-9]+)'
 								    _TEST = {
 								        'url': 'http://music.163.com/#/album?id=220780',
 								        'info_dict': {
 								            'id': '220780',
 								            'title': 'B\'day',
 								        },
 								        'playlist_count': 23,
-												[netease] Skip all tests: completely georestricted

											
										
										
											2016-04-12 22:50:44 +02:00
+								        'skip': 'Blocked outside Mainland China',
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								    }
 								    def _real_extract(self, url):
 								        album_id = self._match_id(url)
 								        info = self.query_api(
-												[neteasemusic] PEP8

											
										
										
											2015-07-10 12:30:23 +02:00
+								            'album/%s?id=%s' % (album_id, album_id),
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								            album_id, 'Downloading album data')['album']
 								        name = info['name']
 								        desc = info.get('description')
 								        entries = [
 								            self.url_result('http://music.163.com/#/song?id=%s' % song['id'],
 								                            'NetEaseMusic', song['id'])
 								            for song in info['songs']
 								        ]
 								        return self.playlist_result(entries, album_id, name, desc)
 								class NetEaseMusicSingerIE(NetEaseMusicBaseIE):
 								    IE_NAME = 'netease:singer'
-												[neteasemusic] Add more localized names

											
										
										
											2015-07-10 19:21:18 +02:00
+								    IE_DESC = '网易云音乐 - 歌手'
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								    _VALID_URL = r'https?://music\.163\.com/(#/)?artist\?id=(?P<id>[0-9]+)'
 								    _TESTS = [{
 								        'note': 'Singer has aliases.',
 								        'url': 'http://music.163.com/#/artist?id=10559',
 								        'info_dict': {
 								            'id': '10559',
 								            'title': '张惠妹 - aMEI;阿密特',
 								        },
 								        'playlist_count': 50,
-												[netease] Skip all tests: completely georestricted

											
										
										
											2016-04-12 22:50:44 +02:00
+								        'skip': 'Blocked outside Mainland China',
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								    }, {
 								        'note': 'Singer has translated name.',
 								        'url': 'http://music.163.com/#/artist?id=124098',
 								        'info_dict': {
 								            'id': '124098',
 								            'title': '李昇基 - 이승기',
 								        },
 								        'playlist_count': 50,
-												[netease] Skip all tests: completely georestricted

											
										
										
											2016-04-12 22:50:44 +02:00
+								        'skip': 'Blocked outside Mainland China',
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								    }]
 								    def _real_extract(self, url):
 								        singer_id = self._match_id(url)
 								        info = self.query_api(
-												[neteasemusic] PEP8

											
										
										
											2015-07-10 12:30:23 +02:00
+								            'artist/%s?id=%s' % (singer_id, singer_id),
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								            singer_id, 'Downloading singer data')
 								        name = info['artist']['name']
 								        if info['artist']['trans']:
 								            name = '%s - %s' % (name, info['artist']['trans'])
 								        if info['artist']['alias']:
-												[kuwo] Regular expression improvements

1. Prevent .+ and .*
2. Use [^>]+ instead of spaces for HTML tags
3. Remove unnecessary trailing parts

											
										
										
											2015-07-10 17:23:07 +02:00
+								            name = '%s - %s' % (name, ';'.join(info['artist']['alias']))
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
 								        entries = [
 								            self.url_result('http://music.163.com/#/song?id=%s' % song['id'],
 								                            'NetEaseMusic', song['id'])
 								            for song in info['hotSongs']
 								        ]
 								        return self.playlist_result(entries, singer_id, name)
 								class NetEaseMusicListIE(NetEaseMusicBaseIE):
 								    IE_NAME = 'netease:playlist'
-												[neteasemusic] Add more localized names

											
										
										
											2015-07-10 19:21:18 +02:00
+								    IE_DESC = '网易云音乐 - 歌单'
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								    _VALID_URL = r'https?://music\.163\.com/(#/)?(playlist|discover/toplist)\?id=(?P<id>[0-9]+)'
 								    _TESTS = [{
 								        'url': 'http://music.163.com/#/playlist?id=79177352',
 								        'info_dict': {
 								            'id': '79177352',
 								            'title': 'Billboard 2007 Top 100',
 								            'description': 'md5:12fd0819cab2965b9583ace0f8b7b022'
 								        },
 								        'playlist_count': 99,
-												[netease] Skip all tests: completely georestricted

											
										
										
											2016-04-12 22:50:44 +02:00
+								        'skip': 'Blocked outside Mainland China',
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								    }, {
 								        'note': 'Toplist/Charts sample',
 								        'url': 'http://music.163.com/#/discover/toplist?id=3733003',
 								        'info_dict': {
 								            'id': '3733003',
 								            'title': 're:韩国Melon排行榜周榜 [0-9]{4}-[0-9]{2}-[0-9]{2}',
 								            'description': 'md5:73ec782a612711cadc7872d9c1e134fc',
 								        },
 								        'playlist_count': 50,
-												[netease] Skip all tests: completely georestricted

											
										
										
											2016-04-12 22:50:44 +02:00
+								        'skip': 'Blocked outside Mainland China',
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								    }]
 								    def _real_extract(self, url):
 								        list_id = self._match_id(url)
 								        info = self.query_api(
-												[neteasemusic] PEP8

											
										
										
											2015-07-10 12:30:23 +02:00
+								            'playlist/detail?id=%s&lv=-1&tv=-1' % list_id,
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								            list_id, 'Downloading playlist data')['result']
 								        name = info['name']
 								        desc = info.get('description')
 								        if info.get('specialType') == 10:  # is a chart/toplist
-												[neteasemusic] Do proper rounding conversion of millisecond timestamps/durations

											
										
										
											2015-06-21 05:44:50 +02:00
+								            datestamp = datetime.fromtimestamp(
 								                self.convert_milliseconds(info['updateTime'])).strftime('%Y-%m-%d')
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								            name = '%s %s' % (name, datestamp)
 								        entries = [
 								            self.url_result('http://music.163.com/#/song?id=%s' % song['id'],
 								                            'NetEaseMusic', song['id'])
 								            for song in info['tracks']
 								        ]
 								        return self.playlist_result(entries, list_id, name, desc)
 								class NetEaseMusicMvIE(NetEaseMusicBaseIE):
 								    IE_NAME = 'netease:mv'
-												[neteasemusic] Add more localized names

											
										
										
											2015-07-10 19:21:18 +02:00
+								    IE_DESC = '网易云音乐 - MV'
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								    _VALID_URL = r'https?://music\.163\.com/(#/)?mv\?id=(?P<id>[0-9]+)'
 								    _TEST = {
 								        'url': 'http://music.163.com/#/mv?id=415350',
 								        'info_dict': {
 								            'id': '415350',
 								            'ext': 'mp4',
 								            'title': '이럴거면 그러지말지',
 								            'description': '白雅言自作曲唱甜蜜爱情',
 								            'creator': '白雅言',
 								            'upload_date': '20150520',
 								        },
-												[netease] Skip all tests: completely georestricted

											
										
										
											2016-04-12 22:50:44 +02:00
+								        'skip': 'Blocked outside Mainland China',
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								    }
 								    def _real_extract(self, url):
 								        mv_id = self._match_id(url)
 								        info = self.query_api(
 								            'mv/detail?id=%s&type=mp4' % mv_id,
 								            mv_id, 'Downloading mv info')['data']
 								        formats = [
-												[neteasemusic] Changes after review

											
										
										
											2015-07-10 07:29:57 +02:00
+								            {'url': mv_url, 'ext': 'mp4', 'format_id': '%sp' % brs, 'height': int(brs)}
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								            for brs, mv_url in info['brs'].items()
 								        ]
 								        self._sort_formats(formats)
 								        return {
 								            'id': mv_id,
 								            'title': info['name'],
 								            'description': info.get('desc') or info.get('briefDesc'),
 								            'creator': info['artistName'],
 								            'upload_date': info['publishTime'].replace('-', ''),
 								            'formats': formats,
 								            'thumbnail': info.get('cover'),
-												[neteasemusic] Do proper rounding conversion of millisecond timestamps/durations

											
										
										
											2015-06-21 05:44:50 +02:00
+								            'duration': self.convert_milliseconds(info.get('duration', 0)),
-												[neteasemusic] Add new extractor for music.163.com

											
										
										
											2015-06-21 05:12:31 +02:00
+								        }
 								class NetEaseMusicProgramIE(NetEaseMusicBaseIE):
 								    # Extractor for a single radio program page on music.163.com.
 								    #
 								    # A program always has a main audio track ('mainSong') and may list
 								    # accompanying songs ('songs'). Without accompanying songs, or when
 								    # --no-playlist is given, only the main audio is returned; otherwise a
 								    # playlist of the main song followed by the accompanying songs is
 								    # returned.
 								    IE_NAME = 'netease:program'
 								    IE_DESC = '网易云音乐 - 电台节目'
 								    # The '#' (optionally followed by '/') prefix is optional so that both
 								    # '/#/program?id=...' and the plain '/program?id=...' form are accepted,
 								    # in line with the djradio extractor's pattern.
 								    _VALID_URL = r'https?://music\.163\.com/(?:#/?)?program\?id=(?P<id>[0-9]+)'
 								    _TESTS = [{
 								        'url': 'http://music.163.com/#/program?id=10109055',
 								        'info_dict': {
 								            'id': '10109055',
 								            'ext': 'mp3',
 								            'title': '不丹足球背后的故事',
 								            'description': '喜马拉雅人的足球梦 ...',
 								            'creator': '大话西藏',
 								            'timestamp': 1434179342,
 								            'upload_date': '20150613',
 								            'duration': 900,
 								        },
 								        'skip': 'Blocked outside Mainland China',
 								    }, {
 								        'note': 'This program has accompanying songs.',
 								        'url': 'http://music.163.com/#/program?id=10141022',
 								        'info_dict': {
 								            'id': '10141022',
 								            'title': '25岁，你是自在如风的少年<27°C>',
 								            'description': 'md5:8d594db46cc3e6509107ede70a4aaa3b',
 								        },
 								        'playlist_count': 4,
 								        'skip': 'Blocked outside Mainland China',
 								    }, {
 								        'note': 'This program has accompanying songs.',
 								        'url': 'http://music.163.com/#/program?id=10141022',
 								        'info_dict': {
 								            'id': '10141022',
 								            'ext': 'mp3',
 								            'title': '25岁，你是自在如风的少年<27°C>',
 								            'description': 'md5:8d594db46cc3e6509107ede70a4aaa3b',
 								            'timestamp': 1434450841,
 								            'upload_date': '20150616',
 								        },
 								        'params': {
 								            'noplaylist': True
 								        },
 								        'skip': 'Blocked outside Mainland China',
 								    }, {
 								        # Same page addressed without the '#/' fragment prefix.
 								        'url': 'http://music.163.com/program?id=10109055',
 								        'only_matching': True,
 								    }]

 								    def _real_extract(self, url):
 								        # Returns either a single-audio info dict or a playlist result,
 								        # depending on whether the program has accompanying songs and on
 								        # the 'noplaylist' option.
 								        program_id = self._match_id(url)

 								        info = self.query_api(
 								            'dj/program/detail?id=%s' % program_id,
 								            program_id, 'Downloading program info')['program']

 								        name = info['name']
 								        description = info['description']

 								        if not info['songs'] or self._downloader.params.get('noplaylist'):
 								            # Only tell the user about --no-playlist when there actually
 								            # was a playlist to skip.
 								            if info['songs']:
 								                self.to_screen(
 								                    'Downloading just the main audio %s because of --no-playlist'
 								                    % info['mainSong']['id'])

 								            formats = self.extract_formats(info['mainSong'])
 								            self._sort_formats(formats)

 								            return {
 								                'id': program_id,
 								                'title': name,
 								                'description': description,
 								                'creator': info['dj']['brand'],
 								                # The API reports these values in milliseconds.
 								                'timestamp': self.convert_milliseconds(info['createTime']),
 								                'thumbnail': info['coverUrl'],
 								                'duration': self.convert_milliseconds(info.get('duration', 0)),
 								                'formats': formats,
 								            }

 								        self.to_screen(
 								            'Downloading playlist %s - add --no-playlist to just download the main audio %s'
 								            % (program_id, info['mainSong']['id']))

 								        # The main song comes first, followed by the accompanying songs.
 								        song_ids = [info['mainSong']['id']]
 								        song_ids.extend([song['id'] for song in info['songs']])
 								        entries = [
 								            self.url_result('http://music.163.com/#/song?id=%s' % song_id,
 								                            'NetEaseMusic', song_id)
 								            for song_id in song_ids
 								        ]
 								        return self.playlist_result(entries, program_id, name, description)
 								class NetEaseMusicDjRadioIE(NetEaseMusicBaseIE):
 								    # Extractor for a DJ radio page on music.163.com; the result is a
 								    # playlist with one entry per program of the radio.
 								    IE_NAME = 'netease:djradio'
 								    IE_DESC = '网易云音乐 - 电台'
 								    _VALID_URL = r'https?://music\.163\.com/(#/)?djradio\?id=(?P<id>[0-9]+)'
 								    _TEST = {
 								        'url': 'http://music.163.com/#/djradio?id=42',
 								        'info_dict': {
 								            'id': '42',
 								            'title': '声音蔓延',
 								            'description': 'md5:766220985cbd16fdd552f64c578a6b15'
 								        },
 								        'playlist_mincount': 40,
 								        'skip': 'Blocked outside Mainland China',
 								    }
 								    # Number of programs requested per API call ('limit' parameter).
 								    _PAGE_SIZE = 1000

 								    def _real_extract(self, url):
 								        # Pages through the radio's program list and returns a playlist
 								        # of program URLs. Title and description are taken from the
 								        # 'radio' object of the first program seen; they stay None when
 								        # the radio has no programs.
 								        dj_id = self._match_id(url)
 								        name = None
 								        desc = None
 								        entries = []

 								        for offset in compat_itertools_count(start=0, step=self._PAGE_SIZE):
 								            info = self.query_api(
 								                'dj/program/byradio?asc=false&limit=%d&radioId=%s&offset=%d'
 								                % (self._PAGE_SIZE, dj_id, offset),
 								                dj_id, 'Downloading dj programs - %d' % offset)

 								            programs = info['programs']
 								            entries.extend([
 								                self.url_result(
 								                    'http://music.163.com/#/program?id=%s' % program['id'],
 								                    'NetEaseMusicProgram', program['id'])
 								                for program in programs
 								            ])

 								            # Guard against an empty page: indexing [0] on an empty
 								            # program list would raise IndexError.
 								            if name is None and programs:
 								                radio = programs[0]['radio']
 								                name = radio['name']
 								                desc = radio['desc']

 								            # Stop on the last page. Also stop on an empty page so that
 								            # a response claiming 'more' without delivering programs
 								            # cannot cause endless requests.
 								            if not programs or not info['more']:
 								                break

 								        return self.playlist_result(entries, dj_id, name, desc)