[xminus] Capture description (#4300)

This commit is contained in:
Philipp Hagemeister 2014-12-04 17:43:34 +01:00
parent e8df5cee12
commit 81028ff9eb

View File

@@ -1,6 +1,8 @@
# coding: utf-8 # coding: utf-8
from __future__ import unicode_literals from __future__ import unicode_literals
import re
from .common import InfoExtractor from .common import InfoExtractor
from ..compat import ( from ..compat import (
compat_chr, compat_chr,
@@ -25,6 +27,7 @@ class XMinusIE(InfoExtractor):
'tbr': 320, 'tbr': 320,
'filesize_approx': 5900000, 'filesize_approx': 5900000,
'view_count': int, 'view_count': int,
'description': 'md5:03238c5b663810bc79cf42ef3c03e371',
} }
} }
@@ -48,6 +51,11 @@ def _real_extract(self, url):
view_count = int_or_none(self._html_search_regex( view_count = int_or_none(self._html_search_regex(
r'<div class="quality.*?► ([0-9]+)', r'<div class="quality.*?► ([0-9]+)',
webpage, 'view count', fatal=False)) webpage, 'view count', fatal=False))
description = self._html_search_regex(
r'(?s)<div id="song_texts">(.*?)</div><br',
webpage, 'song lyrics', fatal=False)
if description:
description = re.sub(' *\r *', '\n', description)
enc_token = self._html_search_regex( enc_token = self._html_search_regex(
r'minus_track\.tkn="(.+?)"', webpage, 'enc_token') r'minus_track\.tkn="(.+?)"', webpage, 'enc_token')
@@ -64,4 +72,5 @@ def _real_extract(self, url):
'filesize_approx': filesize_approx, 'filesize_approx': filesize_approx,
'tbr': tbr, 'tbr': tbr,
'view_count': view_count, 'view_count': view_count,
'description': description,
} }