[slideshare] fix description extraction
This commit is contained in:
parent
252a1f75d2
commit
77082c7b9e
1 changed files with 3 additions and 2 deletions
|
@ -9,6 +9,7 @@ from ..compat import (
|
|||
)
|
||||
from ..utils import (
|
||||
ExtractorError,
|
||||
get_element_by_id,
|
||||
)
|
||||
|
||||
|
||||
|
@ -40,7 +41,7 @@ class SlideshareIE(InfoExtractor):
|
|||
bucket = info['jsplayer']['video_bucket']
|
||||
ext = info['jsplayer']['video_extension']
|
||||
video_url = compat_urlparse.urljoin(bucket, doc + '-SD.' + ext)
|
||||
description = self._html_search_regex(
|
||||
description = get_element_by_id('slideshow-description-paragraph', webpage) or self._html_search_regex(
|
||||
r'(?s)<p[^>]+itemprop="description"[^>]*>(.+?)</p>', webpage,
|
||||
'description', fatal=False)
|
||||
|
||||
|
@ -51,5 +52,5 @@ class SlideshareIE(InfoExtractor):
|
|||
'ext': ext,
|
||||
'url': video_url,
|
||||
'thumbnail': info['slideshow']['pin_image_url'],
|
||||
'description': description,
|
||||
'description': description.strip() if description else None,
|
||||
}
|
||||
|
|
Loading…
Reference in a new issue