From 2580b0a1eb71a7935825ff7248245500ebaa2c60 Mon Sep 17 00:00:00 2001 From: r0oth3x49 Date: Sat, 9 Mar 2019 14:41:14 +0500 Subject: [PATCH] fixed #340, trailing space issue in windows 10 .. --- udemy/_extract.py | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/udemy/_extract.py b/udemy/_extract.py index cc13a57..7a4aebc 100644 --- a/udemy/_extract.py +++ b/udemy/_extract.py @@ -66,7 +66,8 @@ def __init__(self): def _clean(self, text): ok = re.compile(r'[^\\/:*?"<>|]') text = "".join(x if ok.match(x) else "_" for x in text) - return re.sub('\.+$', '', text.rstrip()) if text.endswith(".") else text.rstrip() + text = re.sub(r'\.+$', '', text.strip()) + return text def _course_name(self, url): # mobj = re.search(r'(?i)(?:(.+)\.com/(?P[a-zA-Z0-9_-]+))', url, re.I) @@ -525,7 +526,7 @@ def _real_extract(self, url=''): text = '\r' + fc + sd + "[" + fm + sb + "*" + fc + sd + "] : " + fg + sb + "Downloading course information .. " self._spinner(text) lecture_index = entry.get('object_index') - lecture_title = self._sanitize(entry.get('title')) + lecture_title = self._clean(self._sanitize(entry.get('title'))) lecture = "{0:03d} {1!s}".format(lecture_index, lecture_title) unsafe_lecture = u'{0:03d} '.format(lecture_index) + entry.get('title') data, subs = self._html_to_json(view_html, lecture_id) @@ -563,7 +564,7 @@ def _real_extract(self, url=''): text = '\r' + fc + sd + "[" + fm + sb + "*" + fc + sd + "] : " + fg + sb + "Downloading course information .. " self._spinner(text) lecture_index = entry.get('object_index') - lecture_title = self._sanitize(entry.get('title')) + lecture_title = self._clean(self._sanitize(entry.get('title'))) lecture = "{0:03d} {1!s}".format(lecture_index, lecture_title) unsafe_lecture = u'{0:03d} '.format(lecture_index) + self._clean(entry.get('title')) data = asset.get('stream_urls')