We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 50547b0, commit d43fb61 (Copy full SHA for d43fb61)
geektime_dl/geektime_ebook/maker.py
@@ -41,8 +41,14 @@ def generate_cover_img(url, output_dir):
41
42
def parse_image(content, output_dir):
43
44
- p = r'img src="(.*?)"'
45
- img_url_list = re.findall(p, content, re.S)
+ # remove the xxx `style=xxx`
+ p = r'img (.{1,15}=".*?") src=".*?"'
46
+ fucking_styles = re.findall(p, content)
47
+ for style in fucking_styles:
48
+ content = content.replace(style, '')
49
+
50
+ p = r'img\s+src="(.*?)"'
51
+ img_url_list = re.findall(p, content)
52
for url in img_url_list:
53
try:
54
url_local = str(uuid.uuid4()) + '.jpg'
0 commit comments