-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathfile_compress.py
84 lines (75 loc) · 3.88 KB
/
file_compress.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
'''
@Version: 0.0.1
@Author: ider
@Date: 2019-08-10 16:55:38
@LastEditors: ider
@LastEditTime: 2019-08-11 22:06:28
@Description: 压缩 图片和 html
'''
from bs4 import BeautifulSoup
import base64
from PIL import Image
import io
import os
Image.MAX_IMAGE_PIXELS = None
IMG_REPLACE = {
'':''
}
def compress_base64_img(data):
img_data = base64.b64decode(data.encode('utf8'))
img = Image.open(io.BytesIO(img_data))
newio = io.BytesIO()
try:
img.save(newio,format='webp',quality=10,lossless=False)
format = 'webp'
except OSError:
# webp 不能转换的使用黑白图保存为 png
img = img.convert('1')
img.save(newio,format='png',quality=10,optimize=True)
format = 'png'
newio.seek(0)
return base64.b64encode(newio.read()).decode('utf8'), format
def compress(file_path):
if file_path.endswith('.png'):
return compress_png(file_path)
elif file_path.endswith('.html'):
return compress_html(file_path)
return file_path
def compress_png(file_path):
with open(file_path,'rb')as f:
im = Image.open(f)
try:
new_file_path = file_path.rstrip('png') + 'webp'
with open(new_file_path,'wb')as fp:
im.save(fp,format='webp',quality=10,lossless=False)
except OSError:
with open(file_path,'wb')as fp:
im = im.convert('1')
im.save(fp,format='png',quality=10,optimize=True)
new_file_path = file_path
return new_file_path
def compress_html(file_path):
with open(file_path,'rb')as f:
html = f.read()
soup = BeautifulSoup(html,'lxml')
for img in soup.select('img'):
data = img.attrs.get('src')
if not data or not data.startswith('data:image'):
continue
if data.startswith('data:image/webp;base64'):
continue
line = data.split(',')
data, format = compress_base64_img(line[1])
img.attrs['src'] = 'data:image/'+format+';base64,'+data
ret_data = str(soup)
for k,v in IMG_REPLACE.items():
ret_data = ret_data.replace(k,v)
if len(ret_data):
with open(file_path,'wt')as f:
f.write(ret_data)
return file_path
if __name__ == '__main__':
print(compress('/tmp/cccc/img-3-3.png'))
print(compress('/tmp/cccc/temp.html'))
# print(compress('/home/ider/Downloads/tmp/cc.html'))
print(compress('/home/ider/Downloads/tmp/large.png'))