python - 将 PIL 图像转换为 base64 的更快方法
问题描述
这是我将 PIL 图像转换为 base64 的函数:
# input: single PIL image
def image_to_base64(self, image):
output_buffer = BytesIO()
now_time = time.time()
image.save(output_buffer, format='PNG')
print('--image.save:' + str(time.time()-now_time))
now_time = time.time()
byte_data = output_buffer.getvalue()
print('--output_buffer.getvalue:' + str(time.time()-now_time))
now_time = time.time()
encoded_input_string = base64.b64encode(byte_data)
print('--base64.b64encode:' + str(time.time()-now_time))
now_time = time.time()
input_string = encoded_input_string.decode("utf-8")
print('--encoded_input_string.decode:' + str(time.time()-now_time))
return input_string
我的输出:
--image.save:1.05138802528
--output_buffer.getvalue:0.000611066818237
--base64.b64编码:0.01047706604
--encoded_input_string.decode:0.0172328948975
正如我们所看到的,该功能非常缓慢。我们该怎样改进这个?
[编辑]
好的!这是完整的例子
import time
import requests
import base64
from PIL import Image
from io import BytesIO
# input: single PIL image
def image_to_base64(image):
output_buffer = BytesIO()
now_time = time.time()
image.save(output_buffer, format='PNG')
print('--image.save:' + str(time.time()-now_time))
now_time = time.time()
byte_data = output_buffer.getvalue()
print('--output_buffer.getvalue:' + str(time.time()-now_time))
now_time = time.time()
encoded_input_string = base64.b64encode(byte_data)
print('--base64.b64encode:' + str(time.time()-now_time))
now_time = time.time()
input_string = encoded_input_string.decode("utf-8")
print('--encoded_input_string.decode:' + str(time.time()-now_time))
return input_string
img_url = "https://www.cityscapes-dataset.com/wordpress/wp-content/uploads/2015/07/stuttgart03.png"
response = requests.get(img_url)
img = Image.open(BytesIO(response.content))
input_string = image_to_base64(img)
这里的瓶颈是
image.save(output_buffer, format='PNG')
它将 PIL 图像转换为字节。我想如果我能加快这一步就好了。
解决方案
As suggested in the comments, I tried pyvips
as below:
#!/usr/bin/env python3
import requests
import base64
import numpy as np
from PIL import Image
from io import BytesIO
from cv2 import imencode
import pyvips
def vips_2PNG(image,compression=6):
# Convert PIL Image to Numpy array
na = np.array(image)
height, width, bands = na.shape
# Convert Numpy array to Vips image
dtype_to_format = {
'uint8': 'uchar',
'int8': 'char',
'uint16': 'ushort',
'int16': 'short',
'uint32': 'uint',
'int32': 'int',
'float32': 'float',
'float64': 'double',
'complex64': 'complex',
'complex128': 'dpcomplex',
}
linear = na.reshape(width * height * bands)
vi = pyvips.Image.new_from_memory(linear.data, width, height, bands,dtype_to_format[str(na.dtype)])
# Save to memory buffer as PNG
data = vi.write_to_buffer(f".png[compression={compression}]")
return data
def vips_including_reading_from_disk(image):
# Load image from disk
image = pyvips.Image.new_from_file('stuttgart.png', access='sequential')
# Save to memory buffer as PNG
data = image.write_to_buffer('.png')
return data
def faster(image):
image_arr = np.array(image)
_, byte_data = imencode('.png', image_arr)
return byte_data
def orig(image, faster=True):
output_buffer = BytesIO()
image.save(output_buffer, format='PNG')
byte_data = output_buffer.getvalue()
return byte_data
# img_url = "https://www.cityscapes-dataset.com/wordpress/wp-content/uploads/2015/07/stuttgart03.png"
filename = 'stuttgart.png'
img = Image.open(filename)
# r = orig(img)
# print(len(r))
# %timeit r = orig(img)
# r = faster(img)
# print(len(r))
# %timeit r = faster(img)
# r = vips_including_reading_from_disk(filename)
# print(len(r))
# %timeit r = vips_including_reading_from_disk(filename)
# r = vips_2PNG(img,0)
# print(len(r))
# %timeit r = vips_2PNG(img,0)
I was looking at trading off the compression
parameter between file size and speed. Here is what I got - I wouldn't compare absolute values, but rather look at the performance relative to each other on my machine:
Filesize Time
PIL 1.7MB 1.12s
OpenCV 2.0MB 173ms <--- COMPARE
vips(comp=0) 6.2MB 66ms
vips(comp=1) 2.0MB 132ms <--- COMPARE
vips(comp=2) 2.0MB 153ms
I have put arrows next to the ones I would compare.
推荐阅读
- elasticsearch - 为某个字段创建具有搜索权限但没有读取权限的角色
- c# - 如何防止继承控件的组件出现在 Visual Studio 属性窗格中进行编辑?
- arrays - 一个包含 bash 中的子字符串的字符串 - 不工作
- swift - 如何在 Swift 中只隐藏键盘而不是 inputAccessoryView
- node.js - 如何使用 elemMatch
- c - 在 c 中搜索 char* 以查找 char* 数组的成员
- python - 如何读取带有 .zip 扩展名的 URL 并获取文件 .txt 并将其保存在目录中?
- python - ValueError:具有多个元素的数组的真值不明确。在 If 条件中使用相等时出错
- python - 是否可以从一个列表中复制一个项目并多次放入另一个列表中,然后单独修改每个项目?
- javascript - 如何在node.js中自动将图像从目录上传到axios