PaddleHub人像分割模型:AI人像摳圖及圖像合成


本項目根據DeepLabv3+模型一鍵摳圖示例,主要采用PaddleHub DeepLabv3+模型(deeplabv3p_xception65_humanseg)和python圖像處理庫opencv、PIL等完成。在最新作中,作者通過encoder-decoder進行多尺度信息的融合,同時保留了原來的空洞卷積和ASSP層, 其骨干網絡使用了Xception模型,提高了語義分割的健壯性和運行速率,在 PASCAL VOC 2012 dataset取得新的state-of-art performance,該PaddleHub Module使用百度自建數據集進行訓練,可用於人像分割,支持任意大小的圖片輸入。在完成一鍵摳圖之后,通過圖像合成,實現扣圖比賽任務。

PaddleHub 是基於 PaddlePaddle 開發的預訓練模型管理工具,可以借助預訓練模型更便捷地開展遷移學習工作,目前的預訓練模型涵蓋了圖像分類、目標檢測、詞法分析、語義模型、情感分析、視頻分類、圖像生成、圖像分割、文本審核、關鍵點檢測等主流模型。

PaddleHub官網:PaddleHub官網

PaddleHub項目地址:PaddleHub github

更多PaddleHub預訓練模型應用可見:教程合集課程

NOTE: 如果您在本地運行該項目示例,需要首先安裝PaddleHub。如果您在線運行,需要首先fork該項目示例。之后按照該示例操作即可。

一、安裝環境

!pip install paddlehub==1.6.0 -i https://pypi.tuna.tsinghua.edu.cn/simple
!hub install deeplabv3p_xception65_humanseg==1.0.0

二、開始P圖

1. 引入包

import matplotlib.pyplot as plt 
import matplotlib.image as mpimg 
from matplotlib import animation
import cv2
import paddlehub as hub
from PIL import Image, ImageSequence
from IPython.display import display, HTML
import numpy as np 
import imageio
import os
# 測試圖片路徑和輸出路徑
test_path = 'image/test/'
output_path = 'image/blend_out/'

# 待預測圖片
test_img_path = ["test.jpg"]
test_img_path = [test_path + img for img in test_img_path]
img = mpimg.imread(test_img_path[0]) 

# 展示待預測圖片
plt.figure(figsize=(10,10))
plt.imshow(img) 
plt.axis('off') 
plt.show()

2. 加載預訓練模型

通過加載PaddleHub DeepLabv3+模型(deeplabv3p_xception65_humanseg)實現一鍵摳圖

module = hub.Module(name="deeplabv3p_xception65_humanseg")
input_dict = {"image": test_img_path}

# execute predict and print the result
results = module.segmentation(data=input_dict)
for result in results:
    print(result)

# 預測結果展示
out_img_path = 'humanseg_output/' + os.path.basename(test_img_path[0]).split('.')[0] + '.png'
img = mpimg.imread(out_img_path)
plt.figure(figsize=(10,10))
plt.imshow(img) 
plt.axis('off') 
plt.show()
[2020-04-01 22:40:09,064] [    INFO] - Installing deeplabv3p_xception65_humanseg module
[2020-04-01 22:40:09,100] [    INFO] - Module deeplabv3p_xception65_humanseg already installed in /home/aistudio/.paddlehub/modules/deeplabv3p_xception65_humanseg
[2020-04-01 22:40:09,814] [    INFO] - 0 pretrained paramaters loaded by PaddleHub
{'origin': 'image/test/test.jpg', 'processed': 'humanseg_output/test.png'}

3. 圖像合成

# 合成函數
def blend_images(fore_image, base_image, output_path):
    """
    將摳出的人物圖像換背景
    fore_image: 前景圖片,摳出的人物圖片
    base_image: 背景圖片
    """
    # 讀入圖片
    base_image = Image.open(base_image).convert('RGB')
    fore_image = Image.open(fore_image).resize(base_image.size)

    # 圖片加權合成
    scope_map = np.array(fore_image)[:,:,-1] / 255
    scope_map = scope_map[:,:,np.newaxis]
    scope_map = np.repeat(scope_map, repeats=3, axis=2)
    res_image = np.multiply(scope_map, np.array(fore_image)[:,:,:3]) + np.multiply((1-scope_map), np.array(base_image))
    
    #保存圖片
    res_image = Image.fromarray(np.uint8(res_image))
    res_image.save(output_path)
output_path_img = output_path + 'blend_res_img.jpg'
blend_images('humanseg_output/test.png', 'image/test/bg.jpg', output_path_img)

# 展示合成圖片
plt.figure(figsize=(10,10))
img = mpimg.imread(output_path_img)
plt.imshow(img) 
plt.axis('off') 
plt.show()

output_path_img = output_path + 'blend_res_img2.jpg'
blend_images('humanseg_output/test.png', 'image/test/bg1.jpg', output_path_img)

# 展示合成圖片
plt.figure(figsize=(10,10))
img = mpimg.imread(output_path_img)
plt.imshow(img) 
plt.axis('off') 
plt.show()

# 完整流程來一張
test_img_path = ["xcd.jpg"]
test_img_path = [test_path + img for img in test_img_path]
img = mpimg.imread(test_img_path[0]) 

module = hub.Module(name="deeplabv3p_xception65_humanseg")
input_dict = {"image": test_img_path}

# execute predict and print the result
results = module.segmentation(data=input_dict)

output_path_img = output_path + 'blend_res_img2.jpg'
blend_images('humanseg_output/xcd.png', 'image/test/bg.jpg', output_path_img)

# 展示合成圖片
plt.figure(figsize=(10,10))
img = mpimg.imread(output_path_img)
plt.imshow(img) 
plt.axis('off') 
plt.show()
[2020-04-01 22:40:28,805] [    INFO] - Installing deeplabv3p_xception65_humanseg module
[2020-04-01 22:40:28,821] [    INFO] - Module deeplabv3p_xception65_humanseg already installed in /home/aistudio/.paddlehub/modules/deeplabv3p_xception65_humanseg
[2020-04-01 22:40:29,497] [    INFO] - 0 pretrained paramaters loaded by PaddleHub

三、GIF合成

GIF處理函數

def create_gif(gif_name, path, duration=0.3):
    '''
    生成gif文件,原始圖片僅支持png格式
    gif_name : 字符串,所生成的 gif 文件名,帶 .gif 后綴
    path :      需要合成為 gif 的圖片所在路徑
    duration :  gif 圖像時間間隔
    '''

    frames = []
    pngFiles = os.listdir(path)
    image_list = [os.path.join(path, f) for f in pngFiles]
    for image_name in image_list:
        frames.append(imageio.imread(image_name))
    # 保存為 gif
    imageio.mimsave(gif_name, frames, 'GIF', duration=duration)
    return

def split_gif(gif_name, output_path, resize=False):
    '''
    拆分gif文件,生成png格式,便於生成
    gif_name :  gif 文件路徑,帶 .gif 后綴
    path :      拆分圖片所在路徑
    '''
    gif_file = Image.open(gif_name)
    name = gif_name.split('/')[-1].split('.')[0]
    if not os.path.exists(output_path):                        # 判斷該文件夾是否存在,如果存在再創建則會報錯
        os.mkdir(output_path)

    for i, frame in enumerate(ImageSequence.Iterator(gif_file), 1):
        if resize:
            frame = frame.resize((300, 168), Image.ANTIALIAS)
        frame.save('%s/%s_%d.png' % (output_path, name, i))                       # 保存在等目錄的output文件夾下

def plot_sequence_images(image_array):
    ''' Display images sequence as an animation in jupyter notebook
    
    Args:
        image_array(numpy.ndarray): image_array.shape equal to (num_images, height, width, num_channels)
    '''
    dpi = 72.0
    xpixels, ypixels = image_array[0].shape[:2]
    fig = plt.figure(figsize=(ypixels/dpi, xpixels/dpi), dpi=dpi)
    im = plt.figimage(image_array[0])

    def animate(i):
        im.set_array(image_array[i])
        return (im,)

    anim = animation.FuncAnimation(fig, animate, frames=len(image_array), interval=500, repeat_delay=1, repeat=True)
    display(HTML(anim.to_html5_video()))

1. 拆分GIF

# 拆GIF文件為png幀
split_gif('image/test_gif/wushu.gif', 'image/test_gif/wushu_frame', True)

imgs = []
for i, fname in enumerate(os.listdir('image/test_gif/wushu_frame')): 
    img = cv2.imread('image/test_gif/wushu_frame/' + fname)
    img_rgb = cv2.cvtColor(img, cv2.COLOR_BGR2RGB) 
    imgs.append(img_rgb)
plot_sequence_images(imgs)

# 測試圖片路徑和輸出路徑
test_path = 'image/test_gif/wushu_frame/'
output_path = 'image/blend_out/'

# 待預測圖片
test_img_path = os.listdir(test_path)
test_img_path = [test_path + i for i in test_img_path]
img = mpimg.imread(test_img_path[0]) 
 
# 展示待預測圖片
plt.figure(figsize=(10,10))
plt.imshow(img) 
plt.axis('off') 
plt.show()

2. 預測分割

input_dict = {"image": test_img_path}

# execute predict and print the result
results = module.segmentation(data=input_dict)


# 預測結果展示
out_img_path = 'humanseg_output/' + os.path.basename(test_img_path[0]).split('.')[0] + '.png'
img = mpimg.imread(out_img_path)
plt.figure(figsize=(10,10))
plt.imshow(img) 
plt.axis('off') 
plt.show()

3. 合成結果

# 合成圖片
humanseg_wushu = [filename for filename in os.listdir('humanseg_output/') if filename.startswith("wushu")]

for i, img in enumerate(humanseg_wushu):
    img_path = os.path.join('humanseg_output/wushu_%d.png' % (i+1))
    output_path_img = output_path + 'wushu/%d.png' % i
    blend_images(img_path, 'image/test/bg1.jpg', output_path_img)

# 合成GIF
create_gif('image/blend_out/blend_res_wushu.gif', 'image/blend_out/wushu/', duration=0.5)

imgs = []
for i, fname in enumerate(os.listdir('image/blend_out/wushu/')): 
    img = cv2.imread('image/blend_out/wushu/' + fname)
    img_rgb = cv2.cvtColor(img, cv2.COLOR_BGR2RGB) 
    imgs.append(img_rgb)
plot_sequence_images(imgs)

四、視頻合成

# 拆視頻
cap = cv2.VideoCapture('image/video/input.mp4')

imgs = []
num = 0
while(True):
    ret,frame = cap.read() 
    if ret:
        cv2.imwrite('image/video/frame/%d.jpg'%num, frame)
        # img_rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB) 
        # imgs.append(img_rgb)
        num += 1
    else:
        break
cap.release()#關閉相機


# plot_sequence_images(imgs)
# 顯示一張
out_img_path = 'image/video/frame/1.jpg'
img = mpimg.imread(out_img_path)
plt.figure(figsize=(10,10))
plt.imshow(img) 
plt.axis('off') 
plt.show()


frame_path = 'image/video/frame'
test_img_path = [os.path.join(frame_path, fname) for fname in os.listdir(frame_path)]
input_dict = {"image": test_img_path}

# execute predict and print the result
results = module.segmentation(data=input_dict, output_dir='image/video/frame_seg/')
# plot_sequence_images(imgs)
# 顯示一張
out_img_path = 'image/video/frame_seg/1.png'
img = mpimg.imread(out_img_path)
plt.figure(figsize=(10,10))
plt.imshow(img) 
plt.axis('off') 
plt.show()

# 合並輸出視頻
humanseg_wushu = [filename for filename in os.listdir('image/video/frame_seg/')]
for i, img in enumerate(humanseg_wushu):
    if i <= 145 or (i >= 250 and i <= 427) or (i >= 552 and i <= 601) or (i >= 729 and i <= 761):
        img_path = os.path.join('image/video/frame_seg/%d.png' % (i+1))
        output_path_img = output_path + 'video/%d.png' % i
        img = blend_images(img_path, 'image/test/bg2.jpg', output_path_img)
    if (i >= 146 and i <= 249) or (i >= 428 and i<= 551) or (i >= 602 and i<= 728):
        img_path = os.path.join('image/video/frame_seg/%d.png' % (i+1))
        output_path_img = output_path + 'video/%d.png' % i
        img = blend_images(img_path, 'image/test/bg3.jpg', output_path_img)
fourcc = cv2.VideoWriter_fourcc(*'XVID')
out = cv2.VideoWriter('output.avi',fourcc, 25.0, (1280,720))
files = os.listdir('image/blend_out/video')
for i in range(len(files)):
    img = cv2.imread('image/blend_out/video/%d.png' % i)
    img = cv2.resize(img, (1280,720))
    out.write(img)#保存幀
out.release()

項目地址:
PaddleHub創意賽:AI人像摳圖及圖像合成


視頻地址:

慶余年摳圖


免責聲明!

本站轉載的文章為個人學習借鑒使用,本站對版權不負任何法律責任。如果侵犯了您的隱私權益,請聯系本站郵箱yoyou2525@163.com刪除。



 
粵ICP備18138465號   © 2018-2025 CODEPRJ.COM