Embedded_game/TrafficSign/生成2.py
2025-01-02 12:48:11 +08:00

95 lines
3.4 KiB
Python

# -*- coding:utf-8 -*-
# @Author len
# @Create 2023/12/25 14:55
import cv2
import numpy as np
import random
import os
def coordinates2yolo(xmin,ymin,xmax,ymax):
img_w, img_h = 800, 480
# 保留6位小数
x = round((xmin+xmax)/(2.0*img_w),6)
y = round((ymin+ymax)/(2.0*img_h),6)
w1 = round((xmax-xmin)/(1.0*img_w),6)
h1 = round((ymax-ymin)/(1.0*img_h),6)
# print( x,y,w1,h1)
return x,y,w1,h1
def process_image(bg_path, logo_path, output_path):
background = cv2.imread(bg_path)
logo = cv2.imread(logo_path, -1) # -1 表示尝试读取透明度通道
flag = logo_path.split('\\')[-1][0]
if logo is None or background is None:
print(f"无法读取图像,跳过 {bg_path}{logo_path}")
return
# 检查标志图像是否有透明度通道
if logo.shape[2] == 4:
alpha_channel = logo[:, :, 3]
else:
alpha_channel = np.ones(logo.shape[:2], dtype=logo.dtype) * 255
# 确保标志图像小于背景图像
if logo.shape[1] > background.shape[1] or logo.shape[0] > background.shape[0]:
scale_factor = min(background.shape[1] / logo.shape[1], background.shape[0] / logo.shape[0]) * 0.9
else:
scale_factor = random.uniform(0.5, 1.5)
width = int(logo.shape[1] * scale_factor)#图像长宽
height = int(logo.shape[0] * scale_factor)
logo = cv2.resize(logo, (width, height))
alpha_channel = cv2.resize(alpha_channel, (width, height))
# 确保随机位置的计算是有效的
x_offset = random.randint(0, max(0, background.shape[1] - width))
y_offset = random.randint(0, max(0, background.shape[0] - height))
# 计算标志图片的右下角坐标
x_end = x_offset + width+random.randint(0, 5)
y_end = y_offset + height+random.randint(0, 5)
result1 = coordinates2yolo(x_offset-random.randint(0, 5), y_offset-random.randint(0, 5), x_end, y_end)
result = (flag + " " + str(result1[0]) + " " + str(result1[1]) + " " + str(result1[2]) + " " + str(result1[3]))
path_txt = output_path.split('.')[0] + '.txt'
# print(result)
# return
with open(path_txt, 'w') as f:
f.write(result)
# 合成图像
for c in range(0, 3):
background[y_offset:y_offset+height, x_offset:x_offset+width, c] = \
logo[:, :, c] * (alpha_channel / 255.0) + \
background[y_offset:y_offset+height, x_offset:x_offset+width, c] * (1.0 - alpha_channel / 255.0)
# 保存结果到文件
cv2.imwrite(output_path, background)
# 文件夹路径
backgrounds_path = r'D:\1225\back' # 替换为你的背景图片文件夹路径
logos_path = r'D:\1225\sign' # 替换为你的标志图片文件夹路径
output_path = r'D:\1225\add' # 替换为你的输出文件夹路径
# 确保输出路径存在
if not os.path.exists(output_path):
os.makedirs(output_path)
backgrounds = [f for f in os.listdir(backgrounds_path) if f.endswith(('.png', '.jpg', '.jpeg'))]
logos = [f for f in os.listdir(logos_path) if f.endswith(('.png', '.jpg', '.jpeg'))]
# 为每个背景图片和每个标志图片组合
for bg_file in backgrounds:
for logo_file in logos:
for i in range(8,10):
bg_full_path = os.path.join(backgrounds_path, bg_file)
logo_full_path = os.path.join(logos_path, logo_file)
output_full_path = os.path.join(output_path, f'combined{i}_{bg_file[:-4]}_{logo_file}')
process_image(bg_full_path, logo_full_path, output_full_path)
print("批量处理完成!")