图像扩展同比例缩小，补成正方形，补黑

🕗 发布于 2025-01-18 21:16 python 深度学习 numpy

/mnt/pfs/users/lbg/project/4dhuman/multi-hmr/utils/vitdet_dataset.py

def rotate_2d(pt_2d: np.array, rot_rad: float) -> np.array:
    """
    Apply a rotation about the origin to a point in the x-y plane.
    Args:
        pt_2d (np.array): Point to rotate; elements 0 and 1 are read as x and y.
        rot_rad (float): Rotation angle in radians.
    Returns:
        np.array: The rotated point as a float32 array of shape (2,).
    """
    cos_a = np.cos(rot_rad)
    sin_a = np.sin(rot_rad)
    px, py = pt_2d[0], pt_2d[1]
    # Standard 2D rotation: [x', y'] = [x*cos - y*sin, x*sin + y*cos].
    rotated = (px * cos_a - py * sin_a, px * sin_a + py * cos_a)
    return np.array(rotated, dtype=np.float32)

def gen_trans_from_patch_cv(c_x: float, c_y: float,
                            src_width: float, src_height: float,
                            dst_width: float, dst_height: float,
                            scale: float, rot: float) -> np.array:
    """
    Build the affine transform that maps a (scaled, rotated) bounding box onto the output patch.

    The transform is defined by three point correspondences: the box center,
    the midpoint of its bottom edge and the midpoint of its right edge are
    mapped to the same three points of the destination rectangle.
    Args:
        c_x (float): Bounding box center x coordinate in the original image.
        c_y (float): Bounding box center y coordinate in the original image.
        src_width (float): Bounding box width.
        src_height (float): Bounding box height.
        dst_width (float): Output box width.
        dst_height (float): Output box height.
        scale (float): Multiplier applied to the bounding box size (augmentation).
        rot (float): Rotation of the box, in degrees (converted to radians internally).
    Returns:
        trans (np.array): Affine matrix as returned by cv2.getAffineTransform.
    """
    angle_rad = np.pi * rot / 180

    # Source side: center plus the rotated half-height / half-width offsets
    # of the box after the scale augmentation.
    half_h_src = src_height * scale * 0.5
    half_w_src = src_width * scale * 0.5
    down_src = rotate_2d(np.array([0, half_h_src], dtype=np.float32), angle_rad)
    right_src = rotate_2d(np.array([half_w_src, 0], dtype=np.float32), angle_rad)
    center_src = np.zeros(2)
    center_src[0], center_src[1] = c_x, c_y
    src_pts = np.stack(
        [center_src, center_src + down_src, center_src + right_src]
    ).astype(np.float32)

    # Destination side: the same three landmarks of the axis-aligned output box.
    half_w_dst = dst_width * 0.5
    half_h_dst = dst_height * 0.5
    center_dst = np.array([half_w_dst, half_h_dst], dtype=np.float32)
    down_dst = np.array([0, half_h_dst], dtype=np.float32)
    right_dst = np.array([half_w_dst, 0], dtype=np.float32)
    dst_pts = np.stack([center_dst, center_dst + down_dst, center_dst + right_dst])

    return cv2.getAffineTransform(src_pts, dst_pts)


def generate_image_patch_cv2(img: np.array, c_x: float, c_y: float,
                             bb_width: float, bb_height: float,
                             patch_width: float, patch_height: float,
                             do_flip: bool, scale: float, rot: float,
                             border_mode=cv2.BORDER_CONSTANT, border_value=0) -> Tuple[np.array, np.array]:
    """
    Crop the input image and return the crop and the corresponding transformation matrix.

    The bounding box is warped onto a patch of size (patch_width, patch_height)
    with cv2.warpAffine; pixels that fall outside the source image are filled
    according to border_mode / border_value (constant 0 by default).
    Args:
        img (np.array): Input image of shape (H, W, C); must be 3-dimensional.
        c_x (float): Bounding box center x coordinate in the original image.
        c_y (float): Bounding box center y coordinate in the original image.
        bb_width (float): Bounding box width.
        bb_height (float): Bounding box height.
        patch_width (float): Output box width (truncated to int for the warp).
        patch_height (float): Output box height (truncated to int for the warp).
        do_flip (bool): Whether to mirror the image horizontally before cropping.
        scale (float): Rescaling factor for the bounding box (augmentation).
        rot (float): Random rotation applied to the box.
        border_mode: OpenCV border mode used for out-of-image pixels.
        border_value: Fill value used when border_mode is cv2.BORDER_CONSTANT.
    Returns:
        img_patch (np.array): Cropped image patch of shape (patch_height, patch_width, C).
        trans (np.array): Transformation matrix.
    """
    _, img_width, _ = img.shape
    if do_flip:
        # Mirror the image and move the box center to its mirrored position.
        img = img[:, ::-1, :]
        c_x = img_width - c_x - 1

    trans = gen_trans_from_patch_cv(c_x, c_y, bb_width, bb_height, patch_width, patch_height, scale, rot)

    # OpenCV expects the output size as (width, height).
    out_size = (int(patch_width), int(patch_height))
    img_patch = cv2.warpAffine(img, trans, out_size,
                               flags=cv2.INTER_LINEAR,
                               borderMode=border_mode,
                               borderValue=border_value)

    # Force borderMode=cv2.BORDER_CONSTANT for the alpha channel so that
    # padded regions are not filled by the non-constant border mode.
    if (img.shape[2] == 4) and (border_mode != cv2.BORDER_CONSTANT):
        img_patch[:, :, 3] = cv2.warpAffine(img[:, :, 3], trans, out_size,
                                            flags=cv2.INTER_LINEAR,
                                            borderMode=cv2.BORDER_CONSTANT)

    return img_patch, trans

原文地址：https://blog.csdn.net/jacke121/article/details/145216151

免责声明：本站文章内容转载自网络资源，如本站内容侵犯了原著者的合法权益，可联系本站删除。更多内容请关注自学内容网（zxcms.com）！

上一篇：为AI聊天工具添加一个知识系统之46 蒙板程序设计（第一版）：Facet六边形【意识形态：操纵】
下一篇：HTB：Access[WriteUP]

蓝桥杯3527阶乘的和 | 组合数学
这个题目的思路是对A~i~排序后，记录每个A~i~出现的次数dic[A~i~]。显然最小的A~0~满足m。每次遍历dic，如果m对应的A~i~出现的次数是A~i+1~的倍数，那么将其并入dic[A~i
阅读更多2025-01-19
三维扫描赋能文化：蔡司3D扫描仪让木质文化遗产焕发新生-沪敖3D
挪威文化历史博物馆在其修复工作中融入现代3D扫描技术，让数百年的历史焕发新生。
阅读更多2025-01-19
springboot基于微信小程序的停车场预订系统
Spring Boot 基于微信小程序的停车场预订系统在城市交通日益拥堵，停车难问题愈发凸显的当下，Spring Boot 基于微信小程序的停车场预订系统为车主们提供了便捷高效的停车解决方案，让出行停
阅读更多2025-01-19
2.用户登录流程
若依用户登录流程，能跟代码跟代码，跟不了代码背下来，流程相对固定
阅读更多2025-01-19
SparkSQL数据源与数据存储综合实践
在本次实战中，我们通过`SparkSQLDataSource`项目深入学习了如何使用Spark SQL加载和保存不同格式的数据。首先，我们查看了JSON、CSV和TXT格式的数据集，并通过`DataL
阅读更多2025-01-19
Hexo + NexT + Github搭建个人博客
先创建一个页面cd[your-site]#进到站点中hexonewpage[page-name]#创建页面在文件开头的YAML块（用于写入配置）中添加配置通过主题的配置文件将你所创建的页面路由写入菜单
阅读更多2025-01-19
Linux使用SSH连接GitHub指南
GitHub SSH密钥配置是一个重要的安全认证步骤。首先需要在本地终端通过ssh-keygen命令生成SSH密钥对，包含私钥和公钥两个文件。生成时可以设置密码短语进行额外保护。获得密钥后，需要将公钥
阅读更多2025-01-19
案例分析一
没几天入职后，去向技术副主管领任务，随便给了个任务并指派两个帮手（自己去联系）组成小组，顺口还提醒下“甲水平不行，乙还可以”（在以后工作中，发现甲的水平不是一般的好），然后就是开干。”，他头也没抬说了
阅读更多2025-01-19
在21世纪的我用C语言探寻世界本质——字符函数和字符串函数(2)
（9）现在我们就来看进行一次匹配的过程，也很简单，我们还是创建一个while循环，如果s1和s2解引用不是，并且解引用后相等，那我们就让s1和s2加加，一直往后走，当循环结束时，我们就判断s2解引用
阅读更多2025-01-19
tlias部门管理-新增部门-接口开发
tlias部门管理-新增部门-接口开发
阅读更多2025-01-19

图像扩展 同比例缩小，补成正方形，补黑

相关文章

图像扩展同比例缩小，补成正方形，补黑