Spaces:

MohmedAnik
/

ObjectOrientmodel

Sleeping

App Files Files Community

MohmedAnik commited on 25 days ago

Commit

21d3dc9

verified ·

1 Parent(s): b2b6cf0

Update utils.py

Browse files

Files changed (1) hide show

utils.py +31 -51

utils.py CHANGED Viewed

@@ -21,9 +21,8 @@ def resize_foreground(
         alpha[1].min(),
         alpha[1].max(),
     )
-    # crop the foreground
     fg = image[y1:y2, x1:x2]
-    # pad to square
     size = max(fg.shape[0], fg.shape[1])
     ph0, pw0 = (size - fg.shape[0]) // 2, (size - fg.shape[1]) // 2
     ph1, pw1 = size - fg.shape[0] - ph0, size - fg.shape[1] - pw0
@@ -34,9 +33,9 @@ def resize_foreground(
         constant_values=((0, 0), (0, 0), (0, 0)),
     )
-    # compute padding according to the ratio
     new_size = int(new_image.shape[0] / ratio)
-    # pad to size, double side
     ph0, pw0 = (new_size - size) // 2, (new_size - size) // 2
     ph1, pw1 = new_size - size - ph0, new_size - size - pw0
     new_image = np.pad(
@@ -62,25 +61,21 @@ def remove_background(image: Image,
     return image
 def random_crop(image, crop_scale=(0.8, 0.95)):
-    """
-    随机裁切图片
-        image (numpy.ndarray):  (H, W, C)。
-        crop_scale (tuple): (min_scale, max_scale)。
-    """
-    assert isinstance(image, Image.Image), "iput must be PIL.Image.Image"
     assert len(crop_scale) == 2 and 0 < crop_scale[0] <= crop_scale[1] <= 1
     width, height = image.size
-    # 计算裁切的高度和宽度
     crop_width = random.randint(int(width * crop_scale[0]), int(width * crop_scale[1]))
     crop_height = random.randint(int(height * crop_scale[0]), int(height * crop_scale[1]))
-    # 随机选择裁切的起始点
     left = random.randint(0, width - crop_width)
     top = random.randint(0, height - crop_height)
-    # 裁切图片
     cropped_image = image.crop((left, top, left + crop_width, top + crop_height))
     return cropped_image
@@ -102,7 +97,7 @@ def background_preprocess(input_image, do_remove_background):
     return input_image
 def remove_outliers_and_average(tensor, threshold=1.5):
-    assert tensor.dim() == 1, "dimension of input Tensor must equal to 1"
     q1 = torch.quantile(tensor, 0.25)
     q3 = torch.quantile(tensor, 0.75)
@@ -120,37 +115,32 @@ def remove_outliers_and_average(tensor, threshold=1.5):
 def remove_outliers_and_average_circular(tensor, threshold=1.5):
-    assert tensor.dim() == 1, "dimension of input Tensor must equal to 1"
-    # 将角度转换为二维平面上的点
     radians = tensor * torch.pi / 180.0
     x_coords = torch.cos(radians)
     y_coords = torch.sin(radians)
-    # 计算平均向量
     mean_x = torch.mean(x_coords)
     mean_y = torch.mean(y_coords)
     differences = torch.sqrt((x_coords - mean_x) * (x_coords - mean_x) + (y_coords - mean_y) * (y_coords - mean_y))
-    # 计算四分位数和 IQR
     q1 = torch.quantile(differences, 0.25)
     q3 = torch.quantile(differences, 0.75)
     iqr = q3 - q1
-    # 计算上下限
     lower_bound = q1 - threshold * iqr
     upper_bound = q3 + threshold * iqr
-    # 筛选非离群点
     non_outliers = tensor[(differences >= lower_bound) & (differences <= upper_bound)]
     if len(non_outliers) == 0:
         mean_angle = torch.atan2(mean_y, mean_x) * 180.0 / torch.pi
         mean_angle = (mean_angle + 360) % 360
-        return mean_angle  # 如果没有非离群点，返回 None
-    # 对非离群点再次计算平均向量
     radians = non_outliers * torch.pi / 180.0
     x_coords = torch.cos(radians)
     y_coords = torch.sin(radians)
@@ -181,7 +171,7 @@ def get_proj2D_XYZ(phi, theta, gamma):
     z = scale(z)
     return x, y, z
-# 绘制3D坐标轴
 def draw_axis(ax, origin, vector, color, label=None):
     ax.quiver(origin[0], origin[1], vector[0], vector[1], angles='xy', scale_units='xy', scale=1, color=color)
     if label!=None:
@@ -190,7 +180,7 @@ def draw_axis(ax, origin, vector, color, label=None):
 def matplotlib_2D_arrow(angles, rm_bkg_img):
     fig, ax = plt.subplots(figsize=(8, 8))
-    # 设置旋转角度
     phi   = np.radians(angles[0])
     theta = np.radians(angles[1])
     gamma = np.radians(-1*angles[2])
@@ -204,10 +194,10 @@ def matplotlib_2D_arrow(angles, rm_bkg_img):
     origin = np.array([0, 0])
-    # 旋转后的向量
     rot_x, rot_y, rot_z = get_proj2D_XYZ(phi, theta, gamma)
-    # draw arrow
     arrow_attr = [{'point':rot_x, 'color':'r', 'label':'front'},
                   {'point':rot_y, 'color':'g', 'label':'right'},
                   {'point':rot_z, 'color':'b', 'label':'top'}]
@@ -221,15 +211,13 @@ def matplotlib_2D_arrow(angles, rm_bkg_img):
     for i in range(3):
         draw_axis(ax, origin, arrow_attr[order[i]]['point'], arrow_attr[order[i]]['color'], arrow_attr[order[i]]['label'])
-        # draw_axis(ax, origin, rot_y, 'g', label='right')
-        # draw_axis(ax, origin, rot_z, 'b', label='top')
-        # draw_axis(ax, origin, rot_x, 'r', label='front')
-    # 关闭坐标轴和网格
     ax.set_axis_off()
     ax.grid(False)
-    # 设置坐标范围
     ax.set_xlim(-5, 5)
     ax.set_ylim(-5, 5)
@@ -245,11 +233,10 @@ import math
 axis_model = Model("./axis.obj", texture_filename="./axis.png")
 def render_3D_axis(phi, theta, gamma):
     radius = 240
-    # camera_location = [radius * math.cos(phi), radius * math.sin(phi), radius * math.tan(theta)]
-    # print(camera_location)
     camera_location = [-1*radius * math.cos(phi), -1*radius * math.tan(theta), radius * math.sin(phi)]
     img = render(
-        # Model("res/jinx.obj", texture_filename="res/jinx.tga"),
         axis_model,
         height=512,
         width=512,
@@ -260,44 +247,37 @@ def render_3D_axis(phi, theta, gamma):
     return img
 def overlay_images_with_scaling(center_image: Image.Image, background_image, target_size=(512, 512)):
-    """
-    调整前景图像大小为 512x512，将背景图像缩放以适配，并中心对齐叠加
-    :param center_image: 前景图像
-    :param background_image: 背景图像
-    :param target_size: 前景图像的目标大小，默认 (512, 512)
-    :return: 叠加后的图像
-    """
-    # 确保输入图像为 RGBA 模式
     if center_image.mode != "RGBA":
         center_image = center_image.convert("RGBA")
     if background_image.mode != "RGBA":
         background_image = background_image.convert("RGBA")
-    # 调整前景图像大小
     center_image = center_image.resize(target_size)
-    # 缩放背景图像，确保其适合前景图像的尺寸
     bg_width, bg_height = background_image.size
-    # 按宽度或高度等比例缩放背景
     scale = target_size[0] / max(bg_width, bg_height)
     new_width = int(bg_width * scale)
     new_height = int(bg_height * scale)
     resized_background = background_image.resize((new_width, new_height))
-    # 计算需要的填充量
     pad_width = target_size[0] - new_width
     pad_height = target_size[0] - new_height
-    # 计算上下左右的 padding
     left = pad_width // 2
     right = pad_width - left
     top = pad_height // 2
     bottom = pad_height - top
-    # 添加 padding
     resized_background = ImageOps.expand(resized_background, border=(left, top, right, bottom), fill=(255,255,255,255))
-    # 将前景图像叠加到背景图像上
     result = resized_background.copy()
     result.paste(center_image, (0, 0), mask=center_image)

         alpha[1].min(),
         alpha[1].max(),
     )
     fg = image[y1:y2, x1:x2]
     size = max(fg.shape[0], fg.shape[1])
     ph0, pw0 = (size - fg.shape[0]) // 2, (size - fg.shape[1]) // 2
     ph1, pw1 = size - fg.shape[0] - ph0, size - fg.shape[1] - pw0
         constant_values=((0, 0), (0, 0), (0, 0)),
     )
     new_size = int(new_image.shape[0] / ratio)
     ph0, pw0 = (new_size - size) // 2, (new_size - size) // 2
     ph1, pw1 = new_size - size - ph0, new_size - size - pw0
     new_image = np.pad(
     return image
 def random_crop(image, crop_scale=(0.8, 0.95)):
+    assert isinstance(image, Image.Image),
     assert len(crop_scale) == 2 and 0 < crop_scale[0] <= crop_scale[1] <= 1
     width, height = image.size
     crop_width = random.randint(int(width * crop_scale[0]), int(width * crop_scale[1]))
     crop_height = random.randint(int(height * crop_scale[0]), int(height * crop_scale[1]))
     left = random.randint(0, width - crop_width)
     top = random.randint(0, height - crop_height)
     cropped_image = image.crop((left, top, left + crop_width, top + crop_height))
     return cropped_image
     return input_image
 def remove_outliers_and_average(tensor, threshold=1.5):
+    assert tensor.dim() == 1,
     q1 = torch.quantile(tensor, 0.25)
     q3 = torch.quantile(tensor, 0.75)
 def remove_outliers_and_average_circular(tensor, threshold=1.5):
+    assert tensor.dim() == 1,
     radians = tensor * torch.pi / 180.0
     x_coords = torch.cos(radians)
     y_coords = torch.sin(radians)
     mean_x = torch.mean(x_coords)
     mean_y = torch.mean(y_coords)
     differences = torch.sqrt((x_coords - mean_x) * (x_coords - mean_x) + (y_coords - mean_y) * (y_coords - mean_y))
     q1 = torch.quantile(differences, 0.25)
     q3 = torch.quantile(differences, 0.75)
     iqr = q3 - q1
     lower_bound = q1 - threshold * iqr
     upper_bound = q3 + threshold * iqr
     non_outliers = tensor[(differences >= lower_bound) & (differences <= upper_bound)]
     if len(non_outliers) == 0:
         mean_angle = torch.atan2(mean_y, mean_x) * 180.0 / torch.pi
         mean_angle = (mean_angle + 360) % 360
+        return mean_angle
     radians = non_outliers * torch.pi / 180.0
     x_coords = torch.cos(radians)
     y_coords = torch.sin(radians)
     z = scale(z)
     return x, y, z
 def draw_axis(ax, origin, vector, color, label=None):
     ax.quiver(origin[0], origin[1], vector[0], vector[1], angles='xy', scale_units='xy', scale=1, color=color)
     if label!=None:
 def matplotlib_2D_arrow(angles, rm_bkg_img):
     fig, ax = plt.subplots(figsize=(8, 8))
     phi   = np.radians(angles[0])
     theta = np.radians(angles[1])
     gamma = np.radians(-1*angles[2])
     origin = np.array([0, 0])
     rot_x, rot_y, rot_z = get_proj2D_XYZ(phi, theta, gamma)
     arrow_attr = [{'point':rot_x, 'color':'r', 'label':'front'},
                   {'point':rot_y, 'color':'g', 'label':'right'},
                   {'point':rot_z, 'color':'b', 'label':'top'}]
     for i in range(3):
         draw_axis(ax, origin, arrow_attr[order[i]]['point'], arrow_attr[order[i]]['color'], arrow_attr[order[i]]['label'])
     ax.set_axis_off()
     ax.grid(False)
     ax.set_xlim(-5, 5)
     ax.set_ylim(-5, 5)
 axis_model = Model("./axis.obj", texture_filename="./axis.png")
 def render_3D_axis(phi, theta, gamma):
     radius = 240
     camera_location = [-1*radius * math.cos(phi), -1*radius * math.tan(theta), radius * math.sin(phi)]
     img = render(
         axis_model,
         height=512,
         width=512,
     return img
 def overlay_images_with_scaling(center_image: Image.Image, background_image, target_size=(512, 512)):
     if center_image.mode != "RGBA":
         center_image = center_image.convert("RGBA")
     if background_image.mode != "RGBA":
         background_image = background_image.convert("RGBA")
     center_image = center_image.resize(target_size)
     bg_width, bg_height = background_image.size
     scale = target_size[0] / max(bg_width, bg_height)
     new_width = int(bg_width * scale)
     new_height = int(bg_height * scale)
     resized_background = background_image.resize((new_width, new_height))
     pad_width = target_size[0] - new_width
     pad_height = target_size[0] - new_height
     left = pad_width // 2
     right = pad_width - left
     top = pad_height // 2
     bottom = pad_height - top
     resized_background = ImageOps.expand(resized_background, border=(left, top, right, bottom), fill=(255,255,255,255))
     result = resized_background.copy()
     result.paste(center_image, (0, 0), mask=center_image)