[SAM to OBB] Generate Point coord Tool

Development/SAM

[SAM to OBB] Generate Point coord Tool

吳鍾振 2024. 11. 10. 16:57

https://jjoh4803.tistory.com/64

SAM2 (Segment Anything Model 2)에서 포인트를 이용한 세그멘테이션

https://jjoh4803.tistory.com/62 — SAM (OBB) 객체 추출: 항공 뷰 이미지 차량 객체 추출 방법론. 1. 배경 및 목적: 항공 이미지에서 특정 객체(이 경우 차량)를 정확하게 식별하고 추출하는 것은 도시 계획, 교통 …

jjoh4803.tistory.com

SAM2의 SAM2ImagePredictor에 입력할 Point 좌표를 생성하기 위한 이미지 어노테이션(annotation) 도구.

1. 이미지 열람 및 탐색
- A/D 키로 이전/다음 이미지로 이동
- 폴더 내의 이미지들을 순차적으로 탐색 가능

2. 어노테이션 기능
- 마우스 클릭으로 점 찍기
- 점들을 연결하여 객체 표시
- 4점 폴리곤 생성 기능 ('O' 키)
- 생성된 점들은 JSON 파일로 저장 ('S' 키)

3. 편집 기능
- 'E' 키로 지우기 모드 전환
- 'C' 키로 모든 박스 지우기
- 이전에 저장된 어노테이션 불러오기

주요 단축키:
- A/D: 이전/다음 이미지
- S: 저장
- P: 현재 포인트 목록 출력
- E: 지우기 모드
- C: 초기화
- O: 폴리곤 모드
- Q/ESC: 종료

import os
import cv2
import json
import argparse
import numpy as np

from glob import glob
from PySide6.QtCore import QSettings

# Persistent store for the (1-based) index written by save_point(), so that a
# later run started with --go can resume from the last saved image.
setting = QSettings("test", "test")
print(f"마지막으로 저장한 Index: {setting.value('CurrentIndex')}")

parser = argparse.ArgumentParser()
# -g/--go: start at the image recorded by the most recent save instead of the first one.
parser.add_argument("-g", "--go", dest="go", action="store_true")
args = parser.parse_args()

# --- State shared between the mouse callback and the key loop ---
drawing = False        # set on left-button down, cleared on left-button up (point mode)
ix, iy = -1, -1        # position of the most recent left-button press
ex, ey = -1, -1        # not referenced by the code visible in this file
img_copy = None        # copy of the displayed image taken on load / button press
if args.go:
    # The stored value is missing on a first run and may come back as a string
    # depending on the settings backend, so request an int with a default of 1
    # (which maps to the first image) instead of subtracting from None/str.
    saved_index = setting.value("CurrentIndex", 1, type=int)
    current_img_index = max(saved_index - 1, 0)
else:
    current_img_index = 0
point_list = []        # completed point groups for the current image
polygon_points = []    # vertices clicked so far in polygon mode
object_point = []      # clicks collected for the group currently being built
erase_mode = False
polygon_mode = False


def distance(pt1, pt2):
    """Return the Euclidean distance between two 2-D points.

    Only items 0 (x) and 1 (y) of each argument are read.
    """
    delta_x = pt1[0] - pt2[0]
    delta_y = pt1[1] - pt2[1]
    return np.sqrt(delta_x ** 2 + delta_y ** 2)


def point_line_distance(pt: tuple, line_start: list, line_end: list):
    """Return the distance from ``pt`` to the segment ``line_start``-``line_end``.

    A segment shorter than 0.000001 is treated as a single point. When the
    projection parameter of ``pt`` onto the segment is below 0.00001 or above 1,
    the distance to the nearer endpoint is returned; otherwise the distance to
    the projected point on the segment is returned.
    """
    segment_length = distance(line_start, line_end)
    if segment_length < 0.000001:
        return distance(pt, line_start)

    # Position of the projection along the segment (0 at line_start, 1 at line_end).
    t = ((pt[0] - line_start[0]) * (line_end[0] - line_start[0]) +
         (pt[1] - line_start[1]) * (line_end[1] - line_start[1])) / (segment_length ** 2)

    if t < 0.00001 or t > 1:
        to_start = distance(pt, line_start)
        to_end = distance(pt, line_end)
        return min(to_start, to_end)

    foot = (line_start[0] + t * (line_end[0] - line_start[0]),
            line_start[1] + t * (line_end[1] - line_start[1]))
    return distance(pt, foot)


def draw_point(event, x, y, flags, param):
    """Mouse callback for the 'image' window; behaviour depends on the active mode.

    Polygon mode (``polygon_mode``): every left click adds a vertex and draws
    it. After the fourth vertex the outline is closed, the vertices are printed
    as ``[0, x1, y1, ..., x4, y4]`` with coordinates divided by the image width
    and height (rounded to 6 decimals), and the vertex list is emptied so the
    next click starts a new polygon.

    Erase mode (``erase_mode``): a left click prints every stored point group
    that has a point within 8 pixels of the click.
    NOTE: nothing is removed from ``point_list`` here; the mode only reports.

    Point mode (default): the press position of each click is collected in
    ``object_point``; whenever it holds an even number of entries it is moved
    into ``point_list`` as one group.

    Args:
        event: OpenCV mouse event code.
        x: Cursor x position in image pixels.
        y: Cursor y position in image pixels.
        flags: Unused.
        param: Unused.
    """
    global ix, iy, drawing, img_copy, point_list, object_point

    if polygon_mode:
        if event != cv2.EVENT_LBUTTONDOWN:
            return

        polygon_points.append([x, y])
        cv2.circle(img, (x, y), 1, (0, 255, 0), 2)

        # Re-draw every edge so the outline is complete even if the image was
        # reloaded between clicks.
        for start, end in zip(polygon_points, polygon_points[1:]):
            cv2.line(img, tuple(start), tuple(end), (0, 255, 0), 1)

        if len(polygon_points) == 4:
            cv2.line(img, tuple(polygon_points[-1]), tuple(polygon_points[0]), (0, 255, 0), 1)
            height, width = img.shape[:2]
            # Leading 0 is kept from the original output format
            # (presumably a class id -- confirm against the label consumer).
            normalized_points = [0]
            # Distinct names: do not overwrite the callback's x / y arguments.
            for vertex_x, vertex_y in polygon_points:
                normalized_points.extend(
                    [round(vertex_x / width, 6), round(vertex_y / height, 6)]
                )
            print(normalized_points)
            # Start fresh; otherwise a fifth click would extend the finished
            # polygon instead of beginning a new one.
            polygon_points.clear()

        cv2.imshow('image', img)
        return

    if erase_mode:
        if event == cv2.EVENT_LBUTTONDOWN:
            click_point = (x, y)
            threshold = 8  # pixel radius around the click

            for points in point_list:
                for point in points:
                    if distance(click_point, point) <= threshold:
                        print(f"Point: {points}")
        return

    if event == cv2.EVENT_LBUTTONDOWN:
        drawing = True
        ix, iy = x, y
        img_copy = img.copy()

    elif event == cv2.EVENT_LBUTTONUP:
        if not drawing:
            # Release without a matching press in point mode: there is no
            # valid press position to record.
            return
        drawing = False
        object_point.append([ix, iy])
        if len(object_point) % 2 == 0:
            point_list.append(object_point)
            # Rebind instead of clearing: the old list now lives in point_list.
            object_point = []
        cv2.circle(img, (ix, iy), 1, (0, 0, 255), 1)
        cv2.imshow('image', img)


# Root directory that is searched for "result_*" sub-folders.
base_path = "result_YOLO8OBB/culture"
result_folders = sorted(glob(os.path.join(base_path, "result_*")))

# Collect the images of every result folder, sorted within each folder.
image_files = []
for folder in result_folders:
    images = []

    for ext in ['*.jpg', '*.jpeg', '*.png', '*.bmp']:
        images.extend(glob(os.path.join(folder, ext)))

    image_files.extend(sorted(images))

# Drop files whose name contains "cv_". A new list is built because removing
# items from a list while iterating over it skips the element that follows
# each removal. os.path.basename is used so the check does not depend on the
# path separator.
image_files = [
    file for file in image_files
    if "cv_" not in os.path.basename(file)
]

if not image_files:
    print("No images found in the specified directories")
    exit()

# A start index restored from a previous session may point past the end of the
# current list; wrap it the same way the A/D navigation does.
current_img_index %= len(image_files)

# NOTE(review): cv2.WINDOW_FULLSCREEN is documented as a value for
# setWindowProperty(WND_PROP_FULLSCREEN); confirm it has the intended effect
# when passed to namedWindow.
cv2.namedWindow('image', cv2.WINDOW_FULLSCREEN)
cv2.setMouseCallback('image', draw_point)


def show_current_image():
    """Load the image at ``current_img_index``, overlay saved points and show it.

    The annotation file is looked up next to the image as
    ``<image folder>/<timestamp>.json``, where ``<timestamp>`` is the part of
    the folder name after its last underscore -- the same location
    ``save_point`` writes to. When the file exists, its ``"points"`` list
    replaces ``point_list``, every point is drawn, and the last point of each
    group is labelled with its coordinates.

    The annotated image is shown in the 'image' window and also written to
    ``images/<image folder name>.jpg``.

    Raises:
        OSError: If OpenCV cannot read the image file.
    """
    global img, img_copy, point_list

    image_path = image_files[current_img_index]
    loaded = cv2.imread(image_path)
    if loaded is None:
        # cv2.imread signals failure by returning None rather than raising.
        raise OSError(f"Failed to read image: {image_path}")
    img = loaded
    img_copy = img.copy()
    print(f"\nCurrent image: {image_path}")

    # Derive everything from the image's own folder instead of indexing
    # result_folders by image index (the two lists are not aligned when a
    # folder holds several images or filtered files), and use os.path so the
    # code does not depend on "\\" as the separator.
    folder = os.path.dirname(image_path)
    image_name = os.path.basename(folder)
    timestamp = image_name.split("_")[-1]
    json_path = os.path.join(folder, f"{timestamp}.json")

    if os.path.isfile(json_path):
        isfile = "O"
        with open(json_path, "r") as f:
            points = json.load(f)["points"]
        point_list = points

        for group in points:
            if not group:
                # Nothing to draw or label for an empty group.
                continue
            for x, y in group:
                cv2.circle(img, (x, y), 1, (0, 0, 255), 2)
            # Label the group at its last point, on a white background box.
            label = f"{x, y}"
            text_size, _ = cv2.getTextSize(label, cv2.FONT_ITALIC, 0.4, 1)
            text_w, text_h = text_size
            cv2.rectangle(img, (x, y), (x + text_w, y - text_h), (255, 255, 255), -1)
            cv2.putText(img, label, (x, y), cv2.FONT_ITALIC, 0.4, (0, 0, 255), 1)
    else:
        isfile = "X"

    print(f"Image {current_img_index + 1}/{len(image_files)} [{isfile}]")

    cv2.imshow('image', img)
    # Make sure the snapshot directory exists before writing into it.
    os.makedirs("images", exist_ok=True)
    cv2.imwrite(f"images/{image_name}.jpg", img)


def save_point():
    """Write ``point_list`` to ``<image folder>/<timestamp>.json`` and remember the index.

    ``<timestamp>`` is the part of the image folder's name after its last
    underscore. The file keeps the existing layout: a 4-space indented object
    whose ``"points"`` value is written on a single line. After writing, the
    1-based index of the current image is stored under the ``CurrentIndex``
    settings key.
    """
    global data, point_list

    # os.path instead of splitting on "\\" so the folder is found regardless
    # of the path separator.
    folder = os.path.dirname(image_files[current_img_index])
    timestamp = os.path.basename(folder).split("_")[-1]
    data = {"points": point_list}

    # Serialise the list directly rather than wrapping its repr in quotes and
    # stripping them afterwards; the resulting text is the same for integer
    # coordinates and is guaranteed to be valid JSON.
    payload = '{\n    "points": ' + json.dumps(point_list) + '\n}'

    with open(os.path.join(folder, f"{timestamp}.json"), "w") as f:
        f.write(payload)
    print('save boxes')

    setting.setValue("CurrentIndex", current_img_index + 1)


def erase_point():
    """Toggle erase mode; print a notice when the mode has just been enabled."""
    global erase_mode

    now_erasing = not erase_mode
    erase_mode = now_erasing
    if now_erasing:
        print('Erase mode')


def create_polygon():
    """Toggle polygon mode and discard any polygon vertices collected so far."""
    global polygon_mode, polygon_points

    print('create_polygon')
    # Each toggle, in either direction, starts from an empty vertex list.
    polygon_points = []
    polygon_mode = not polygon_mode


def clear_box():
    """Forget all recorded point groups and any half-finished group."""
    global data, point_list, object_point

    point_list.clear()
    # A single pending click would otherwise be paired with the first click
    # made after the clear (for example on the next image).
    object_point = []


show_current_image()

# Key loop: poll the keyboard and dispatch the shortcuts until Q or ESC.
while True:
    key = cv2.waitKey(1) & 0xFF
    # Compare case-insensitively so every shortcut behaves the same with
    # Shift / Caps Lock (previously E, O and Q only worked in lowercase).
    pressed = chr(key).lower()

    if pressed == 'a':
        # Previous image, wrapping around at the start.
        current_img_index = (current_img_index - 1) % len(image_files)
        clear_box()
        show_current_image()

    elif pressed == 'd':
        # Next image, wrapping around at the end.
        current_img_index = (current_img_index + 1) % len(image_files)
        clear_box()
        show_current_image()

    elif pressed == 'p':
        print(point_list)

    elif pressed == 's':
        save_point()

    elif pressed == 'e':
        erase_point()

    elif pressed == 'c':
        # NOTE(review): the image is redrawn (including points loaded from an
        # existing JSON file) before the list is cleared, so saved points stay
        # visible while point_list is empty -- confirm this order is intended.
        show_current_image()
        clear_box()

    elif pressed == 'o':
        create_polygon()

    elif key == 27 or pressed == 'q':  # 27 = ESC
        break

cv2.destroyAllWindows()

저작자표시 비영리 동일조건

'Development > SAM' 카테고리의 다른 글

[SAM to OBB] Generate Point coord Tool (0)	2024.11.11
SegmentAnyRGBD (0)	2024.11.08
Oriented Bounding Boxes Label Editor (0)	2024.11.08
SAM2 (Segment Anything Model 2)에서 포인트를 이용한 세그멘테이션 (0)	2024.11.04
SAM (OBB) 객체 추출 (0)	2024.10.19

현재글[SAM to OBB] Generate Point coord Tool

개발 일기

Today :
Yesterday :

일	월	화	수	목	금	토
		1	2	3	4	5
6	7	8	9	10	11	12
13	14	15	16	17	18	19
20	21	22	23	24	25	26
27	28	29	30

내 블로그 - 관리자 홈 전환	`Q` `Q`
새 글 쓰기	`W` `W`

글 수정 (권한 있는 경우)	`E` `E`
댓글 영역으로 이동	`C` `C`

이 페이지의 URL 복사	`S` `S`
맨 위로 이동	`T` `T`
티스토리 홈 이동	`H` `H`
단축키 안내	`Shift` + `/` `⇧` + `/`

9학년 5반