7/10 - [11/10K] - nuscene 이미지 저장

개발일지 2024. 7. 10. 23:03

초반에 이미지 저장하는 것은 조금 무식하게 했음.

그래서 nuscene의 구조를 알고 다시 했음.

token 구조를 이용했기때문에 기존에 이미지가 맞지 않는 문제는없음.

simple --> data in simple --> cam in simple,카메라 토큰 추출 --> simple_data --> 파일명 획득 후 정보 추출 이런 식임.

import os
import cv2
import numpy as np
import matplotlib.pyplot as plt
import torch
from torchvision.models.detection import fasterrcnn_resnet50_fpn
from torchvision import transforms
from PIL import Image
from nuscenes.nuscenes import NuScenes
# NuScenes 데이터셋 경로
nusc_data_dir = '/data/sets/nuscenes/samples/'

# 각 카메라 폴더
camera_folders = ['CAM_FRONT_LEFT','CAM_FRONT', 'CAM_FRONT_RIGHT', 'CAM_BACK_LEFT','CAM_BACK', 'CAM_BACK_RIGHT']

target_classes = [0,1,2,3,4,6,7,8,9,10,11,12,13,14,15,16,17]

coco_classes = [
    "__background__", "person", "bicycle", "car", "motorcycle", "airplane", "bus", "train", "truck", "boat",
    "traffic light", "fire hydrant", "stop sign", "parking meter", "bench", "bird", "cat", "dog", "horse", "sheep",
    "cow", "elephant", "bear", "zebra", "giraffe", "backpack", "umbrella", "handbag", "tie", "suitcase", "frisbee",
    "skis", "snowboard", "sports ball", "kite", "baseball bat", "baseball glove", "skateboard", "surfboard",
    "tennis racket", "bottle", "wine glass", "cup", "fork", "knife", "spoon", "bowl", "banana", "apple", "sandwich",
    "orange", "broccoli", "carrot", "hot dog", "pizza", "donut", "cake", "chair", "couch", "potted plant", "bed",
    "dining table", "toilet", "TV", "laptop", "mouse", "remote", "keyboard", "cell phone", "microwave", "oven",
    "toaster", "sink", "refrigerator", "book", "clock", "vase", "scissors", "teddy bear", "hair drier", "toothbrush"
]

def merge_images(sample_record):
    radar_tokens = {
        'front_left': sample_record['data']['CAM_FRONT_LEFT'],
        'front': sample_record['data']['CAM_FRONT'],
        'front_right': sample_record['data']['CAM_FRONT_RIGHT'],
        'back_left': sample_record['data']['CAM_BACK_LEFT'],
        'back': sample_record['data']['CAM_BACK'],
        'back_right': sample_record['data']['CAM_BACK_RIGHT']
    }

    images = []
    for key, img_token in radar_tokens.items():
        img_sensor = nusc.get('sample_data', img_token)
        img = cv2.imread(os.path.join(os.path.join(nusc.dataroot, img_sensor['filename'])))
        if img is not None:
            img = cv2.resize(img, resize_dim)  # 이미지 리사이징
            # CAM_BACK 카메라만 좌우 반전
            if 'back' in key:
                img = cv2.flip(img, 1)
            
            if img is not None:    
                images.append(img)
            else:
                print(f"Error reading image from {img_sensor['filename']}")

    combined_row1 = np.hstack(images[:3])
    combined_row2 = np.hstack(images[3:])
    combined_image = np.vstack([combined_row1, combined_row2]) 
    image = cv2.cvtColor(combined_image, cv2.COLOR_BGR2RGB)
    
    return image

def detect_objects(model,transform,image):
    image_tensor = transform(image).unsqueeze(0)
    with torch.no_grad():
        predictions = model(image_tensor)
    return predictions[0]
    
def visualize_predictions(image, predictions,target_classes, score_threshold=0.5):
    plt.cla()
    plt.imshow(image)
    plt.axis('off')
    
    for box, label, score in zip(predictions['boxes'], predictions['labels'], predictions['scores']):
        if score > score_threshold and label in target_classes:
            x1, y1, x2, y2 = box
            plt.gca().add_patch(plt.Rectangle((x1, y1), x2-x1, y2-y1, edgecolor='red', facecolor='none', linewidth=2))
            
           # 라벨 숫자 그리기
            plt.text(x1, y1, f'{coco_classes[label]}', fontsize=12, bbox=dict(facecolor='yellow', alpha=0.5))
            
    
    plt.pause(1)  # Pause to update the plot
    
    
def make_mf4(scene_type):
    # 동영상 작성
    video_filename = os.path.join(output_dir, f'combined_scene_{scene_type}.mp4')
    frame_files = sorted([os.path.join(output_dir, f) for f in os.listdir(output_dir) if f.endswith('.jpg')])

    # 첫 번째 프레임에서 프레임 크기 가져오기
    frame = cv2.imread(frame_files[0])
    height, width, layers = frame.shape

    # 동영상 작성자 초기화
    video = cv2.VideoWriter(video_filename, cv2.VideoWriter_fourcc(*'mp4v'), 10, (width, height))

    # 각 프레임을 동영상 작성자에 추가
    for frame_file in frame_files:
        frame = cv2.imread(frame_file)
        video.write(frame)

    # 동영상 작성 종료
    video.release()

    print(f"Video saved as {video_filename}")

plt.figure(figsize=(30, 15))    
# 이미지 리사이즈 크기 (옵션)
resize_dim = (640, 480)  # 원하는 크기로 설정

# 결과 저장 디렉토리
output_dir = './combined_images'
if not os.path.exists(output_dir):
    os.makedirs(output_dir)

# 사전 학습된 Faster R-CNN 모델 로드
model = fasterrcnn_resnet50_fpn(pretrained=True)
model.eval()

# 이미지 전처리
transform = transforms.Compose([transforms.ToTensor()])

# Initialize 
nusc = NuScenes(version='v1.0-mini', dataroot='/data/sets/nuscenes', verbose=True)

scene_type = 1

scene = nusc.scene[scene_type]  # Adjust the scene index as needed
current_sample_token = scene['first_sample_token']

enable_write_avi = True

i = 0
while current_sample_token:

    sample_record = nusc.get('sample', current_sample_token)
    # 이미지 합성
    image = merge_images(sample_record)
    
    # 타겟 검출
    img_pil = Image.fromarray(image)
    predictions = detect_objects(model,transform,img_pil)        

    print(f"Predictions for combined image:")
    visualize_predictions(image, predictions,target_classes)
    
    # 이미지 저장 
    i=i+1
    output_path = os.path.join(output_dir, f"combined_image_{i}.jpg")
    plt.savefig(output_path)  # PNG 형식으로 저장
    
    current_sample = nusc.get('sample', current_sample_token)    
    current_sample_token = current_sample['next']  # Move to the next sample
    i = i + 1
    print(i)

if enable_write_avi:
    make_mf4(scene_type)

아래 처럼 똑같이 잘 나오는 것을 확인 할 수 있음.

'개발일지' 카테고리의 다른 글

7/17 - [15/10K] - __getitem__, collate_fn 역할 (0)	2024.07.17
[7/16, 13/10K] - 가중치 초기화 설명(Kaiming, Xavier) (0)	2024.07.16
7/9 - (9/10K) (0)	2024.07.10
7/1 - (7/10000) (0)	2024.07.01
6/30 - (5/10000) (1)	2024.06.30

ABOUT ME

Connecting the dots Connecting the dots

'개발일지' 카테고리의 다른 글

티스토리툴바

ABOUT ME

'개발일지' 카테고리의 다른 글

관련글 관련글 더보기

티스토리툴바