def trans_t(t):
    """Return the 4x4 homogeneous matrix translating by ``t`` along the Z axis.

    The result is a float32 ``torch.Tensor`` equal to the identity except
    for the Z entry of the translation column (row 2, column 3), which
    holds ``t``.
    """
    rows = [
        [1, 0, 0, 0],
        [0, 1, 0, 0],
        [0, 0, 1, t],
        [0, 0, 0, 1],
    ]
    return torch.Tensor(rows).float()


import os
import imageio.v2 as imageio

import torch
import numpy as np
import matplotlib.pyplot as plt
import pytransform3d.camera as pc
import pytransform3d.transformations as pt

from pytransform3d.plot_utils import make_3d_axis
from pytransform3d.rotations import active_matrix_from_intrinsic_euler_xyz
from pytransform3d.transformations import transform_from, plot_transform
from pytransform3d.camera import make_world_grid, world2image, plot_camera


# Demo cell: place one camera in the world, project a planar grid of world
# points into its image, and show the 3D scene next to the resulting image.

# Camera pose (camera -> world), built from intrinsic XYZ Euler angles and a
# translation vector.
cam2world = transform_from(
    active_matrix_from_intrinsic_euler_xyz([-np.pi + 1, -0.1, 0.3]),
    [0.2, -1, 0.5])
focal_length = 0.0036
sensor_size = (0.00367, 0.00274)
image_size = (640, 480)
# Intrinsic matrix: focal length on the diagonal, principal point at the
# centre of the sensor (half the sensor width / height).
intrinsic_camera_matrix = np.array([
    [focal_length, 0, sensor_size[0] / 2],
    [0, focal_length, sensor_size[1] / 2],
    [0, 0, 1]
])

# Sample points in the world and project them into the image.
# NOTE(review): kappa is forwarded to world2image; per the pytransform3d
# docs it parameterises the lens-distortion model - confirm the value.
world_grid = make_world_grid(n_points_per_line=101)
image_grid = world2image(world_grid, cam2world, sensor_size, image_size,
                         focal_length, kappa=0.4)

# Left panel: 3D view with the world frame, the camera frame and its frustum.
plt.figure(figsize=(12, 5))
ax = make_3d_axis(1, 121, unit="m")
# This initial view is replaced by the second view_init call further down.
ax.view_init(elev=30, azim=-70)
plot_transform(ax)
plot_transform(ax, A2B=cam2world, s=0.3, name="Camera")
plot_camera(ax, intrinsic_camera_matrix, cam2world,
            sensor_size=sensor_size, virtual_image_distance=0.5)
ax.set_title("Camera and world frames")
ax.scatter(
    world_grid[:, 0], world_grid[:, 1], world_grid[:, 2], s=1, alpha=0.2)
# Highlight the last grid point in red so it can be matched in the image panel.
ax.scatter(world_grid[-1, 0], world_grid[-1, 1], world_grid[-1, 2], color="r")
ax.view_init(elev=25, azim=-130)

# Right panel: the projected grid in pixel coordinates.
ax = plt.subplot(122, aspect="equal")
ax.set_title("Camera image")
ax.set_xlim(0, image_size[0])
ax.set_ylim(0, image_size[1])
# -(y - height) == height - y: mirrors the vertical pixel coordinate about
# the image height (presumably because image rows grow downwards while the
# plot's y axis grows upwards).
ax.scatter(image_grid[:, 0], -(image_grid[:, 1] - image_size[1]))
ax.scatter(image_grid[-1, 0], -(image_grid[-1, 1] - image_size[1]), color="r")

plt.show()


def trans_t(t):
    """Return the 4x4 homogeneous matrix translating by ``t`` along the Z axis.

    The result is a float32 ``torch.Tensor`` equal to the identity except
    for the Z entry of the translation column (row 2, column 3), which
    holds ``t``.
    """
    rows = [
        [1, 0, 0, 0],
        [0, 1, 0, 0],
        [0, 0, 1, t],
        [0, 0, 0, 1],
    ]
    return torch.Tensor(rows).float()

def rot_phi(phi):
    """Return the 4x4 homogeneous rotation about the X axis by ``phi`` radians.

    The X row and column are left untouched; the Y/Z sub-block is
    ``[[cos, -sin], [sin, cos]]``. The result is a float32 ``torch.Tensor``.
    """
    c, s = np.cos(phi), np.sin(phi)
    rows = [
        [1, 0, 0, 0],
        [0, c, -s, 0],
        [0, s, c, 0],
        [0, 0, 0, 1],
    ]
    return torch.Tensor(rows).float()

def rot_theta(th):
    """Return the 4x4 homogeneous rotation about the Y axis for angle ``th`` (radians).

    Sign layout: ``-sin`` sits in row 0 and ``+sin`` in row 2. That is the
    transpose of the usual right-handed R_y(th), i.e. it rotates by ``-th``
    in that convention. The result is a float32 ``torch.Tensor``.
    """
    c, s = np.cos(th), np.sin(th)
    rows = [
        [c, 0, -s, 0],
        [0, 1, 0, 0],
        [s, 0, c, 0],
        [0, 0, 0, 1],
    ]
    return torch.Tensor(rows).float()

# Axis remap used as the final left-multiplied factor in pose_spherical:
# negate X and exchange Y with Z. Its determinant is +1, so it is a proper
# rotation rather than a reflection.
swap_mat = torch.Tensor([
    [-1., 0., 0., 0.],  # x' = -x
    [0., 0., 1., 0.],   # y' =  z
    [0., 1., 0., 0.],   # z' =  y
    [0., 0., 0., 1.],
])
'''
swap_mat = torch.Tensor([
    [ 1, 0, 0, 0],
    [ 0, 0, 1, 0],
    [ 0, 1, 0, 0],
    [ 0, 0, 0, 1]
])
카메라의 이동을 다룰 때, 반사는 오른손 좌표계를 반전시켜 충돌을 일으킬 수 있으므로, 오직 이동과 회전만 고려한다.
그러나 X축 반전이 없는 위 행렬은 det = -1인 반사 행렬로, 연속된 회전 행렬로 분해할 수 없다. (연쇄 회전 행렬의 det = 1이다.)
따라서 어쩔 수 없이 X 축에 반전을 주는 것이다.
'''

'''
해당 함수에서 원본 코드에 있는 변수의 이름인 c2w를 그대로 사용하였지만, 여기서는 정 반대의 정보인 w2c(extrinsic matrix)를 구하기 위해 사용됩니다.
즉, 월드 좌표계에 곱하여 카메라 좌표계로 이동하는 행렬에 대한 정보가 담겨있습니다.
'''
def pose_spherical(phi, theta, radius):
    """Build a spherical camera pose and return every intermediate matrix.

    Args:
        phi: Angle in degrees passed (after conversion to radians) to
            ``rot_phi``.
        theta: Angle in degrees passed (after conversion to radians) to
            ``rot_theta``.
        radius: Offset passed to ``trans_t``.

    Returns:
        A list of five independent 4x4 tensors, one per construction step:
        the initial alignment, then the running product after
        left-multiplying ``trans_t``, ``rot_phi``, ``rot_theta`` and
        ``swap_mat`` in that order. The last entry is the complete pose.

    NOTE(review): the note preceding this function describes the result as
    w2c, while the plotting code in this file passes these matrices to
    pytransform3d as ``cam2world`` - confirm which reading is intended.
    """
    # Alignment step (author's note): the pytransform3d camera looks along
    # +Z whereas the Blender-dataset camera looks along -Z, so start from a
    # 180 degree rotation about X (180/180.*pi is exactly pi).
    pose = rot_phi(np.pi)
    stages = [pose.clone()]

    # Factors are applied by left-multiplication, in this order.
    factors = (
        trans_t(radius),                  # 1) translation
        rot_phi(phi / 180. * np.pi),      # 2) rot_phi
        rot_theta(theta / 180. * np.pi),  # 3) rot_theta
        swap_mat,                         # 4) final axis remap
    )
    for factor in factors:
        pose = factor @ pose
        stages.append(pose.clone())  # snapshot each stage as its own tensor

    return stages


# Camera intrinsics used only for drawing frusta in the visualisations.
sensor_size = np.array([0.036, 0.024])
_half_width, _half_height = sensor_size / 2.0  # principal point = sensor centre
intrinsic_matrix = np.array([
    [0.05, 0, _half_width],
    [0, 0.05, _half_height],
    [0, 0, 1],
])
virtual_image_distance = 1.0  # controls the size of the drawn view frustum


# Visualise every intermediate matrix returned by pose_spherical for one
# (phi, theta, radius) triple, each drawn as a coordinate frame plus frustum.
phi, theta, radius = -30, 90, 3
# The bare string below is the author's note, kept verbatim. It says that
# phi is -30 rather than 30 because of swap_mat.
'''
phi의 값이 30이 아닌 -30인 이유도 swap_mat 때문이다.
'''
c2w_list = pose_spherical(phi, theta, radius)  # [torch.Tensor(4x4), ...]

fig = plt.figure(figsize=(9, 9))
ax = fig.add_subplot(111, projection='3d')

# World frame at the origin, for reference.
pt.plot_transform(ax=ax, A2B=np.eye(4), s=0.4, name="World")

for i, c2w_torch in enumerate(c2w_list):
    c2w_np = c2w_torch.numpy()  # pytransform3d works with numpy arrays
    
    # Draw the coordinate frame (origin + 3 axes)
    ax = pt.plot_transform(
        A2B=c2w_np,  # (4x4) camera -> world matrix
        ax=ax, 
        s=0.2,        # axis length scale
        name=f"Step {i}"
    )
    
    # Draw the camera frustum
    pc.plot_camera(
        ax=ax,
        cam2world=c2w_np,        # (4x4) camera -> world
        M=intrinsic_matrix,      
        sensor_size=sensor_size,
        virtual_image_distance=virtual_image_distance,
        label=f"Step {i}",
        color="red", 
        alpha=0.2
    )

# Viewing angle: elev is the elevation above the horizon, azim the horizontal rotation
ax.view_init(elev=5, azim=45)

# Generous axis limits so that cameras far from the origin stay visible
ax.set_xlim([-3, 3])
ax.set_ylim([-3, 3])
ax.set_zlim([-3, 3])

# For a 1:1:1 axis ratio pytransform3d's set_3d_axes_equal could be used as well;
# set_box_aspect is enough here (matplotlib 3.3+)
ax.set_box_aspect((1,1,1))

plt.show()


def render_frame(phi, theta, radius, filename):
    """Draw the step-by-step camera poses for one parameter set and save them.

    Every matrix returned by ``pose_spherical(phi, theta, radius)`` is drawn
    as a coordinate frame plus a camera frustum in a fresh 3D figure, which
    is then written to ``filename``.

    Relies on the module-level ``intrinsic_matrix`` and ``sensor_size`` for
    the frustum geometry.

    Args:
        phi: Forwarded to ``pose_spherical`` (degrees).
        theta: Forwarded to ``pose_spherical`` (degrees).
        radius: Forwarded to ``pose_spherical``.
        filename: Output path handed to ``Figure.savefig``.
    """
    fig = plt.figure(figsize=(6, 6))
    try:
        ax = fig.add_subplot(111, projection='3d')
        virtual_image_distance = 1.0

        # Intermediate poses, one 4x4 torch.Tensor per construction step.
        c2w_list = pose_spherical(phi, theta, radius)

        # World frame at the origin, for reference.
        pt.plot_transform(ax=ax, A2B=np.eye(4), s=0.4, name="World")

        for i, c2w_torch in enumerate(c2w_list):
            c2w_np = c2w_torch.numpy()  # pytransform3d works with numpy arrays

            # Coordinate frame (origin + 3 axes).
            ax = pt.plot_transform(
                A2B=c2w_np,
                ax=ax,
                s=0.2,
                name=f"Step {i}"
            )

            # Camera frustum.
            pc.plot_camera(
                ax=ax,
                cam2world=c2w_np,
                M=intrinsic_matrix,
                sensor_size=sensor_size,
                virtual_image_distance=virtual_image_distance,
                label=f"Step {i}",
                color="red",
                alpha=0.2
            )

        # Generous axis limits so that cameras far from the origin stay visible.
        ax.set_xlim([-4, 4])
        ax.set_ylim([-4, 4])
        ax.set_zlim([-4, 4])

        # Equal aspect on all three axes (matplotlib 3.3+).
        ax.set_box_aspect((1, 1, 1))
        ax.view_init(elev=10, azim=45)

        # Address the figure and axes explicitly instead of relying on
        # pyplot's notion of the "current" figure.
        ax.set_title(f"phi={phi:.1f}, theta={theta:.1f}, radius={radius:.1f}")
        fig.savefig(filename, bbox_inches='tight', pad_inches=0.1)
    finally:
        # Always release the figure, even if plotting or saving failed, so
        # repeated calls do not accumulate open figures.
        plt.close(fig)

def create_animation_gif(phi=-30, radius=4, n_frames=120, theta_step=3,
                         fps=30, out_dir="frames"):
    """Render a theta sweep frame by frame and assemble the frames into a GIF.

    For ``i`` in ``range(n_frames)`` a frame is rendered with
    ``theta = i * theta_step`` via ``render_frame`` and saved as
    ``<out_dir>/frame_<iii>.png``; all frames are then written to
    ``<out_dir>/animation.gif``. With the defaults this sweeps theta from
    0 to 357 degrees in 3 degree steps at fixed ``phi=-30`` and ``radius=4``.

    Args:
        phi: Fixed phi angle forwarded to ``render_frame``.
        radius: Fixed radius forwarded to ``render_frame``.
        n_frames: Number of frames to render; must be at least 1.
        theta_step: Increment of theta between consecutive frames.
        fps: Frame rate handed to ``imageio.mimsave``.
        out_dir: Directory for the PNG frames and the GIF; created if missing.

    Raises:
        ValueError: If ``n_frames`` is smaller than 1.
    """
    if n_frames < 1:
        raise ValueError("n_frames must be at least 1")

    os.makedirs(out_dir, exist_ok=True)

    images = []
    for i in range(n_frames):
        theta = i * theta_step
        filename = os.path.join(out_dir, f"frame_{i:03d}.png")
        # 1) Render the frame to a PNG file.
        render_frame(phi, theta, radius, filename)

        # 2) Read the PNG back and collect it for the GIF.
        images.append(imageio.imread(filename))

    gif_path = os.path.join(out_dir, "animation.gif")
    # loop=0 is passed through to the GIF writer unchanged.
    imageio.mimsave(gif_path, images, fps=fps, loop=0)

    print(f"GIF saved to {gif_path}")

# Run the sweep; PNG frames and animation.gif are written under "frames/".
create_animation_gif()

# Output:
# GIF saved to frames/animation.gif


import json


# data practice: load the camera metadata of the lego test split and pull
# the per-frame 'rotation' and 'transform_matrix' entries into two lists.
_datadir = './data/nerf_synthetic/lego'

with open(os.path.join(_datadir, 'transforms_test.json'), 'r') as fp:
    meta = json.load(fp)

# Quick look at the file contents: the camera_angle_x value, the first
# frame record, that record's matrix, and the number of frames.
print(meta['camera_angle_x'])
print(meta['frames'][0])
print(meta['frames'][0]['transform_matrix'])
print(len(meta['frames']))

rotations = [frame['rotation'] for frame in meta['frames']]
transform_matrixes = [frame['transform_matrix'] for frame in meta['frames']]

# Output:
# 0.6911112070083618
# {'file_path': './test/r_0', 'rotation': 0.031415926535897934, 'transform_matrix': [[-0.9999999403953552, 0.0, 0.0, 0.0], [0.0, -0.7341099977493286, 0.6790305972099304, 2.737260103225708], [0.0, 0.6790306568145752, 0.7341098785400391, 2.959291696548462], [0.0, 0.0, 0.0, 1.0]]}
# [[-0.9999999403953552, 0.0, 0.0, 0.0], [0.0, -0.7341099977493286, 0.6790305972099304, 2.737260103225708], [0.0, 0.6790306568145752, 0.7341098785400391, 2.959291696548462], [0.0, 0.0, 0.0, 1.0]]
# 200


# print(rotations)
# print(transform_matrixes[0])


# Plot a single camera pose taken from the Blender dataset next to the
# world frame.
fig = plt.figure(figsize=(9, 9))
ax = fig.add_subplot(111, projection='3d')

pt.plot_transform(ax=ax, A2B=np.eye(4), s=0.4, name="World")

# Aligns the Blender-dataset camera with the pytransform3d camera
# (180 degree rotation about X, i.e. Y and Z negated)
fix_mat = np.array([
    [1,  0,  0, 0],
    [0, -1,  0, 0],
    [0,  0, -1, 0],
    [0,  0,  0, 1]
])

# One transform_matrix from the Blender dataset.
# Despite its name, c2w_list holds a single 4x4 matrix as nested lists.
c2w_list = [[-0.9999999403953552, 0.0, 0.0, 0.0],
            [0.0, -0.7341099977493286, 0.6790305972099304, 2.737260103225708],
            [0.0, 0.6790306568145752, 0.7341098785400391, 2.959291696548462],
            [0.0, 0.0, 0.0, 1.0]]

# Right-multiplying by fix_mat negates the matrix's Y and Z columns and
# leaves the translation column unchanged.
c2w_np = np.array(c2w_list) @ fix_mat

# Draw the coordinate frame (origin + 3 axes)
ax = pt.plot_transform(
    A2B=c2w_np,  # (4x4) camera -> world matrix
    ax=ax, 
    s=0.2,        # axis length scale
    # name=f"Step {i}"
)

# Draw the camera frustum
pc.plot_camera(
    ax=ax,
    cam2world=c2w_np,        # (4x4) camera -> world
    M=intrinsic_matrix,      
    sensor_size=sensor_size,
    virtual_image_distance=virtual_image_distance,
    # label=f"Step {i}",
    color="red", 
    alpha=0.2
)

# Viewing angle: elev is the elevation above the horizon, azim the horizontal rotation
ax.view_init(elev=10, azim=45)

# Generous axis limits so that cameras far from the origin stay visible
ax.set_xlim([-4, 4])
ax.set_ylim([-4, 4])
ax.set_zlim([-4, 4])

# For a 1:1:1 axis ratio pytransform3d's set_3d_axes_equal could be used as well;
# set_box_aspect is enough here (matplotlib 3.3+)
ax.set_box_aspect((1,1,1))

plt.show()


# Plot every fifth camera pose from transform_matrixes around the world frame.

# Aligns the Blender-dataset camera with the pytransform3d camera
# (180 degree rotation about X, i.e. Y and Z negated)
fix_mat = np.array([
    [1,  0,  0, 0],
    [0, -1,  0, 0],
    [0,  0, -1, 0],
    [0,  0,  0, 1]
])

virtual_image_distance = 0.5
fig = plt.figure(figsize=(9, 9))
ax = fig.add_subplot(111, projection='3d')

pt.plot_transform(ax=ax, A2B=np.eye(4), s=0.4, name="World")

# Despite its name, c2w_list is one 4x4 matrix (nested lists) per iteration.
for i, c2w_list in enumerate(transform_matrixes):
    # Draw only every fifth pose to keep the figure readable.
    if i % 5 == 0:
        # c2w_np = np.array(c2w_list) # pytransform3d works with numpy arrays
        c2w_np = np.array(c2w_list) @ fix_mat
        
        # Draw the coordinate frame (origin + 3 axes)
        ax = pt.plot_transform(
            A2B=c2w_np,  # (4x4) camera -> world matrix
            ax=ax, 
            s=0.2,        # axis length scale
            name=f"Step {i}"
        )
        
        # Draw the camera frustum
        pc.plot_camera(
            ax=ax,
            cam2world=c2w_np,        # (4x4) camera -> world
            M=intrinsic_matrix,      
            sensor_size=sensor_size,
            virtual_image_distance=virtual_image_distance,
            label=f"Step {i}",
            color="red", 
            alpha=0.2
        )

# Viewing angle: elev is the elevation above the horizon, azim the horizontal rotation
ax.view_init(elev=30, azim=45)

# Generous axis limits so that cameras far from the origin stay visible
ax.set_xlim([-3, 3])
ax.set_ylim([-3, 3])
ax.set_zlim([-3, 3])

# For a 1:1:1 axis ratio pytransform3d's set_3d_axes_equal could be used as well;
# set_box_aspect is enough here (matplotlib 3.3+)
ax.set_box_aspect((1,1,1))

plt.show()


# Line plot of the per-frame 'rotation' values against their frame index.
plt.figure(figsize=(10, 5))
plt.plot(rotations, marker='o', linestyle='-', markersize=4, label='Value Trend')
plt.title("Rotations", fontsize=14)
plt.xlabel("Index", fontsize=12)
plt.ylabel("Value", fontsize=12)
plt.grid(alpha=0.5)
plt.legend()
plt.show()

3. NeRF Network (0)	2025.03.24
2. Calculating Rays (0)	2025.03.24

내 블로그 - 관리자 홈 전환	`Q` `Q`
새 글 쓰기	`W` `W`

글 수정 (권한 있는 경우)	`E` `E`
댓글 영역으로 이동	`C` `C`

이 페이지의 URL 복사	`S` `S`
맨 위로 이동	`T` `T`
티스토리 홈 이동	`H` `H`
단축키 안내	`Shift` + `/` `⇧` + `/`

Fluffy Shark Studio

티스토리 뷰

1. Camera Matrix

[1] 카메라 이론¶

1. 병진 행렬: `trans_t(t)`¶

2. X축 회전 행렬: `rot_phi(phi)`¶

3. Y축 회전 행렬: `rot_theta(th)`¶

4. `pose_spherical(phi, theta, radius)`¶

5. 카메라 외부행렬¶

6. 카메라 외부 행렬의 역행렬¶

[2] pytransform3d 라이브러리를 이용한 카메라 시각화¶

[3] NeRF의 Cam to World Matrix 이해하기¶

1. Blender vs. pytransform3d의 기본 좌표계 차이¶

2. 왜 시각화 라이브러리에서 이동과 회전 행렬만을 사용할까?¶

3. 회전 행렬과 반사 행렬의 판별¶

[4] 블렌더 데이터셋 살펴보기¶

요약¶

'코드 분석 > NeRF' 카테고리의 다른 글

티스토리툴바

단축키

내 블로그

블로그 게시글

모든 영역

« 2025/04 »
일	월	화	수	목	금	토
		1	2	3	4	5
6	7	8	9	10	11	12
13	14	15	16	17	18	19
20	21	22	23	24	25	26
27	28	29	30

티스토리 뷰

1. Camera Matrix

[1] 카메라 이론¶

1. 병진 행렬: trans_t(t)¶

2. X축 회전 행렬: rot_phi(phi)¶

3. Y축 회전 행렬: rot_theta(th)¶

4. pose_spherical(phi, theta, radius)¶

5. 카메라 외부행렬¶

6. 카메라 외부 행렬의 역행렬¶

[2] pytransform3d 라이브러리를 이용한 카메라 시각화¶

[3] NeRF의 Cam to World Matrix 이해하기¶

1. Blender vs. pytransform3d의 기본 좌표계 차이¶

2. 왜 시각화 라이브러리에서 이동과 회전 행렬만을 사용할까?¶

3. 회전 행렬과 반사 행렬의 판별¶

[4] 블렌더 데이터셋 살펴보기¶

요약¶

'코드 분석 > NeRF' 카테고리의 다른 글

티스토리툴바

단축키

내 블로그

블로그 게시글

모든 영역

1. 병진 행렬: `trans_t(t)`¶

2. X축 회전 행렬: `rot_phi(phi)`¶

3. Y축 회전 행렬: `rot_theta(th)`¶

4. `pose_spherical(phi, theta, radius)`¶