20번째 수업(0529)

학교/인공지능

20번째 수업(0529)

공부 기록장 2024. 5. 29. 15:53

과제 - test 데이터 중 0번째 숫자 출력

"""train-images-idx3-ubyte.gz
   train-labels-idx1-ubyte.gz
   t10k-labels-idx1-ubyte.gz
   t10k-images-idx3-ubyte.gz
"""
from google.colab import files

# Ask for a file upload through the Colab `files` helper imported above.
# The loading code further down opens the four MNIST .gz archives by relative
# path, so those are presumably the files to upload here -- confirm against
# the notebook setup. `uploaded` is not read again in the visible code.
uploaded = files.upload()

import gzip
import numpy as np
import matplotlib.pyplot as plt
import struct

# 데이터 로드 함수
def load_mnist_images(filename):
    """Load a gzip-compressed MNIST IDX3 image archive into a NumPy array.

    The archive starts with a 16-byte big-endian header (magic number, image
    count, row count, column count) followed by one unsigned byte per pixel.

    Args:
        filename: Path to an ``*-images-idx3-ubyte.gz`` archive.

    Returns:
        A ``uint8`` array of shape ``(num, rows, cols)`` built directly on
        the decompressed bytes.

    Raises:
        ValueError: If the magic number is not the IDX3 image magic (2051),
            or the pixel payload size disagrees with the header dimensions.
        struct.error: If the file is too short to contain the header.
    """
    expected_magic = 0x00000803  # 2051: unsigned-byte data, 3 dimensions

    with gzip.open(filename, 'rb') as f:
        magic, num, rows, cols = struct.unpack('>IIII', f.read(16))
        # Reject label archives / unrelated files up front instead of letting
        # them surface later as a confusing reshape failure.
        if magic != expected_magic:
            raise ValueError(
                f"{filename}: not an IDX3 image file "
                f"(magic {magic}, expected {expected_magic})"
            )
        payload = f.read()

    expected_size = num * rows * cols
    if len(payload) != expected_size:
        raise ValueError(
            f"{filename}: header declares {num}x{rows}x{cols} = "
            f"{expected_size} pixel bytes but the file holds {len(payload)}"
        )

    return np.frombuffer(payload, dtype=np.uint8).reshape(num, rows, cols)

def load_mnist_labels(filename):
    """Load a gzip-compressed MNIST IDX1 label archive into a NumPy array.

    The archive starts with an 8-byte big-endian header (magic number, label
    count) followed by one unsigned byte per label.

    Args:
        filename: Path to a ``*-labels-idx1-ubyte.gz`` archive.

    Returns:
        A one-dimensional ``uint8`` array holding ``num`` labels, built
        directly on the decompressed bytes.

    Raises:
        ValueError: If the magic number is not the IDX1 label magic (2049),
            or the number of label bytes disagrees with the header count.
        struct.error: If the file is too short to contain the header.
    """
    expected_magic = 0x00000801  # 2049: unsigned-byte data, 1 dimension

    with gzip.open(filename, 'rb') as f:
        magic, num = struct.unpack('>II', f.read(8))
        if magic != expected_magic:
            raise ValueError(
                f"{filename}: not an IDX1 label file "
                f"(magic {magic}, expected {expected_magic})"
            )
        payload = f.read()

    # The header count was previously read and ignored; checking it catches
    # truncated or padded files before labels get paired with images.
    if len(payload) != num:
        raise ValueError(
            f"{filename}: header declares {num} labels "
            f"but the file holds {len(payload)}"
        )

    return np.frombuffer(payload, dtype=np.uint8)

# Archive names, resolved relative to the current working directory
train_images_path, train_labels_path = (
    'train-images-idx3-ubyte.gz',
    'train-labels-idx1-ubyte.gz',
)
test_images_path, test_labels_path = (
    't10k-images-idx3-ubyte.gz',
    't10k-labels-idx1-ubyte.gz',
)

# Decode both splits; within each split the images are read before the labels
train_images, train_labels = (
    load_mnist_images(train_images_path),
    load_mnist_labels(train_labels_path),
)
test_images, test_labels = (
    load_mnist_images(test_images_path),
    load_mnist_labels(test_labels_path),
)

# Sanity check: report the shape of every loaded array, one per line
print(
    f"훈련 이미지: {train_images.shape}",
    f"훈련 레이블: {train_labels.shape}",
    f"테스트 이미지: {test_images.shape}",
    f"테스트 레이블: {test_labels.shape}",
    sep="\n",
)

# 이미지를 시각화하는 함수
def show_mnist_image(index, dataset='train'):
    """Plot one MNIST image with its label, then print its pixel values.

    Args:
        index: Position of the image within the selected split.
        dataset: ``'train'`` or ``'test'``; selects which pair of
            module-level image/label arrays is read.

    Returns:
        None. If ``dataset`` is not one of the two names, or ``index`` is
        negative or not less than the number of images, a message is printed
        and nothing is plotted.
    """
    # Guard: only the two known split names are accepted
    if dataset not in ('train', 'test'):
        print("Dataset should be 'train' or 'test'.")
        return

    use_train = dataset == 'train'
    split_images = train_images if use_train else test_images
    split_labels = train_labels if use_train else test_labels

    # Guard: negative indices are rejected rather than wrapping around
    below_range = index < 0
    beyond_range = index >= len(split_images)
    if below_range or beyond_range:
        print(f"Index {index} is out of bounds for MNIST dataset.")
        return

    digit, label = split_images[index], split_labels[index]

    # Grayscale rendering with the label as title and a colour scale
    plt.figure()
    plt.imshow(digit, cmap='gray')
    plt.title(f"Label: {label}")
    plt.colorbar()
    plt.grid(False)
    plt.show()

    # Dump the raw values: one text line per image row, width-3 columns
    for scanline in digit:
        cells = [f'{value:3}' for value in scanline]
        print(' '.join(cells))

# Interactive viewer: show test-set images by index until the user enters -1
while True:
    user_input = input("이미지 인덱스를 입력하세요 (-1을 입력하면 종료): ")

    # Guard only the int() conversion. Previously the display call sat inside
    # the same try, so any ValueError raised while plotting was misreported
    # as invalid user input.
    try:
        index = int(user_input)
    except ValueError:
        print("유효한 숫자를 입력하세요.")
        continue

    # -1 is the exit sentinel, not an index
    if index == -1:
        print("프로그램을 종료합니다.")
        break

    show_mnist_image(index, 'test')