# ! pip install tensorflow


import tensorflow as tf

# Print the installed TensorFlow version.
print(tf.__version__)

2.8.0


# Prepare the MNIST (handwritten digit) image data.
# load_data() is unpacked as a (train, test) pair of (images, labels) pairs.

(x_train, y_train), (x_test, y_test) = tf.keras.datasets.mnist.load_data()

# Print the shape of each of the four arrays.
print(x_train.shape, y_train.shape, x_test.shape, y_test.shape)

Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/mnist.npz
11493376/11490434 [==============================] - 0s 0us/step
11501568/11490434 [==============================] - 0s 0us/step
(60000, 28, 28) (60000,) (10000, 28, 28) (10000,)


# Check the element type of the numpy array that holds the image data
# (first element of the first row of the first image).
type(x_train[0, 0, 0])

numpy.uint8


# sample code 7-1
%matplotlib inline

import matplotlib.pyplot as plt
import numpy as np
import tensorflow as tf

# Create a figure with one row and two columns of axes.
fig, ax = plt.subplots(1, 2, figsize=(2.8 * 2, 2.8))

# First training image and its inverse (each value v becomes 255 - v).
img1 = x_train[0]
img2 = 255 - img1   # invert image

# Left panel: the original image drawn with the gray colormap, axes hidden.
ax[0].imshow(img1, cmap='gray')
ax[0].axis('off')

# Right panel: the inverted image drawn the same way.
ax[1].imshow(img2, cmap='gray')
ax[1].axis('off')

plt.show()


# Prepare the CIFAR-10 image data.
import tensorflow as tf

# NOTE: this rebinds x_train / y_train / x_test / y_test, replacing the
# MNIST arrays that were loaded earlier under the same names.
(x_train, y_train), (x_test, y_test) = tf.keras.datasets.cifar10.load_data()
# Print the shape of each of the four arrays.
print(x_train.shape, y_train.shape, x_test.shape, y_test.shape)

Downloading data from https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz
170500096/170498071 [==============================] - 4s 0us/step
170508288/170498071 [==============================] - 4s 0us/step
(50000, 32, 32, 3) (50000, 1) (10000, 32, 32, 3) (10000, 1)


# Check the element type of the numpy array that holds the image data
# (first channel of the first pixel of the first image).
type(x_train[0, 0, 0, 0])

numpy.uint8


# sample code 7-2
%matplotlib inline

import matplotlib.pyplot as plt
import numpy as np
import tensorflow as tf

# Create a figure with one row and two columns of axes.
fig, ax = plt.subplots(1, 2, figsize=(3.2 * 2, 3.2))

# The same image in two representations: the array as loaded, and a
# float32 copy divided by 255.
img1 = x_train[6]  # [0, 255]
img2 = img1.astype('float32') / 255. # [0.0, 1.0]

# Left panel: the image as loaded, axes hidden.
ax[0].imshow(img1)
ax[0].axis('off')

# Right panel: the float32 version, axes hidden.
ax[1].imshow(img2)
ax[1].axis('off')

plt.show()


# Element type of the numpy array that holds the image data.
# When images are used for deep learning, it is convenient to keep them as
# float32 values in the range [0, 1] or [-1, 1].
type(img2[0,0,0])

numpy.float32


# Download the data at the given URL to the given location.
import os
import urllib.request

url = 'https://zenodo.org/record/158963/files/fadg0.zip'
filepath = 'data/fadg0.zip'

# Split the destination into its directory part and its file-name part.
dpath = os.path.dirname(filepath)
fname = os.path.basename(filepath)

# Create the destination directory first; an already existing one is fine.
os.makedirs(name=dpath, exist_ok=True)
urllib.request.urlretrieve(url, filename=filepath)

('data/fadg0.zip', <http.client.HTTPMessage at 0x7f0a1626e250>)


# Check the files: choose the directory-listing commands for this OS.
# LS lists one directory, LS_R lists recursively.
if os.name != 'nt':
    LS, LS_R = 'ls -l', 'ls -lR'
else:
    LS, LS_R = 'dir', 'dir /s'

!{LS} data

total 79684
-rw-r--r-- 1 root root 81593138 Mar 28 13:43 fadg0.zip


# Extract the zip file into the given folder.
import zipfile

# Open the archive read-only; the with-statement closes it afterwards.
with zipfile.ZipFile(filepath, 'r') as f:
    # Unpack every member under dpath (the directory that holds the zip).
    f.extractall(dpath)


! {LS} data

total 79688
drwxr-xr-x 4 root root     4096 Mar 28 13:43 fadg0
-rw-r--r-- 1 root root 81593138 Mar 28 13:43 fadg0.zip


! {LS} data/fadg0

total 8
drwxr-xr-x  2 root root 4096 Mar 28 13:43 audio
drwxr-xr-x 15 root root 4096 Mar 28 13:43 video


! {LS} data/fadg0/video

total 84
drwxr-xr-x 2 root root 12288 Mar 28 13:43 head
drwxr-xr-x 2 root root 12288 Mar 28 13:43 head2
drwxr-xr-x 2 root root 20480 Mar 28 13:43 head3
drwxr-xr-x 2 root root  4096 Mar 28 13:43 sa1
drwxr-xr-x 2 root root  4096 Mar 28 13:43 sa2
drwxr-xr-x 2 root root  4096 Mar 28 13:43 si1279
drwxr-xr-x 2 root root  4096 Mar 28 13:43 si1909
drwxr-xr-x 2 root root  4096 Mar 28 13:43 si649
drwxr-xr-x 2 root root  4096 Mar 28 13:43 sx109
drwxr-xr-x 2 root root  4096 Mar 28 13:43 sx19
drwxr-xr-x 2 root root  4096 Mar 28 13:43 sx199
drwxr-xr-x 2 root root  4096 Mar 28 13:43 sx289
drwxr-xr-x 2 root root  4096 Mar 28 13:43 sx379


# Get the paths of the image files all at once.
import os
import glob

# Directory whose entries are collected with glob further down.
DATA_DIR = './data/fadg0/video/head'


import re

def atoi(text):
    """Convert a string of decimal digits to ``int``; return anything else unchanged.

    ``str.isdecimal()`` is used instead of ``str.isdigit()`` because
    ``isdigit()`` also accepts characters such as superscript digits
    (for example ``'\u00b2'``) that ``int()`` cannot parse, which would
    raise ``ValueError``.

    Args:
        text: The string chunk to convert.

    Returns:
        ``int(text)`` when ``text`` is non-empty and consists only of
        decimal digits, otherwise ``text`` itself.
    """
    return int(text) if text.isdecimal() else text

def natural_keys(text):
    """Build a sort key for ``text`` from its digit and non-digit pieces.

    The string is split around runs of digits; the capturing group in the
    pattern keeps those digit runs in the result. Every piece is then
    passed through ``atoi``.

    Args:
        text: The string to build a key for.

    Returns:
        A list of the converted pieces, in their original order.
    """
    pieces = re.split(r'(\d+)', text)
    return list(map(atoi, pieces))


# Collect the entries with glob.glob and order them by file name; the key
# function makes the ordering aware of the numbers inside the names.
DATA_PATHS = glob.glob(os.path.join(DATA_DIR, '*'))
DATA_PATHS.sort(key=natural_keys)

print(len(DATA_PATHS))
print(DATA_PATHS[0])

346
./data/fadg0/video/head/001


# sample code 7-3
# Load an image file and convert it to a numpy array.

import numpy as np
import tensorflow as tf

# load_img() reads the first path in DATA_PATHS; np.array() converts the
# loaded image into a numpy array.
image_uint8 = np.array(tf.keras.preprocessing.image.load_img(DATA_PATHS[0]))
# Cast to float32 and divide by 255 (presumably mapping [0, 255] onto [0, 1]).
image = image_uint8.astype('float32') / 255.0


%matplotlib inline

import matplotlib.pyplot as plt
import numpy as np

# Single axes on a 6 x 6 figure.
fig, ax = plt.subplots(1,1,figsize=(6,6))
# Draw the float32 image and hide the axes.
ax.imshow(image)
ax.axis('off')

plt.show()


# sample code 7-4
# [0, 1] --> [-1, 1]
imageMP = 2 * image - 1

# [-1, 1] --> [0, 1]; clipping keeps the result inside [0.0, 1.0]
image2 = ((imageMP + 1) * 0.5).clip(0.0, 1.0)


# sample code 7-5
import tensorflow as tf

# Destination file for the saved image.
save_path = 'data/new_image.jpg'
# Write the image array to save_path with Keras' save_img().
tf.keras.preprocessing.image.save_img(save_path, image)

! {LS} {save_path}

-rw-r--r-- 1 root root 14875 Mar 28 13:43 data/new_image.jpg

matplotlib 入門 (7) nitta@tsuda.ac.jp

7章: 画像の保存・読み込み・表示

鉄則[7-1]: Numpy配列形式の画像データを表示するときは、グレースケール画像は[0,255]のuint8型配列に、カラー画像は[0,1]のfloat32型配列に変換してから、Axes.imshow() を適用する。

7-1: グレースケールの画像をプロットする (Axes.imshow())

7-2: カラー画像を表示する (Axes.imshow())

7-3 の準備: 画像ファイルをネットワークからダウンロードして展開する

7-3: ファイルから画像の読み込み

鉄則[7-2]: 画像ファイルから画像データを読み込む時は tensorflow.keras の下にある load_img() 関数を使う。

鉄則[7-3]: load_img() で読み込んだ画像データは PIL形式なので、ただちに Numpy Array に変換する。

鉄則[7-4]: 画像データをニューラルネットワークに通すときは、要素値の範囲が [0, 1] または [-1, 1] の 'float32' 型の Numpy 配列に変換する。

鉄則[7-5]: Numpy配列形式のカラー画像データを表示したり保存したりするときは、要素値の範囲が[0, 1] の'float32'型Numpy配列に変換する。

7-4: 画像データの要素値の範囲の変換

鉄則[7-6]: Numpy 配列形式の画像データをファイルに保存するときは tensorflow.keras の下にある save_img() 関数を使う。

7-5: 画像の保存