distinguish dog and cat 본문


distinguish dog and cat

givemebro 2020. 6. 9. 14:38
import os
import zipfile


# data set

# Unzip the archive. The context manager closes the zip file handle as soon
# as extraction finishes, or if it raises.
local_zip = 'C:/Users/givemebro/jupyter notebook/cats_and_dogs_filtered.zip'
with zipfile.ZipFile(local_zip, 'r') as zip_ref:
    zip_ref.extractall('C:/Users/givemebro/jupyter notebook')


# data set

# Root of the extracted archive, plus its training and validation splits.
base_dir = 'C:/Users/givemebro/jupyter notebook/cats_and_dogs_filtered'
train_dir, validation_dir = (
    os.path.join(base_dir, split) for split in ('train', 'validation')
)

# Per-class picture folders (cats, dogs) inside the training split.
train_cats_dir, train_dogs_dir = (
    os.path.join(train_dir, label) for label in ('cats', 'dogs')
)

# Per-class picture folders (cats, dogs) inside the validation split.
validation_cats_dir, validation_dogs_dir = (
    os.path.join(validation_dir, label) for label in ('cats', 'dogs')
)


# file name check

# os.listdir() returns entries in arbitrary order, so sort the names to keep
# the previews and any slices taken from these lists reproducible.
train_cat_fnames = sorted(os.listdir(train_cats_dir))
print(train_cat_fnames[:10])

train_dog_fnames = sorted(os.listdir(train_dogs_dir))
print(train_dog_fnames[:10])
['cat.0.jpg', 'cat.1.jpg', 'cat.10.jpg', 'cat.100.jpg', 'cat.101.jpg', 'cat.102.jpg', 'cat.103.jpg', 'cat.104.jpg', 'cat.105.jpg', 'cat.106.jpg']
['dog.0.jpg', 'dog.1.jpg', 'dog.10.jpg', 'dog.100.jpg', 'dog.101.jpg', 'dog.102.jpg', 'dog.103.jpg', 'dog.104.jpg', 'dog.105.jpg', 'dog.106.jpg']


# check number of cat and dog images in train and validation

# Report how many entries each of the four class folders holds.
for caption, folder in (
    ('total training cat images:', train_cats_dir),
    ('total training dog images:', train_dogs_dir),
    ('total validation cat images:', validation_cats_dir),
    ('total validation dog images:', validation_dogs_dir),
):
    print(caption, len(os.listdir(folder)))
total training cat images: 1000
total training dog images: 1000
total validation cat images: 500
total validation dog images: 500



%matplotlib inline

import matplotlib.pyplot as plt
import matplotlib.image as mpimg

# Parameters for our graph; we'll output images in a 4x4 configuration
nrows = 4
ncols = 4

# Index for iterating over images
pic_index = 0

# Set up matplotlib fig, and size it to fit 4x4 pics
fig = plt.gcf()
fig.set_size_inches(ncols * 4, nrows * 4)

# Pick 8 cat and 8 dog pictures: file names pic_index-8 .. pic_index-1
pic_index += 8
next_cat_pix = [os.path.join(train_cats_dir, fname)
                for fname in train_cat_fnames[pic_index - 8:pic_index]]
next_dog_pix = [os.path.join(train_dogs_dir, fname)
                for fname in train_dog_fnames[pic_index - 8:pic_index]]

for i, img_path in enumerate(next_cat_pix + next_dog_pix):
    # Set up subplot; subplot indices start at 1
    sp = plt.subplot(nrows, ncols, i + 1)
    sp.axis('Off')  # Don't show axes (or gridlines)

    img = mpimg.imread(img_path)
    # Draw the loaded picture into the current subplot; without this the
    # grid stays empty.
    plt.imshow(img)

plt.show()


Data set preparation finished.

from tensorflow.keras import layers
from tensorflow.keras import Model


# Our input feature map is 150x150x3: 150x150 for the image pixels, and 3 for
# the three color channels: R, G, and B
img_input = layers.Input(shape=(150, 150, 3))

# First convolution extracts 16 filters that are 3x3
# Convolution is followed by max-pooling layer with a 2x2 window
x = layers.Conv2D(16, 3, activation='relu')(img_input)
x = layers.MaxPooling2D(2)(x)

# Second convolution extracts 32 filters that are 3x3
# Convolution is followed by max-pooling layer with a 2x2 window
x = layers.Conv2D(32, 3, activation='relu')(x)
x = layers.MaxPooling2D(2)(x)

# Third convolution extracts 64 filters that are 3x3
# Convolution is followed by max-pooling layer with a 2x2 window
x = layers.Conv2D(64, 3, activation='relu')(x)
x = layers.MaxPooling2D(2)(x)


# Flatten feature map to a 1-dim tensor so we can add fully connected layers
x = layers.Flatten()(x)

# Create a fully connected layer with ReLU activation and 512 hidden units
x = layers.Dense(512, activation='relu')(x)

# Create output layer with a single node and sigmoid activation
output = layers.Dense(1, activation='sigmoid')(x)

# Create model:
# input = input feature map
# output = input feature map + stacked convolution/maxpooling layers + fully
# connected layer + sigmoid output layer
model = Model(img_input, output)

# Print the layer-by-layer output shapes and parameter counts
model.summary()


Layer (type)                 Output Shape              Param #   
input_1 (InputLayer)         (None, 150, 150, 3)       0         
conv2d (Conv2D)              (None, 148, 148, 16)      448       
max_pooling2d (MaxPooling2D) (None, 74, 74, 16)        0         
conv2d_1 (Conv2D)            (None, 72, 72, 32)        4640      
max_pooling2d_1 (MaxPooling2 (None, 36, 36, 32)        0         
conv2d_2 (Conv2D)            (None, 34, 34, 64)        18496     
max_pooling2d_2 (MaxPooling2 (None, 17, 17, 64)        0         
flatten (Flatten)            (None, 18496)             0         
dense (Dense)                (None, 512)               9470464   
dense_1 (Dense)              (None, 1)                 513       
Total params: 9,494,561
Trainable params: 9,494,561
Non-trainable params: 0


from tensorflow.keras.optimizers import RMSprop

from tensorflow.keras.preprocessing.image import ImageDataGenerator

# All images will be rescaled by 1./255
train_datagen = ImageDataGenerator(rescale=1./255)
val_datagen = ImageDataGenerator(rescale=1./255)

# Flow training images in batches of 20 using train_datagen generator
train_generator = train_datagen.flow_from_directory(
        train_dir,  # This is the source directory for training images
        target_size=(150, 150),  # All images will be resized to 150x150
        batch_size=20,
        # Since we use binary_crossentropy loss, we need binary labels
        class_mode='binary')

# Flow validation images in batches of 20 using val_datagen generator
validation_generator = val_datagen.flow_from_directory(
        validation_dir,  # This is the source directory for validation images
        target_size=(150, 150),
        batch_size=20,
        class_mode='binary')
Found 2000 images belonging to 2 classes.
Found 1000 images belonging to 2 classes.

# The model must be compiled before it can be trained. Binary cross-entropy
# matches the single sigmoid output, and the metric is named 'acc' so the
# history exposes the 'acc' / 'val_acc' keys.
# The learning rate is passed positionally because the keyword is `lr` in
# older Keras releases and `learning_rate` in newer ones.
model.compile(loss='binary_crossentropy',
              optimizer=RMSprop(0.001),
              metrics=['acc'])

# NOTE(review): recent TensorFlow releases deprecate fit_generator in favour
# of model.fit, which accepts generators directly - switch when upgrading.
history = model.fit_generator(
      train_generator,
      steps_per_epoch=100,  # 2000 images = batch_size * steps
      epochs=15,
      validation_data=validation_generator,
      validation_steps=50,  # 1000 images = batch_size * steps
      verbose=2)  # one summary line per epoch
Epoch 1/15
 - 87s - loss: 4.1684 - acc: 0.5250 - val_loss: 0.6708 - val_acc: 0.6630
Epoch 2/15
 - 88s - loss: 0.6557 - acc: 0.6450 - val_loss: 0.5845 - val_acc: 0.6770
Epoch 3/15
 - 86s - loss: 0.5740 - acc: 0.7045 - val_loss: 0.5643 - val_acc: 0.7120
Epoch 4/15
 - 87s - loss: 0.5069 - acc: 0.7615 - val_loss: 0.5709 - val_acc: 0.7170
Epoch 5/15
 - 77s - loss: 0.4349 - acc: 0.7870 - val_loss: 0.5861 - val_acc: 0.7290
Epoch 6/15
 - 89s - loss: 0.3529 - acc: 0.8460 - val_loss: 0.6678 - val_acc: 0.7160
Epoch 7/15
 - 106s - loss: 0.2958 - acc: 0.8770 - val_loss: 0.6121 - val_acc: 0.7420
Epoch 8/15
 - 111s - loss: 0.2056 - acc: 0.9190 - val_loss: 0.7415 - val_acc: 0.7120
Epoch 9/15
 - 113s - loss: 0.1480 - acc: 0.9455 - val_loss: 0.8736 - val_acc: 0.7240
Epoch 10/15
 - 96s - loss: 0.1341 - acc: 0.9560 - val_loss: 1.5144 - val_acc: 0.6490
Epoch 11/15
 - 90s - loss: 0.0767 - acc: 0.9785 - val_loss: 1.1448 - val_acc: 0.7140
Epoch 12/15
 - 85s - loss: 0.0780 - acc: 0.9795 - val_loss: 1.2964 - val_acc: 0.7290
Epoch 13/15
 - 85s - loss: 0.0451 - acc: 0.9860 - val_loss: 1.6336 - val_acc: 0.7100
Epoch 14/15
 - 87s - loss: 0.0485 - acc: 0.9840 - val_loss: 1.6253 - val_acc: 0.7060
Epoch 15/15
 - 85s - loss: 0.0973 - acc: 0.9820 - val_loss: 3.0956 - val_acc: 0.6010


import numpy as np
import random
from tensorflow.keras.preprocessing.image import img_to_array, load_img

# Let's define a new Model that will take an image as input, and will output
# intermediate representations for all layers in the previous model after
# the first.
visualized_layers = model.layers[1:]
successive_outputs = [layer.output for layer in visualized_layers]
visualization_model = Model(img_input, successive_outputs)

# Let's prepare a random input image of a cat or dog from the training set.
cat_img_files = [os.path.join(train_cats_dir, f) for f in train_cat_fnames]
dog_img_files = [os.path.join(train_dogs_dir, f) for f in train_dog_fnames]
img_path = random.choice(cat_img_files + dog_img_files)

img = load_img(img_path, target_size=(150, 150))  # this is a PIL image
x = img_to_array(img)  # Numpy array with shape (150, 150, 3)
x = x.reshape((1,) + x.shape)  # Numpy array with shape (1, 150, 150, 3)

# Rescale by 1/255
x /= 255

# Let's run our image through our network, thus obtaining all
# intermediate representations for this image.
successive_feature_maps = visualization_model.predict(x)

# Names of exactly the layers whose outputs were collected (the input layer
# is skipped), so each name lines up with its feature map in the zip below.
layer_names = [layer.name for layer in visualized_layers]

# Now let's display our representations
for layer_name, feature_map in zip(layer_names, successive_feature_maps):
    if len(feature_map.shape) == 4:
        # Just do this for the conv / maxpool layers, not the
        # fully-connected layers
        n_features = feature_map.shape[-1]  # number of features in feature map
        # The feature map has shape (1, size, size, n_features)
        size = feature_map.shape[1]
        # We will tile our images in this matrix
        display_grid = np.zeros((size, size * n_features))
        for i in range(n_features):
            # Postprocess the feature to make it visually palatable
            channel = feature_map[0, :, :, i]
            channel -= channel.mean()
            spread = channel.std()
            # A constant channel has zero spread; skip the division so it
            # renders as flat mid-gray instead of NaN.
            if spread > 0:
                channel /= spread
            channel *= 64
            channel += 128
            channel = np.clip(channel, 0, 255).astype('uint8')
            # We'll tile each filter into this big horizontal grid
            display_grid[:, i * size:(i + 1) * size] = channel
        # Display the grid
        scale = 20. / n_features
        plt.figure(figsize=(scale * n_features, scale))
        plt.title(layer_name)
        plt.grid(False)
        plt.imshow(display_grid, aspect='auto', cmap='viridis')

# Retrieve a list of accuracy results on training and validation data
# sets for each training epoch
acc = history.history['acc']
val_acc = history.history['val_acc']

# Retrieve a list of loss results on training and validation data
# sets for each training epoch
loss = history.history['loss']
val_loss = history.history['val_loss']

# Get number of epochs
epochs = range(len(acc))

# Plot training and validation accuracy per epoch
plt.plot(epochs, acc, label='training')
plt.plot(epochs, val_acc, label='validation')
plt.title('Training and validation accuracy')
plt.legend()

# Start a new figure so the loss curves are not drawn on top of the accuracy
# curves and the second title does not overwrite the first.
plt.figure()

# Plot training and validation loss per epoch
plt.plot(epochs, loss, label='training')
plt.plot(epochs, val_loss, label='validation')
plt.title('Training and validation loss')
plt.legend()


