My machine learning model keeps predicting the wrong thing even though it has a high accuracy

Question

My model makes wrong predictions even though it reaches a high training accuracy, and I cannot work out why. It is supposed to classify malaria cell images as infected or not infected, but it does not seem to do that. The model was developed with a CNN using transfer learning.

from tensorflow.keras.layers import Input, Lambda, Dense, Flatten,Conv2D
from tensorflow.keras.models import Model
from tensorflow.keras.applications.vgg19 import VGG19
from tensorflow.keras.applications.resnet50 import preprocess_input
from tensorflow.keras.preprocessing import image
from tensorflow.keras.preprocessing.image import ImageDataGenerator,load_img
from tensorflow.keras.models import Sequential
import numpy as np
from glob import glob
import matplotlib.pyplot as plt

import tensorflow as tf
print(tf.__version__)

# Input shape fed to the network: 224 x 224 pixels with 3 colour channels.
IMAGE_SIZE = [224, 224, 3]

# Load the VGG19 convolutional base with ImageNet weights. include_top=False
# leaves out the original fully connected classifier so a new head can be
# attached further down.
# NOTE: despite its name, `mobilnet` holds a VGG19 network.
mobilnet = VGG19(
    weights='imagenet',
    include_top=False,
    input_shape=IMAGE_SIZE,
)

# Mount Google Drive so the dataset under /content/drive can be read
# (this only works inside Google Colab).
from google.colab import drive
drive.mount('/content/drive')

# Freeze the pretrained layers so their weights are not updated during training.
for layer in mobilnet.layers:
    layer.trainable = False

# Each entry matched under Train/ is counted as one class; the number of
# entries sets the size of the output layer.
# (Use 'Dataset/Train/*' instead when the dataset sits next to the script.)
folders = glob('/content/drive/MyDrive/Dataset/Train/*')

folders

# Classification head: flatten the feature maps of the base network and map
# them to one softmax probability per class folder.
flatten_layer = Flatten()
x = flatten_layer(mobilnet.output)

output_layer = Dense(len(folders), activation='softmax')
prediction = output_layer(x)

# Assemble the full network: base input -> new softmax output.
model = Model(inputs=mobilnet.input, outputs=prediction)

# Print a layer-by-layer overview of the network.
model.summary()

from tensorflow.keras.layers import MaxPooling2D

# Configure training: categorical cross-entropy loss (targets are one-hot),
# the Adam optimizer, and accuracy as the reported metric.
model.compile(
    optimizer='adam',
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)

# Use the Image Data Generator to import the images from the dataset
from tensorflow.keras.preprocessing.image import ImageDataGenerator

# Training images: scale pixels to [0, 1] and apply light augmentation
# (shear, zoom, horizontal flip).
train_datagen = ImageDataGenerator(
    rescale=1./255,
    shear_range=0.2,
    zoom_range=0.2,
    horizontal_flip=True,
)

# Test images: only the same [0, 1] scaling, no augmentation.
test_datagen = ImageDataGenerator(rescale=1./255)

# The target size must match the input size the network was built with.
# Labels are one-hot encoded ('categorical'), one class per sub-folder.
training_set = train_datagen.flow_from_directory(
    directory='/content/drive/MyDrive/Dataset/Train',
    target_size=(224, 224),
    batch_size=32,
    class_mode='categorical',
)

training_set

# shuffle=False keeps the test images in a fixed order, so the rows returned
# by model.predict(test_set) line up with test_set.classes and
# test_set.filenames. With the default (shuffle=True) they cannot be compared.
test_set = test_datagen.flow_from_directory(
    '/content/drive/MyDrive/Dataset/Test',
    target_size=(224, 224),
    batch_size=32,
    class_mode='categorical',
    shuffle=False,
)

test_set

# Import callbacks from tensorflow.keras, the same package the model is built
# with; mixing in the standalone `keras` package can lead to incompatible objects.
from tensorflow.keras.callbacks import ModelCheckpoint, EarlyStopping

# Simple early stopping on the validation loss. It is defined here but not
# passed to fit() below, so it currently has no effect.
es = EarlyStopping(monitor='val_loss', mode='min', verbose=1)

# Fit the model. This will take some time to execute.
# Model.fit accepts generators directly; fit_generator is deprecated.
r = model.fit(
    training_set,
    validation_data=test_set,
    epochs=20,
    steps_per_epoch=len(training_set),
    validation_steps=len(test_set),
    # callbacks=[es]
)



# Plot the training and validation loss per epoch.
# The figure is saved BEFORE plt.show(): once the figure has been shown it is
# released, and a later savefig() would write an empty image.
plt.figure()
plt.plot(r.history['loss'], label='train loss')
plt.plot(r.history['val_loss'], label='val loss')
plt.legend()
plt.savefig('LossVal_loss')
plt.show()

# Plot the training and validation accuracy per epoch on a fresh figure.
plt.figure()
plt.plot(r.history['accuracy'], label='train acc')
plt.plot(r.history['val_accuracy'], label='val acc')
plt.legend()
plt.savefig('AccVal_acc')
plt.show()

# Persist the trained network to disk in HDF5 format.
from tensorflow.keras.models import load_model

model.save('model_vgg19.h5')

# Run the network over the whole test generator.
# NOTE(review): the rows follow the order in which test_set yields its
# batches; if that generator shuffles, they cannot be matched to
# test_set.classes.
y_pred = model.predict(test_set)

y_pred

import numpy as np

# Reduce each row of class scores to the index of the highest-scoring class.
y_pred = y_pred.argmax(axis=1)

y_pred

print(y_pred.shape)



from tensorflow.keras.models import load_model
from tensorflow.keras.preprocessing import image

# Reload the trained network from disk.
model = load_model('model_vgg19.h5')

# Load one image at the resolution the network was built for.
img = image.load_img(
    '/content/drive/MyDrive/Dataset/Train/Parasite/C111.png',
    target_size=(224, 224),
)

x = image.img_to_array(img)
x

x.shape

# Scale pixels to [0, 1], exactly as the data generators did (rescale=1./255).
x = x / 255

# Add the leading batch dimension the model expects.
x = np.expand_dims(x, axis=0)

# Do NOT call preprocess_input here. The imported function belongs to ResNet50
# (channel reordering plus ImageNet mean subtraction on 0-255 inputs). Applying
# it to an already rescaled image gives the network inputs unlike anything it
# saw during training, which makes the prediction meaningless even though the
# training accuracy is high.
image_data = x

print(image_data.shape)

# Predict once and reuse the result.
probabilities = model.predict(image_data)
probabilities

a = np.argmax(probabilities, axis=1)

print(a)

# NOTE(review): this assumes class index 1 is the uninfected class.
# flow_from_directory assigns indices from the sorted folder names; confirm
# the mapping with training_set.class_indices.
if a[0] == 1:
    print("Not infected")
else:
    print("Infected")

My machine learning model keeps predicting the wrong thing even though it has a high accuracy

Answers (1)

Related Questions