# test_preprocess_encode.py

#Simple unit tests covering preprocess_data.py, encode_image.py, vgg16.py and imagenet_utils.py

import pytest

from preprocess_data import preprocessing
from vgg16 import VGG16
from encode_image import model_gen,encodings
from imagenet_utils import preprocess_input as i_preprocess_input

import os
import numpy as np
from keras import backend as K
from keras.preprocessing import image
from keras.applications.imagenet_utils import preprocess_input as k_preprocess_input #distinguish from imagenet_utils.preprocess_input!


# Dataset locations, given as paths relative to the directory the tests run from.
captions_folder = "Flickr8K_Text"  # trainimgs.txt / testimgs.txt are read from here
image_folder = "Flickr8K_Data"  # directory containing the example image
test_image = "3666056567_661e25f54c.jpg"  # file name of the example image inside image_folder


@pytest.fixture(scope='function')
def load_example_image(request):
	'''
	Load the example image as a batch of one, resized to 224x224.

	The fixture is function-scoped on purpose: the returned array is mutable
	and the tests feed it to preprocessing routines that may modify their
	input in place. A wider scope would let one test's modifications leak
	into the next, making results depend on test order and selection.

	Returns:
		numpy array holding the image with a leading batch axis of length 1.
	'''
	img=image.load_img(os.path.join(image_folder,test_image),target_size=(224,224))
	x=image.img_to_array(img)
	#Add the batch axis expected by the models.
	x=np.expand_dims(x,axis=0)
	return x

def test_preprocess():
	'''
	Wherein we test preprocess_data.preprocessing(). We check whether the number
	of test/training examples as well as the 42nd entries of both output files,
	trainimgs.txt and testimgs.txt, agree with the truth.
	'''
	preprocessing()

	def read_lines(filename):
		#Read inside a context manager so the file handle is closed right away
		#instead of being left for the garbage collector.
		with open(os.path.join(captions_folder,filename),'r') as handle:
			return handle.read().split('\n')

	train_captions=read_lines('trainimgs.txt')
	test_captions=read_lines('testimgs.txt')

	#Splitting on '\n' yields one stray empty string after the final newline,
	#hence the expected lengths are one more than the number of captions.
	assert len(train_captions)==30001
	assert len(test_captions)==5001

	assert train_captions[42]=='2638369467_8fc251595b.jpg\t<start> A smiling young girl in braids is playing ball . <end>'
	assert test_captions[42]=='280706862_14c30d734a.jpg\t<start> A black dog on a beach carrying a ball in its mouth . <end>'

@pytest.mark.slow
def test_vgg16(load_example_image):
	'''
	Wherein we test vgg16.py. We create the model, load a test image, perform the
	encoding, and test the result for correct shape, correct number of nonzero
	entries, correct first 100 entries.
	'''

	model=VGG16(include_top=True,weights='imagenet')

	#Preprocess a copy: the preprocessing routine may modify its argument in
	#place, and the fixture array must stay pristine for other tests.
	x=k_preprocess_input(load_example_image.copy())

	preds=model.predict(x)

	#Reference values: the first 100 entries of the encoding of the test image.
	vgg16_pred_slice=np.array([0,0,0,0,6.281284,0,0,0,0,0.3895438,0,0,1.1056916,0,0,1.7175925,0,1.8917649,0,0,1.7590455,6.602196,0.43233678,0.4528695,0,3.6373415,3.5424447,2.4427955,0,0,3.206093,2.5562162,0,0,2.2278,0,3.2318673,2.3519747,0,6.4740357,0,2.8249745,0,0,9.216705,0,0,0,2.835004,2.1258173,2.2908218,1.0856905,2.6308882,0.91681635,0,0,0,0,0,0,0.40301943,0,0,0,3.2203531,0.2024988,0,0,0,0,0,0,1.2414606,0,0,0,1.2453537,0,4.912657,0,4.361135,0,0,0,0,0,0,0,2.4128122,0.68293965,0.7010477,1.3694913,1.7609701,0,0,0,0,0,0,0,])
	assert x.shape==(1,224,224,3)
	assert preds.shape==(1,4096)
	assert np.count_nonzero(preds[0])==1368
	np.testing.assert_allclose(preds[0,:100],vgg16_pred_slice,err_msg='VGG16 encoding yielded wrong encoding for test image!')

def test_utils_preprocessing(load_example_image):
	'''
	Wherein we test imagenet_utils.preprocess_input(), which is slightly
	different from keras.applications.imagenet_utils.preprocess_input. We check
	that, once the flip of the colour channels is undone, every channel differs
	from the untouched image by a constant value.
	'''

	dim_ordering=K.image_dim_ordering()
	assert dim_ordering in ['tf','th']

	#Keep an untouched reference and hand a separate copy to the routine under
	#test, so that neither the reference nor the fixture array is modified
	#should the routine work in place.
	x_pre=load_example_image.copy()
	x=i_preprocess_input(x_pre.copy())

	if dim_ordering=='th':
		#channels on axis 1: BGR -> RGB
		x=x[ :, ::-1, :, : ]
		diff=x-x_pre

		colR=diff[ :, 0, :, : ]
		colG=diff[ :, 1, :, : ]
		colB=diff[ :, 2, :, : ]
	else:
		#channels on axis 3: BGR -> RGB
		x=x[ :, :, :, ::-1 ]
		diff=x-x_pre

		colR=diff[ :, :, :, 0 ]
		colG=diff[ :, :, :, 1 ]
		colB=diff[ :, :, :, 2 ]

	np.testing.assert_allclose(colR,-103.939)
	np.testing.assert_allclose(colG,-116.779)
	#The expected offset is -123.68. Writing it as "-123,68" would pass 68 as
	#the relative tolerance and make this check pass for almost any value.
	np.testing.assert_allclose(colB,-123.68)


@pytest.mark.slow
def test_encodings():
	'''
	Exercise encode_image.encodings() on the example image.

	The model comes from model_gen() and is handed to encodings() together with
	the path of the test image. As in test_vgg16(), the result is checked for
	its shape, its number of nonzero entries and its first 100 values. The
	reference values are not the same as in test_vgg16().
	'''
	image_path=os.path.join(image_folder,test_image)
	encoder=model_gen()
	preds=encodings(model=encoder,path=image_path)

	#Reference values: the first 100 entries of the expected encoding.
	encoding_pred_slice=np.array([0,0,0,0,6.943786,0,0,0,0,0.495808,0,0,1.2099614,0,0,1.9550853,0,2.5830698,0,0,1.5520213,6.7467823,0.30691597,0.6208435,0,3.8465405,3.7862554,2.3970299,0,0,3.5254822,2.7294598,0,0,2.7226853,0,3.2338202,2.3976898,0,6.3592043,0,2.7090664,0,0,10.004378,0,0,0,3.0425727,2.0538316,1.8156273,0.15581878,2.3381875,0.88823074,0,0,0,0,0,0,0.036334604,0,0,0,3.5556676,0.29299664,0,0,0,0,0,0,1.0033253,0,0,0,0.96017045,0,5.8062425,0,4.4312,0,0,0,0,0,0,0,2.7901797,0.5715834,0.76234996,1.7294867,1.2244358,0,0,0,0,0,0,0,])

	expected_shape=(4096,)
	assert preds.shape==expected_shape

	nonzero_entries=np.count_nonzero(preds)
	assert nonzero_entries==1351

	leading_values=preds[:100]
	np.testing.assert_allclose(leading_values,encoding_pred_slice,err_msg='encoding wrapper yielded wrong encoding for test image!')