hcl14/infer.py

## infer.py
# Create dataset of labels and predictions for the model from https://github.com/idealo/image-quality-assessment/
# Use tensorflow >= 1.10.0 to load this model. I had weird errors.

from os import path
import numpy as np
import pandas as pd
import cv2

from keras.preprocessing.image import load_img
from keras.preprocessing.image import img_to_array

import keras
from keras import backend as K
from keras.models import Model
from keras.layers import Dense, Dropout, Concatenate, Flatten
import tensorflow as tf

from scipy.io import savemat


base_model = keras.applications.mobilenet.MobileNet((224, 224, 3), pooling='avg', include_top=False, weights=None)
x = Dropout(0.75)(base_model.output)
x = Dense(10, activation='softmax')(x)

model = Model(inputs=base_model.input, outputs=x)

model.load_weights(path.join(path.dirname(path.abspath(__file__)),'models/MobileNet/weights_mobilenet_aesthetic_0.07.hdf5'))

print(model.summary())

print('loaded model')

'''
# Normalize according to ImageNet
IMAGE_NET_MEAN = [0.485, 0.456, 0.406]
IMAGE_NET_STD = [0.229, 0.224, 0.225]
# for each channel do input[channel] = (input[channel] - mean[channel]) / std[channel
def normalize_img(img):
    img /= 255.
    for channel in range(3):
        mean = IMAGE_NET_MEAN[channel]
        std = IMAGE_NET_STD[channel]
        img[:,:, channel] = (img[:,:, channel] - mean)/std

    return img
'''
# store elements of distribution to compute means, etc
dist_values = np.array([1,2,3,4,5,6,7,8,9,10], dtype=np.float32)
dist_values = np.expand_dims(dist_values, -1)

def mean_std(x):
    mean = x.dot(dist_values)
    # sqrt( E(X^2) - (E(X))^2 )
    return mean, np.sqrt(x.dot(dist_values**2) - mean**2 )


# predict scores  - use this function to evaluate your images
def test_inference(filename, model=model):
    # load an image in PIL format
    original = load_img(filename, target_size=(224, 224))
    numpy_image = img_to_array(original)

    numpy_image_n = keras.applications.mobilenet.preprocess_input(numpy_image.copy())

    # (1, 224, 224, 3)
    image_batch = np.expand_dims(numpy_image_n, axis=0)

    # get the predicted probabilities for each class
    predictions = model.predict(image_batch)

    mean, std = mean_std(predictions)

    return mean, std, predictions


import json

with open('data/AVA/ava_labels_test.json', 'r') as f:
    data = json.load(f)

label_test = []
for value in data:
    label_test.append([value["image_id"]]+value["label"])

label_test = np.array(label_test, dtype=float)
# normalize histograms
histograms = label_test[:,1:]
histograms /=  histograms.sum(axis=1)[:,np.newaxis]

# First column is id, other 10 - histogram
label_test[:,1:] = histograms

data_path = '../../datasets/AVA_dataset/images/images'


labels_good = []
predictions = []
mean_predictions = []
std_predictions = []

for idx, image_id in enumerate(label_test[:,0]):
    filename = data_path +'/' + str(int(image_id)) + '.jpg'
    try:
        mean, std, pred = test_inference(filename)
    except:
        continue

    labels_good.append(label_test[idx])
    predictions.append(pred)

    mean_predictions.append(mean)
    std_predictions.append(std)

    if idx%100==0:
        print(idx)
        print(pred)


labels_good = np.array(labels_good)
predictions = np.array(predictions)
mean_predictions = np.array(mean_predictions)
std_predictions = np.array(std_predictions)

savemat('wtf.mat', {'labels':labels_good, 'predictions':predictions, 'mean_predictions':mean_predictions, 'std_predictions':std_predictions})


dist_values = np.array([1,2,3,4,5,6,7,8,9,10], dtype=np.float32)
dist_values = np.expand_dims(dist_values, -1)
gt_means = labels_good[:,1:].dot(dist_values)
# predicted x actual
confusion_matrix = np.zeros(shape=(10,10), dtype=int)
for idx, value in enumerate(gt_means):
    confusion_matrix[int(mean_predictions[idx])-1][int(value)-1] += 1
print(confusion_matrix)

## plot_result.py
# print confusion matrices and build histograms

import numpy as np
import pandas as pd
import matplotlib.pyplot as plt

import random


import pickle

from scipy.io import loadmat
from scipy.stats import pearsonr, spearmanr

data = loadmat('data.mat')

label_np = np.squeeze(np.array(data['labels']))
predictions = np.squeeze(data['predictions'])

histograms = label_np[:,1:]
histograms /=  histograms.sum(axis=1)[:,np.newaxis]

# First column is id, other 10 - histogram
label_np[:,1:] = histograms

print('Got labels: {}'.format(len(label_np)))


rough_total_hist = np.sum(histograms, axis=0)

rough_total_hist /= np.sum(rough_total_hist)


# load predicitons
import pickle

#with open('model_predictions_oversample.pickle', 'rb') as handle:
#    predictions = pickle.load(handle)

# precise mean score distriburtion

dist_values = np.array([1,2,3,4,5,6,7,8,9,10], dtype=np.float32)
dist_values = np.expand_dims(dist_values, -1)

mean_scores = histograms.dot(dist_values)
mean_scores_predicted = predictions.dot(dist_values)

confusion_matrix = np.zeros(shape=(10,10), dtype=int)

acc = []
diffs = []
for idx, value in enumerate(mean_scores):
    confusion_matrix[int(mean_scores_predicted[idx])-1][int(value)-1] += 1
    acc.append(1. - np.abs(mean_scores_predicted[idx] - value)/value)
    diffs.append(np.abs(mean_scores_predicted[idx] - value))


print(confusion_matrix)
print('accuracy:{}'.format(np.mean(acc)))
print('standard deviation of score differences:{}'.format(np.std(diffs)))
print('LCC: {}'.format(pearsonr(mean_scores_predicted.ravel(), mean_scores.ravel())))
print('SRCC: {}'.format(spearmanr(mean_scores_predicted.ravel(), mean_scores.ravel())))

print('random shuffle:')

np.random.shuffle(mean_scores_predicted)
confusion_matrix = np.zeros(shape=(10,10), dtype=int)

acc = []
diffs = []
for idx, value in enumerate(mean_scores):
    confusion_matrix[int(mean_scores_predicted[idx])-1][int(value)-1] += 1
    acc.append(1. - np.abs(mean_scores_predicted[idx] - value)/value)
    diffs.append(np.abs(mean_scores_predicted[idx] - value))


print(confusion_matrix)
print('accuracy:{}'.format(np.mean(acc)))
print('standard deviation of score differences:{}'.format(np.std(diffs)))
print('LCC: {}'.format(pearsonr(mean_scores_predicted.ravel(), mean_scores.ravel())))
print('SRCC: {}'.format(spearmanr(mean_scores_predicted.ravel(), mean_scores.ravel())))


plt.subplot(1, 2, 1)
out1 = plt.hist(mean_scores, 100, density=0, facecolor='green', alpha=0.5, range=(1,10))
out2 = plt.hist(mean_scores_predicted, 100, density=0, facecolor='red', alpha=0.5, range=(1,10))
plt.xticks(np.arange(1, 10, 1))

plt.xlabel('Scores')
plt.ylabel('No of images')
plt.title('Precise histogram of mean scores')
plt.grid(True)


# precise histogram of standard deviations

def std_dev(x):
    mean = x.dot(dist_values)

    # sqrt( E(X^2) - (E(X))^2 )
    return np.sqrt( x.dot(dist_values**2) - mean**2  )


std_devs = np.array(list(map(std_dev, histograms)))
std_predicted = np.array(list(map(std_dev, predictions)))


plt.subplot(1, 2, 2)
plt.hist(std_devs, 100, density=0, facecolor='green', alpha=0.5, range=(0,2.5))
plt.hist(std_predicted, 100, density=0, facecolor='red', alpha=0.5, range=(0,2.5))
plt.xticks(np.arange(0, 2.5, 0.5))

plt.xlabel('Scores')
plt.ylabel('No of images')
plt.title('Precise histogram of std devs')
plt.grid(True)

plt.show()


## wtf.mat

      
    Raw
  

              wtf.mat
            
          
      This file has been truncated, but you can view the full file.
    

            View raw
	# Create dataset of labels and predictions for the model from https://github.com/idealo/image-quality-assessment/
	# Use tensorflow >= 1.10.0 to load this model. I had weird errors.

	from os import path
	import numpy as np
	import pandas as pd
	import cv2

	from keras.preprocessing.image import load_img
	from keras.preprocessing.image import img_to_array

	import keras
	from keras import backend as K
	from keras.models import Model
	from keras.layers import Dense, Dropout, Concatenate, Flatten
	import tensorflow as tf

	from scipy.io import savemat


	base_model = keras.applications.mobilenet.MobileNet((224, 224, 3), pooling='avg', include_top=False, weights=None)
	x = Dropout(0.75)(base_model.output)
	x = Dense(10, activation='softmax')(x)

	model = Model(inputs=base_model.input, outputs=x)

	model.load_weights(path.join(path.dirname(path.abspath(__file__)),'models/MobileNet/weights_mobilenet_aesthetic_0.07.hdf5'))

	print(model.summary())

	print('loaded model')

	'''
	# Normalize according to ImageNet
	IMAGE_NET_MEAN = [0.485, 0.456, 0.406]
	IMAGE_NET_STD = [0.229, 0.224, 0.225]
	# for each channel do input[channel] = (input[channel] - mean[channel]) / std[channel
	def normalize_img(img):
	img /= 255.
	for channel in range(3):
	mean = IMAGE_NET_MEAN[channel]
	std = IMAGE_NET_STD[channel]
	img[:,:, channel] = (img[:,:, channel] - mean)/std

	return img
	'''
	# store elements of distribution to compute means, etc
	dist_values = np.array([1,2,3,4,5,6,7,8,9,10], dtype=np.float32)
	dist_values = np.expand_dims(dist_values, -1)

	def mean_std(x):
	mean = x.dot(dist_values)
	# sqrt( E(X^2) - (E(X))^2 )
	return mean, np.sqrt(x.dot(dist_values2) - mean2 )


	# predict scores - use this function to evaluate your images
	def test_inference(filename, model=model):
	# load an image in PIL format
	original = load_img(filename, target_size=(224, 224))
	numpy_image = img_to_array(original)

	numpy_image_n = keras.applications.mobilenet.preprocess_input(numpy_image.copy())

	# (1, 224, 224, 3)
	image_batch = np.expand_dims(numpy_image_n, axis=0)

	# get the predicted probabilities for each class
	predictions = model.predict(image_batch)

	mean, std = mean_std(predictions)

	return mean, std, predictions



	import json

	with open('data/AVA/ava_labels_test.json', 'r') as f:
	data = json.load(f)

	label_test = []
	for value in data:
	label_test.append([value["image_id"]]+value["label"])

	label_test = np.array(label_test, dtype=float)
	# normalize histograms
	histograms = label_test[:,1:]
	histograms /= histograms.sum(axis=1)[:,np.newaxis]

	# First column is id, other 10 - histogram
	label_test[:,1:] = histograms

	data_path = '../../datasets/AVA_dataset/images/images'



	labels_good = []
	predictions = []
	mean_predictions = []
	std_predictions = []

	for idx, image_id in enumerate(label_test[:,0]):
	filename = data_path +'/' + str(int(image_id)) + '.jpg'
	try:
	mean, std, pred = test_inference(filename)
	except:
	continue

	labels_good.append(label_test[idx])
	predictions.append(pred)

	mean_predictions.append(mean)
	std_predictions.append(std)

	if idx%100==0:
	print(idx)
	print(pred)


	labels_good = np.array(labels_good)
	predictions = np.array(predictions)
	mean_predictions = np.array(mean_predictions)
	std_predictions = np.array(std_predictions)

	savemat('wtf.mat', {'labels':labels_good, 'predictions':predictions, 'mean_predictions':mean_predictions, 'std_predictions':std_predictions})


	dist_values = np.array([1,2,3,4,5,6,7,8,9,10], dtype=np.float32)
	dist_values = np.expand_dims(dist_values, -1)
	gt_means = labels_good[:,1:].dot(dist_values)
	# predicted x actual
	confusion_matrix = np.zeros(shape=(10,10), dtype=int)
	for idx, value in enumerate(gt_means):
	confusion_matrix[int(mean_predictions[idx])-1][int(value)-1] += 1
	print(confusion_matrix)
	# print confusion matrices and build histograms

	import numpy as np
	import pandas as pd
	import matplotlib.pyplot as plt

	import random


	import pickle

	from scipy.io import loadmat
	from scipy.stats import pearsonr, spearmanr

	data = loadmat('data.mat')

	label_np = np.squeeze(np.array(data['labels']))
	predictions = np.squeeze(data['predictions'])

	histograms = label_np[:,1:]
	histograms /= histograms.sum(axis=1)[:,np.newaxis]

	# First column is id, other 10 - histogram
	label_np[:,1:] = histograms

	print('Got labels: {}'.format(len(label_np)))


	rough_total_hist = np.sum(histograms, axis=0)

	rough_total_hist /= np.sum(rough_total_hist)


	# load predicitons
	import pickle

	#with open('model_predictions_oversample.pickle', 'rb') as handle:
	# predictions = pickle.load(handle)

	# precise mean score distriburtion

	dist_values = np.array([1,2,3,4,5,6,7,8,9,10], dtype=np.float32)
	dist_values = np.expand_dims(dist_values, -1)

	mean_scores = histograms.dot(dist_values)
	mean_scores_predicted = predictions.dot(dist_values)

	confusion_matrix = np.zeros(shape=(10,10), dtype=int)

	acc = []
	diffs = []
	for idx, value in enumerate(mean_scores):
	confusion_matrix[int(mean_scores_predicted[idx])-1][int(value)-1] += 1
	acc.append(1. - np.abs(mean_scores_predicted[idx] - value)/value)
	diffs.append(np.abs(mean_scores_predicted[idx] - value))


	print(confusion_matrix)
	print('accuracy:{}'.format(np.mean(acc)))
	print('standard deviation of score differences:{}'.format(np.std(diffs)))
	print('LCC: {}'.format(pearsonr(mean_scores_predicted.ravel(), mean_scores.ravel())))
	print('SRCC: {}'.format(spearmanr(mean_scores_predicted.ravel(), mean_scores.ravel())))

	print('random shuffle:')

	np.random.shuffle(mean_scores_predicted)
	confusion_matrix = np.zeros(shape=(10,10), dtype=int)

	acc = []
	diffs = []
	for idx, value in enumerate(mean_scores):
	confusion_matrix[int(mean_scores_predicted[idx])-1][int(value)-1] += 1
	acc.append(1. - np.abs(mean_scores_predicted[idx] - value)/value)
	diffs.append(np.abs(mean_scores_predicted[idx] - value))


	print(confusion_matrix)
	print('accuracy:{}'.format(np.mean(acc)))
	print('standard deviation of score differences:{}'.format(np.std(diffs)))
	print('LCC: {}'.format(pearsonr(mean_scores_predicted.ravel(), mean_scores.ravel())))
	print('SRCC: {}'.format(spearmanr(mean_scores_predicted.ravel(), mean_scores.ravel())))




	plt.subplot(1, 2, 1)
	out1 = plt.hist(mean_scores, 100, density=0, facecolor='green', alpha=0.5, range=(1,10))
	out2 = plt.hist(mean_scores_predicted, 100, density=0, facecolor='red', alpha=0.5, range=(1,10))
	plt.xticks(np.arange(1, 10, 1))

	plt.xlabel('Scores')
	plt.ylabel('No of images')
	plt.title('Precise histogram of mean scores')
	plt.grid(True)




	# precise histogram of standard deviations

	def std_dev(x):
	mean = x.dot(dist_values)

	# sqrt( E(X^2) - (E(X))^2 )
	return np.sqrt( x.dot(dist_values2) - mean2 )


	std_devs = np.array(list(map(std_dev, histograms)))
	std_predicted = np.array(list(map(std_dev, predictions)))


	plt.subplot(1, 2, 2)
	plt.hist(std_devs, 100, density=0, facecolor='green', alpha=0.5, range=(0,2.5))
	plt.hist(std_predicted, 100, density=0, facecolor='red', alpha=0.5, range=(0,2.5))
	plt.xticks(np.arange(0, 2.5, 0.5))

	plt.xlabel('Scores')
	plt.ylabel('No of images')
	plt.title('Precise histogram of std devs')
	plt.grid(True)

	plt.show()