ImageRetrievalClassic/ImageUtils.py at master · aa1000/ImageRetrievalClassic · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
import cv2
import numpy as np
from sklearn.cluster import KMeans
from skimage.feature import greycomatrix, greycoprops
from skimage import data

histsogram_centers_file_name = 'HistogramCenters.npy'
n_indexed_colors=256
n_color_histogram_categories=64
dct2_size = 100
GLCM_resize_size = 200
GLCM_step = 20

# speed-up opencv using multithreads
cv2.setUseOptimized(True)
cv2.setNumThreads(8)

def CreateIndexedColorClasses(feature_vectors):
    # an approximation is more than enough, no need to have high accuracy and waste computing time
    kmeans = KMeans(n_clusters=n_indexed_colors, n_init =1, tol=0.001, max_iter=100, random_state=0, n_jobs=1, algorithm='full')
    kmeans.fit(pixels_vector)
    return kmeans.cluster_centers_

def ImgPathToPixelVector(img_path):
    img = cv2.imread(img_path)
    # a 200*200 image preserves most color information and it's enough for indexing colors
    img = cv2.resize(img,(200,200))
    reshaped_image = img.reshape((-1,3))
    reshaped_image = np.float32(reshaped_image)
    return reshaped_image

def RGBToIndex(img, color_classes):
    # reconstruct the kmeans from center information
    kmeans = KMeans(n_clusters=n_indexed_colors, random_state=0)
    kmeans.cluster_centers_ = color_classes
    # Reshape the image into a vector of pixels
    pixel_vector = img.reshape(-1, 3)
    # Get the nearest class for each pixel
    labels = kmeans.predict(pixel_vector)
    # Reshape the indexed image to the height and width of the original
    return_img = labels
    rows, cols, channels = img.shape
    return return_img.reshape(rows, cols)

def IndexedImageToRGB(indexed_img, color_classes):
    # create a new array of true color pixels
    rg_colors = color_classes[indexed_img.flatten()]
    # reshape the size of the new array to have 3 color channels and the dimensions of the original
    rows, cols = indexed_img.shape
    return rg_colors.reshape(rows, cols, 3)

def CreateColorHistogram(img):
    # Calculte and normalize the histogram for each channel then append them
    histogram = cv2.calcHist([img],[0],None,[n_color_histogram_categories],[0,256])
    histogram = cv2.normalize(histogram, None)

    ch1_histogram = cv2.calcHist([img],[1],None,[n_color_histogram_categories],[0,256])
    ch1_histogram = cv2.normalize(ch1_histogram, None)
    histogram = np.vstack((histogram, ch1_histogram))

    ch2_histogram = cv2.calcHist([img],[2],None,[n_color_histogram_categories],[0,256])
    ch2_histogram = cv2.normalize(ch2_histogram, None)
    histogram = np.vstack((histogram, ch2_histogram))

    return histogram

def CreateIndexedColorHistogram(img, color_classes):
    indexed_img = RGBToIndex(img, color_classes)
    # cv2 calcHist only works with uint8 arrays (?) so we are limited to 256 colors
    indexed_img = indexed_img.astype(np.uint8)
    histogram = cv2.calcHist([indexed_img],[0],None,[n_indexed_colors],[0,n_indexed_colors])
    histogram = cv2.normalize(histogram, None)
    return histogram

def CreateDCT2(img):
	# only the gray image is needed for the dct
    grey_img = cv2.cvtColor(img, cv2.COLOR_RGB2GRAY)
	# normalise the image content
    NormImg = np.float32(grey_img)/255.0
    Dct2 = cv2.dct(NormImg)
    Dct2Out = np.zeros([dct2_size,dct2_size])
    Dct2Out = Dct2[:dct2_size,:dct2_size]
    return Dct2Out.reshape(-1, 1)

def CreateGLCM(img):

    grey_img = cv2.cvtColor(img, cv2.COLOR_RGB2GRAY)
    resized_img = cv2.resize(grey_img,(GLCM_resize_size, GLCM_resize_size))

    energy_features = []
    contrast_features = []

    sz = resized_img.shape
    for i in range(0,sz[0],GLCM_step):
        for j in range(0,sz[1],GLCM_step):
            patch = resized_img[i:i+GLCM_step,j:j+GLCM_step]
            #greycomatrix parameters:
            # 1) patch : part of image to generate co-occurance matrix for
            # 2 & 3): separation vector neighbor [1] and angle in radians [0] "1 to the right"
            # 4) symmetric = True: add the matrix to its transpose
            # 5) normed = True: divide each element in matrix by number of elements in it
            glcm = greycomatrix(patch, [1], [0], 256, symmetric=True, normed=True)
            energy_features.append(greycoprops(glcm, 'energy')[0, 0])
            contrast_features.append(greycoprops(glcm, 'contrast')[0, 0])

    out_glsm_features = np.array(energy_features)
    out_glsm_features = np.vstack((out_glsm_features, contrast_features))

    return out_glsm_features.reshape(-1, 1)

def CreateImageFeaturesVector(img, colors_classes):
    # Create the features of each category
    features_vector = CreateColorHistogram(img)

    indexed_histogram_features = CreateIndexedColorHistogram(img, colors_classes)
    features_vector = np.vstack((features_vector, indexed_histogram_features))

    dct2_features = CreateDCT2(img)
    features_vector = np.vstack((features_vector, dct2_features))

    GLSM_features = CreateGLCM(img)
    features_vector = np.vstack((features_vector, GLSM_features))

    return features_vector