-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathmultiChannels.py
More file actions
273 lines (251 loc) · 12 KB
/
multiChannels.py
File metadata and controls
273 lines (251 loc) · 12 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
# -*- coding: utf-8 -*-
import cv2
import os
import numpy as np
import pickle
import matplotlib.pyplot as plt
import time
# Larger SIGMA: more likely that foreground is misclassified as background
# Smaller SIGMA: more likely that background is misclassified as foreground
SIGMA = 30
WEIGHT = 0.05
CHANNELS = 3
# Per-channel image GMM model definition
class GmmModel:
    """Per-channel Gaussian mixture background model (Stauffer-Grimson style).

    For every pixel of one image channel it stores up to ``k`` Gaussian
    components column-wise: ``w[j, p]``, ``u[j, p]``, ``sigma[j, p]`` where
    ``p = row * cols + col``.
    """

    def __init__(self, sample_image, k=4, alpha=0.005, t=0.75):
        """Initialize empty per-pixel mixtures sized from *sample_image*.

        sample_image: 2-D array; only its shape is used (pixel count).
        k:     number of Gaussians per pixel (fixed here; some variants
               choose K adaptively per pixel).
        alpha: learning rate.
        t:     background weight-sum threshold T.
        """
        # Number of pixels in the channel.
        self.img_size = sample_image.shape[0] * sample_image.shape[1]
        # Number of initialized models per pixel (starts at 0).
        self.model_count = np.zeros([1, self.img_size], int)
        # Number of Gaussians K per pixel.
        self.k = k
        # Learning rate alpha.
        self.alpha = alpha
        # Sum-of-weight threshold T.
        self.t = t
        # Per-model weights (initialized to 0).
        self.w = np.zeros([self.k, self.img_size])
        # Per-model means (initialized to 0).
        self.u = np.zeros([self.k, self.img_size])
        # Per-model standard deviations, initialized to the default SIGMA.
        # Bug fix: np.full with an int fill value produced an integer array,
        # silently truncating every fractional sigma update during training;
        # force a float dtype.
        self.sigma = np.full([self.k, self.img_size], SIGMA, dtype=float)
# Load the image set from a directory (note: cv2.imread yields BGR images)
def load_data_set(path):
    """Load every readable image under *path*, in sorted filename order.

    Returns a list of images as produced by ``cv2.imread`` (BGR order).

    Fixes: ``os.listdir`` order is platform-dependent, but callers treat the
    result as an ordered frame sequence, so filenames are sorted; files that
    ``cv2.imread`` cannot decode (it returns None) are skipped instead of
    letting None propagate and crash later processing.
    """
    image_set = []
    for filename in sorted(os.listdir(path)):
        file_path = os.path.join(path, filename)
        img = cv2.imread(file_path)
        if img is not None:
            image_set.append(img)
    return image_set
# GMM model initialization
def gmm_models_create():
    """Create one fresh GmmModel per channel of the first training frame.

    Note: cv2.imread/cv2.split yield channels in B, G, R order, so the
    returned list is really (B, G, R) even though callers label it R, G, B;
    this is harmless because every channel is treated identically.
    """
    first_frame = cv2.imread('WavingTrees/background_train/b00000.bmp')
    return [GmmModel(channel) for channel in cv2.split(first_frame)]
# Train the model parameters
def gmm_model_train(gmm_model, single_frame):
    """Update one channel's per-pixel GMM with a single training frame.

    Online Stauffer-Grimson update: each pixel is matched against its existing
    Gaussians (|x - u| <= 2.5 * sigma). A matched model's weight, mean and
    sigma are updated with learning rate alpha; unmatched models only have
    their weight decayed. If no model matches, a new Gaussian is created (or
    the weakest one replaced). Weights are renormalized per pixel.

    gmm_model:    a GmmModel instance, mutated in place.
    single_frame: 2-D array, one channel of a training frame.
    """
    # start_time = time.time()
    img_rows = single_frame.shape[0]
    img_cols = single_frame.shape[1]
    for m in range(img_rows):
        for n in range(img_cols):
            # Flags whether any existing Gaussian matched pixel (m, n).
            matched = False
            for k in range(gmm_model.model_count[0, m * img_cols + n]):
                # Absolute distance between the pixel and the k-th mean.
                difference = abs(single_frame[m, n] - gmm_model.u[k, m * img_cols + n])
                distance = difference * difference
                # Pixel lies within 2.5 standard deviations: model k matches.
                if difference <= 2.5 * gmm_model.sigma[k, m * img_cols + n]:
                    matched = True
                    # Update the parameters of the k-th Gaussian.
                    # Probability density of the pixel under model k.
                    prob = (1 / (2 * np.pi * gmm_model.sigma[k, m * img_cols + n] ** 2) ** 0.5) * np.exp(
                        -(single_frame[m, n] - gmm_model.u[k, m * img_cols + n]) ** 2 / (
                            2 * (gmm_model.sigma[k, m * img_cols + n] ** 2)))
                    p = gmm_model.alpha * prob
                    # update weight
                    gmm_model.w[k, m * img_cols + n] = (1 - gmm_model.alpha) * gmm_model.w[
                        k, m * img_cols + n] + gmm_model.alpha
                    # update mean
                    gmm_model.u[k, m * img_cols + n] = (1 - p) * gmm_model.u[k, m * img_cols + n] + p * single_frame[
                        m, n]
                    # update standard deviation, floored at SIGMA / 2 so a model
                    # never becomes too narrow to ever match again
                    if gmm_model.sigma[k, m * img_cols + n] < SIGMA / 2:
                        gmm_model.sigma[k, m * img_cols + n] = SIGMA / 2
                    else:
                        gmm_model.sigma[k, m * img_cols + n] = ((1 - p) * gmm_model.sigma[
                            k, m * img_cols + n] ** 2 + p * distance) ** 0.5
                    break
                else:
                    # Pixel does not match model k: only decay its weight.
                    gmm_model.w[k, m * img_cols + n] = (1 - gmm_model.alpha) * gmm_model.w[k, m * img_cols + n]
                    # Keep the k models sorted by w/sigma so the replacement
                    # below targets the least reliable model.
                    # NOTE(review): this re-sorts after every non-matching
                    # model rather than once per pixel — confirm intended.
                    gmm_model_sort(gmm_model, m, n, img_cols)
            '''
            No Gaussian matched this pixel, so a new one is needed.
            Two cases must be considered:
            1. Some of the k slots are still uninitialized: create a new Gaussian there.
            2. All k Gaussians are initialized: replace the model with the lowest order weight.
            '''
            if not matched:
                # print('(', m, ',', n, ')', 'no matching distribution')
                # condition 1
                model_count = gmm_model.model_count[0, m * img_cols + n]
                if gmm_model.model_count[0, m * img_cols + n] < gmm_model.k:
                    # initialize weight
                    gmm_model.w[model_count, m * img_cols + n] = WEIGHT
                    # initialize mean
                    gmm_model.u[model_count, m * img_cols + n] = single_frame[m, n]
                    # initialize standard deviation
                    gmm_model.sigma[model_count, m * img_cols + n] = SIGMA
                    gmm_model.model_count[0, m * img_cols + n] = model_count + 1
                # condition 2
                else:
                    # update weight
                    gmm_model.w[gmm_model.k - 1, m * img_cols + n] = WEIGHT
                    # update mean
                    gmm_model.u[gmm_model.k - 1, m * img_cols + n] = single_frame[m, n]
                    # update standard deviation
                    gmm_model.sigma[gmm_model.k - 1, m * img_cols + n] = SIGMA
            # Normalize the pixel's weights so they sum to 1.
            # Guarding against an all-zero column also speeds this up a lot.
            if sum(gmm_model.w[:, m * img_cols + n]) != 0:
                gmm_model.w[:, m * img_cols + n] = gmm_model.w[:, m * img_cols + n] / sum(
                    gmm_model.w[:, m * img_cols + n])
    # end_time = time.time()
    # print(end_time - start_time)
# Sort the k Gaussians of a given pixel (criterion: w/sigma)
def gmm_model_sort(gmm_model, m, n, img_cols):
    """Sort pixel (m, n)'s Gaussians in descending order of fitness w/sigma.

    gmm_model: GmmModel instance, mutated in place.
    m, n:      pixel row and column.
    img_cols:  frame width, used to flatten (m, n) into a column index.

    Bug fix: the previous implementation sorted three separate
    (order_weight, value) zips. When two models had equal order weights the
    tie was broken by the *second* element, so the weight, mean and sigma
    arrays could be permuted differently, scrambling which mean/sigma belonged
    to which weight. A single stable argsort permutation applied to all three
    arrays keeps each (w, u, sigma) triple intact.
    """
    idx = m * img_cols + n
    # Fitness criterion: weight / standard deviation.
    order_weight = gmm_model.w[:, idx] / gmm_model.sigma[:, idx]
    # One stable descending permutation, shared by all three parameter arrays.
    order = np.argsort(-order_weight, kind='stable')
    gmm_model.w[:, idx] = gmm_model.w[order, idx]
    gmm_model.u[:, idx] = gmm_model.u[order, idx]
    gmm_model.sigma[:, idx] = gmm_model.sigma[order, idx]
# Use morphological operations to remove noise and connect foreground regions
def optimize_frame(single_frame):
    """Clean up a binary foreground mask with morphological filtering.

    An opening (2x2 kernel) removes isolated noise pixels, then a closing
    (3x3 kernel) fills small holes and connects nearby foreground regions.
    Returns the filtered mask.
    """
    kernel = cv2.getStructuringElement(cv2.MORPH_RECT, (2, 2))
    frame_parsed = cv2.morphologyEx(single_frame, cv2.MORPH_OPEN, kernel, iterations=2)
    # Bug fix: getStructuringElement expects a *shape* constant; the original
    # passed cv2.MORPH_ERODE (an operation code) which only worked by accident
    # because it happens to equal cv2.MORPH_RECT (both are 0).
    kernel = cv2.getStructuringElement(cv2.MORPH_RECT, (3, 3))
    frame_parsed = cv2.morphologyEx(frame_parsed, cv2.MORPH_CLOSE, kernel, iterations=2)
    return frame_parsed
# Subtract the background from the input image using the trained GMMs and return the resulting mask
def background_subtract(gmm_models, image):
    """Classify each pixel of *image* as background (0) or foreground (255).

    gmm_models: list of trained per-channel GmmModel objects (one per channel
                of *image*, in cv2.split order).
    image:      3-channel image.
    Returns a uint8 mask where 0 = background, 255 = foreground.

    NOTE(review): the model-selection pass below permanently truncates
    model_count on the passed-in models (a side effect on the caller's
    objects); re-running it on the same weights is idempotent, but confirm
    this is intended.
    """
    frame_channels = cv2.split(image)
    img_rows = frame_channels[0].shape[0]
    img_cols = frame_channels[0].shape[1]
    # First select the background models: keep only the first (highest-ranked)
    # Gaussians whose cumulative weight exceeds the threshold T.
    for gmm_model in gmm_models:
        for pixel_index in range(img_rows * img_cols):
            weight_sum = 0
            for k in range(gmm_model.model_count[0, pixel_index]):
                weight_sum = weight_sum + gmm_model.w[k, pixel_index]
                # Once the first k+1 models reach the threshold, keep only them.
                if weight_sum > gmm_model.t:
                    gmm_model.model_count[0, pixel_index] = k + 1
                    break
    # Output mask, initialized to all-foreground (255).
    frame_parsed = np.full([img_rows, img_cols], 255, np.uint8)
    for m in range(img_rows):
        for n in range(img_cols):
            hit_count = 0
            for ii in range(len(gmm_models)):
                for k in range(gmm_models[ii].model_count[0, m * img_cols + n]):
                    # Distance between the pixel value and the Gaussian mean.
                    difference = abs(frame_channels[ii][m, n] - gmm_models[ii].u[k, m * img_cols + n])
                    if difference <= 2 * gmm_models[ii].sigma[k, m * img_cols + n]:
                        # background in this channel
                        hit_count = hit_count + 1
                        break
            # A pixel counts as background only when all three channels match;
            # otherwise it stays foreground.
            if hit_count == CHANNELS:
                frame_parsed[m, n] = 0
    return frame_parsed
# Save the GMM models to disk
def gmm_models_save(gmm_models, path):
    """Serialize the trained GMM models to *path* with pickle."""
    with open(path, 'wb') as out_file:
        pickle.dump(gmm_models, out_file)
# Load the GMM models from disk
def gmm_models_load(path):
    """Deserialize and return GMM models previously saved to *path*.

    NOTE: pickle.load must only be used on trusted local files.
    """
    with open(path, 'rb') as in_file:
        return pickle.load(in_file)
if __name__ == '__main__':
    # One GMM per channel. (cv2.split actually yields B, G, R order; the
    # R/G/B labels below are cosmetic since all channels are treated alike.)
    models = gmm_models_create()
    gmm_model_path = './models_learned/gmm_models_maxK={0}_alpha={1}_T={2}_sigma={3}.pkl'.format(models[0].k,
                                                                                                 models[0].alpha,
                                                                                                 models[0].t, SIGMA)
    # Train only when no cached model file exists; otherwise load it.
    if not os.path.exists(gmm_model_path):
        # Load the training set.
        images = load_data_set('WavingTrees/background_train/')
        for i in range(len(images)):
            print('frame ' + str(i) + ' is training...')
            # Split the frame into its three channels.
            R, G, B = cv2.split(images[i])
            # Train each channel's model in turn.
            print('--->> training channel R...')
            gmm_model_train(models[0], R)
            print('--->> training channel G...')
            gmm_model_train(models[1], G)
            print('--->> training channel B...')
            gmm_model_train(models[2], B)
        print('GMM Models learning process finished')
        print('saving models...')
        # Fix: create the output directory if missing, otherwise open() fails.
        os.makedirs(os.path.dirname(gmm_model_path), exist_ok=True)
        gmm_models_save(models, gmm_model_path)
    else:
        print('local models already exists')
        print('loading models...')
        # Load the locally cached models.
        models = gmm_models_load(gmm_model_path)
    images = load_data_set('WavingTrees/person_in/')
    # Show the subtraction result frame by frame.
    param_str = 'maxK={0} alpha={1} T={2} SIGMA={3}'.format(models[0].k, models[0].alpha, models[0].t, SIGMA)
    plt.ion()
    for i in range(len(images)):
        # Background-subtracted mask.
        frame_subtracted = background_subtract(models, images[i])
        # Morphological clean-up.
        frame_optimized = optimize_frame(frame_subtracted)
        plt.suptitle('(Frame {0}) RealTime Background Subtract\n\n{1}'.format(i + 1, param_str))
        plt.subplot(131)
        plt.title('origin')
        # Fix: cv2 frames are BGR; reverse the channel axis so matplotlib
        # (which expects RGB) shows true colors.
        plt.imshow(images[i][:, :, ::-1])
        plt.subplot(132)
        plt.title('subtracted')
        plt.imshow(frame_subtracted, cmap='gray')
        plt.subplot(133)
        plt.title('optimized')
        plt.imshow(frame_optimized, cmap='gray')
        plt.pause(0.4)
        plt.clf()
    plt.ioff()