forked from s60sc/ESP32-CAM_MJPEG2SD
-
Notifications
You must be signed in to change notification settings - Fork 0
/
motionDetect.cpp
370 lines (332 loc) · 14.8 KB
/
motionDetect.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
/*
Detect movement in sequential images using background subtraction.
Very small (96x96) bitmaps are used both to provide image smoothing, which reduces spurious motion changes,
and to enable rapid processing.
Bitmaps can either be color or grayscale. Color requires triple memory
of grayscale and more processing.
The amount of change between images will depend on the frame rate.
A faster frame rate will need a higher sensitivity
When frame size is changed the OV2640 outputs a few glitched frames whilst it
makes the transition. These could be interpreted as spurious motion.
Machine Learning can be incorporated to further discriminate when motion detection
has occurred by classifying whether the object in the frame is of a particular
type of interest, e.g. a human, animal, vehicle etc.
s60sc 2020, 2023
*/
#include "appGlobals.h"
#if INCLUDE_TINYML
#include TINY_ML_LIB
#endif
using namespace std;
#define RESIZE_DIM 96 // width and height in pixels of the square resized motion bitmap
#define RESIZE_DIM_SQ (RESIZE_DIM * RESIZE_DIM) // pixels in bitmap
#define INACTIVE_COLOR 96 // color for inactive motion pixel (NOTE(review): not referenced in the code visible here)
#define JPEG_QUAL 80 // % quality for generated motion detect jpeg
// motion recording parameters
int detectMotionFrames = 5; // min sequence of changed frames to confirm motion
int detectNightFrames = 10; // frames of sequential darkness to avoid spurious day / night switching
// define region of interest, ie exclude top and bottom of image from movement detection if required
// divide image into detectNumBands horizontal bands, define start and end bands of interest, 1 = top
int detectNumBands = 10;
int detectStartBand = 3;
int detectEndBand = 8; // inclusive
int detectChangeThreshold = 15; // min difference in pixel comparison to indicate a change
uint8_t colorDepth; // bytes per pixel of the motion bitmaps (compared against RGB888_BYTES), set by depthColor config
static size_t stride; // set by checkMotion() to the inverse of colorDepth, used to convert between bitmap and RGB888 offsets
bool mlUse = false; // whether to use ML for motion detection, requires INCLUDE_TINYML to be true
float mlProbability = 0.8; // minimum probability (0.0 - 1.0) for positive classification
uint8_t lightLevel; // Current ambient light level as a %, updated by checkMotion()
uint8_t nightSwitch = 20; // initial white level % for night/day switching
float motionVal = 8.0; // initial motion sensitivity setting, higher value lowers the changed pixel count needed in checkMotion()
uint8_t* motionJpeg = NULL; // JPEG of the change map built by checkMotion() when dbgMotion is set
size_t motionJpegLen = 0; // byte length of motionJpeg content, checkMotion() only builds a new JPEG when this is 0
static uint8_t* currBuff = NULL; // current resized bitmap, allocated by checkMotion()
/**********************************************************************************/
// defined at end of file, decodes a JPEG into a downscaled bitmap
static bool jpg2rgb(const uint8_t* src, size_t src_len, uint8_t* out, jpg_scale_t scale);
bool isNight(uint8_t nightSwitch) {
  // Debounced day / night state, used for suspending recording
  // or for switching relay if enabled.
  //   nightSwitch: light level % threshold. lightLevel below it is a dark frame,
  //                lightLevel above it is a light frame.
  //   returns: true while night time is in force.
  // The state only changes after an unbroken sequence of frames on the other
  // side of the threshold: more than detectNightFrames dark frames to enter
  // night time, and the same number of light frames to return to day time.
  // A frame that breaks the sequence restarts the count, so that isolated dark
  // or light frames cannot accumulate over time into a spurious switch.
  static bool nightTime = false;
  static uint16_t nightCnt = 0; // dark frames seen so far (day), or light frames still needed (night)
  if (nightTime) {
    if (lightLevel > nightSwitch) {
      // light image
      if (nightCnt > 0) nightCnt--;
      // signal day time after given sequence of light frames
      if (nightCnt == 0) {
        nightTime = false;
        LOG_INF("Day time");
      }
    } else {
      // sequence of light frames broken, so the full sequence is needed again
      nightCnt = (detectNightFrames > 0) ? detectNightFrames + 1 : 1;
    }
  } else {
    if (lightLevel < nightSwitch) {
      // dark image
      nightCnt++;
      // signal night time after given sequence of dark frames
      if (nightCnt > detectNightFrames) {
        nightTime = true;
        LOG_INF("Night time");
      }
    } else {
      // sequence of dark frames broken
      nightCnt = 0;
    }
  }
  return nightTime;
}
static void rescaleImage(const uint8_t* input, int inputWidth, int inputHeight, uint8_t* output, int outputWidth, int outputHeight) {
  // Use bilinear interpolation to resize image.
  //   input:  source bitmap of inputWidth x inputHeight pixels, colorDepth bytes per pixel
  //   output: destination bitmap of outputWidth x outputHeight pixels, colorDepth bytes per pixel
  // Each output pixel is the weighted mix of the 4 source pixels surrounding its
  // projected position. Nothing is written if any argument is unusable.
  if (input == NULL || output == NULL) return;
  if (inputWidth <= 0 || inputHeight <= 0 || outputWidth <= 0 || outputHeight <= 0) return;
  float xRatio = (float)inputWidth / (float)outputWidth;
  float yRatio = (float)inputHeight / (float)outputHeight;
  const int maxX = inputWidth - 1;
  const int maxY = inputHeight - 1;
  for (int i = 0; i < outputHeight; ++i) {
    // vertical terms are the same for every pixel in the row
    int yL = (int)floor(yRatio * i);
    int yH = (int)ceil(yRatio * i);
    float yWeight = yRatio * i - yL;
    // ceil() can step past the last row when upscaling, so repeat the edge row instead
    if (yL > maxY) yL = maxY;
    if (yH > maxY) yH = maxY;
    for (int j = 0; j < outputWidth; ++j) {
      int xL = (int)floor(xRatio * j);
      int xH = (int)ceil(xRatio * j);
      float xWeight = xRatio * j - xL;
      // likewise repeat the edge column rather than read beyond the row
      if (xL > maxX) xL = maxX;
      if (xH > maxX) xH = maxX;
      for (int channel = 0; channel < colorDepth; ++channel) {
        uint8_t a = input[(yL * inputWidth + xL) * colorDepth + channel];
        uint8_t b = input[(yL * inputWidth + xH) * colorDepth + channel];
        uint8_t c = input[(yH * inputWidth + xL) * colorDepth + channel];
        uint8_t d = input[(yH * inputWidth + xH) * colorDepth + channel];
        float pixel = a * (1 - xWeight) * (1 - yWeight) + b * xWeight * (1 - yWeight)
                    + c * yWeight * (1 - xWeight) + d * xWeight * yWeight;
        output[(i * outputWidth + j) * colorDepth + channel] = (uint8_t)pixel;
      }
    }
  }
}
#if INCLUDE_TINYML
static int getImageData(size_t offset, size_t length, float *out_ptr) {
  // Classifier data callback: supply length pixels of currBuff, starting at
  // pixel offset, each packed as a 0xRRGGBB value held in a float.
  // A grayscale pixel has its single value repeated in all three positions.
  // Always returns 0.
  size_t src = offset * colorDepth; // byte position of first requested pixel
  for (size_t n = 0; n < length; n++) {
    int packed;
    if (colorDepth == RGB888_BYTES) {
      packed = (currBuff[src] << 16) + (currBuff[src + 1] << 8) + currBuff[src + 2];
    } else {
      packed = (currBuff[src] << 16) + (currBuff[src] << 8) + currBuff[src];
    }
    out_ptr[n] = (float)packed;
    src += colorDepth;
  }
  return 0;
}
static bool tinyMLclassify() {
// convert input data to appropriate format
bool out = false;
uint32_t dTime = millis();
// reduce size of bitmap to that required by classifier and copy to features as grayscale or RGB
if (RESIZE_DIM != EI_CLASSIFIER_INPUT_WIDTH) {
uint8_t* tempBuff = (uint8_t*)ps_malloc(EI_CLASSIFIER_INPUT_WIDTH * EI_CLASSIFIER_INPUT_HEIGHT * colorDepth);
rescaleImage(currBuff, RESIZE_DIM, RESIZE_DIM, tempBuff, EI_CLASSIFIER_INPUT_WIDTH, EI_CLASSIFIER_INPUT_HEIGHT);
memcpy(currBuff, tempBuff, EI_CLASSIFIER_INPUT_WIDTH * EI_CLASSIFIER_INPUT_HEIGHT * colorDepth);
free(tempBuff);
}
signal_t features_signal;
features_signal.total_length = EI_CLASSIFIER_INPUT_WIDTH * EI_CLASSIFIER_INPUT_HEIGHT;
features_signal.get_data = &getImageData;
// Run the classifier
ei_impulse_result_t result = { 0 };
EI_IMPULSE_ERROR res = run_classifier(&features_signal, &result, false);
if (res == EI_IMPULSE_OK) {
if (result.classification[0].value > mlProbability) {
out = true; // sufficient classification match, so keep motion detection
if (dbgVerbose) {
LOG_VRB("Prob: %0.2f, Timing: DSP %d ms, inference %d ms, anomaly %d ms",
result.classification[0].value, result.timing.dsp, result.timing.classification, result.timing.anomaly);
char outcome[200] = {0};
for (uint16_t i = 0; i < EI_CLASSIFIER_LABEL_COUNT; i++)
sprintf(outcome + strlen(outcome), "%s: %.2f, ", ei_classifier_inferencing_categories[i], result.classification[i].value);
LOG_VRB("Predictions - %s in %ums", outcome, millis() - dTime);
}
}
} else LOG_WRN("Failed to run classifier (%d)", res);
return out;
}
#endif
bool checkMotion(camera_fb_t* fb, bool motionStatus) {
  // Check difference between current and previous image (subtract background).
  //   fb:           camera frame holding the JPEG to be checked
  //   motionStatus: whether motion was ongoing before this frame
  //   returns:      updated motion status, always false during night time.
  //                 motionStatus is returned unchanged if the frame could not be processed.
  // The JPEG is decoded to a downscaled RGB888 or 8 bit grayscale bitmap, which is
  // resized to RESIZE_DIM x RESIZE_DIM and compared pixel by pixel with the
  // bitmap from the previous call. Motion starts after detectMotionFrames
  // consecutive frames with enough changed pixels inside the region of interest.
  // Also updates lightLevel and nightTime, and when dbgMotion is set builds a
  // JPEG of the change map in motionJpeg for streaming.
  uint32_t dTime = millis();
  uint32_t lux = 0;
  static uint32_t motionCnt = 0;
  uint8_t* jpg_buf = NULL;
  const size_t motionJpegMax = 32 * 1024; // allocated size of motionJpeg
  const size_t bitmapMax = RESIZE_DIM_SQ * RGB888_BYTES; // resized bitmap size at largest color depth

  // calculate parameters for sample size
  uint8_t scaling = frameData[fsizePtr].scaleFactor;
  uint16_t reducer = frameData[fsizePtr].sampleRate;
  uint8_t downsize = pow(2, scaling) * reducer;
  int sampleWidth = frameData[fsizePtr].frameWidth / downsize;
  int sampleHeight = frameData[fsizePtr].frameHeight / downsize;
  stride = (colorDepth == RGB888_BYTES) ? GRAYSCALE_BYTES : RGB888_BYTES; // stride is inverse of colorDepth

  // decode buffer is retained between calls, but has to grow if a frame size
  // needing a larger sample is subsequently selected
  static uint8_t* rgb_buf = NULL;
  static size_t rgbBufLen = 0;
  size_t rgbNeeded = (size_t)sampleWidth * sampleHeight * RGB888_BYTES;
  if (rgb_buf == NULL || rgbNeeded > rgbBufLen) {
    free(rgb_buf);
    rgb_buf = (uint8_t*)ps_malloc(rgbNeeded);
    rgbBufLen = (rgb_buf == NULL) ? 0 : rgbNeeded;
  }
  if (rgb_buf == NULL) {
    LOG_WRN("motionDetect: failed to allocate decode buffer");
    return motionStatus;
  }

  if (!jpg2rgb((uint8_t*)fb->buf, fb->len, rgb_buf, (jpg_scale_t)scaling)) {
    if (fsizePtr > 16) {
      LOG_WRN("Frame size %s too large for motion detection", frameData[fsizePtr].frameSizeStr);
      useMotion = false;
    } else LOG_WRN("jpg2rgb() failure");
    return motionStatus;
  }
  LOG_VRB("JPEG to rescaled %s bitmap conversion %u bytes in %lums", colorDepth == RGB888_BYTES ? "color" : "grayscale", sampleWidth * sampleHeight * colorDepth, millis() - dTime);

  // allocate buffer space on heap, retried on a later call if not available
  size_t resizeDimLen = RESIZE_DIM_SQ * colorDepth; // byte size of bitmap
  static uint8_t* prevBuff = NULL;
  static uint8_t* changeMap = NULL;
  if (motionJpeg == NULL) motionJpeg = (uint8_t*)ps_malloc(motionJpegMax);
  if (currBuff == NULL) currBuff = (uint8_t*)ps_malloc(bitmapMax);
  if (prevBuff == NULL) {
    prevBuff = (uint8_t*)ps_malloc(bitmapMax);
    if (prevBuff != NULL) memset(prevBuff, 0, bitmapMax); // defined content for first comparison
  }
  if (changeMap == NULL) changeMap = (uint8_t*)ps_malloc(bitmapMax);
  if (motionJpeg == NULL || currBuff == NULL || prevBuff == NULL || changeMap == NULL) {
    LOG_WRN("motionDetect: failed to allocate motion buffers");
    return motionStatus;
  }

  dTime = millis();
  rescaleImage(rgb_buf, sampleWidth, sampleHeight, currBuff, RESIZE_DIM, RESIZE_DIM);
  LOG_VRB("Bitmap rescale to %u bytes in %lums", resizeDimLen, millis() - dTime);

  // compare each pixel in current frame with previous frame
  dTime = millis();
  int changeCount = 0;
  // set horizontal region of interest in image, as byte offsets [startPixel, endPixel) into bitmap
  int startPixel = (RESIZE_DIM*(detectStartBand-1)/detectNumBands) * RESIZE_DIM * colorDepth;
  int endPixel = (RESIZE_DIM*(detectEndBand)/detectNumBands) * RESIZE_DIM * colorDepth;
  int moveThreshold = ((endPixel-startPixel)/colorDepth) * (11-motionVal)/100; // number of changed pixels that constitute a movement
  for (int i = 0; i < (int)resizeDimLen; i += colorDepth) {
    // average the color channels to get a single brightness per pixel
    uint16_t currPix = 0, prevPix = 0;
    for (int j = 0; j < colorDepth; j++) {
      currPix += currBuff[i + j];
      prevPix += prevBuff[i + j];
    }
    currPix /= colorDepth;
    prevPix /= colorDepth;
    lux += currPix; // for calculating light level
    uint8_t pixVal = 255; // show active changed pixel as bright red color in changeMap image
    // set up display image for motion tracking debug
    if (dbgMotion) for (int j = 0; j < RGB888_BYTES; j++) changeMap[(i * stride) + j] = currPix; // grayscale
    // determine pixel change status
    if (abs((int)currPix - (int)prevPix) > detectChangeThreshold) {
      if (i >= startPixel && i < endPixel) changeCount++; // number of changed pixels
      else pixVal = 80; // show inactive changed pixel as dark red color in changeMap image
      if (dbgMotion) {
        changeMap[(i * stride) + 2] = pixVal;
        for (int j = 0; j < RGB888_BYTES - 1; j++) changeMap[(i * stride) + j] = 0;
      }
    }
  }
  lightLevel = (lux*100)/(RESIZE_DIM_SQ*255); // light value as a %
  nightTime = isNight(nightSwitch);
  memcpy(prevBuff, currBuff, resizeDimLen); // save image for next comparison
  LOG_VRB("Detected %u changes, threshold %u, light level %u, in %lums", changeCount, moveThreshold, lightLevel, millis() - dTime);

  if (!nightTime && changeCount > moveThreshold) {
    LOG_VRB("### Change detected");
    motionCnt++; // number of consecutive changes
    // need minimum sequence of changes to signal valid movement
    if (!motionStatus && motionCnt >= detectMotionFrames) {
      LOG_VRB("***** Motion - START");
      motionStatus = true; // motion started
#if INCLUDE_TINYML
      // pass image to TinyML for classification
      if (!dbgMotion && mlUse) if (!tinyMLclassify()) motionCnt = 0; // not classified, so cancel motion
#endif
      if (motionCnt) { // in case unset by tinyMLclassify()
#if INCLUDE_SMTP
        if (smtpUse) {
          // send email with movement image
          keepFrame(fb);
          char subjectMsg[50];
          snprintf(subjectMsg, sizeof(subjectMsg) - 1, "from %s", hostName);
          emailAlert("Motion Alert", subjectMsg);
        }
#endif
#if INCLUDE_TGRAM
        if (tgramUse) keepFrame(fb); // for telegram, wait till filename available
#endif
      }
#if INCLUDE_MQTT
      if (mqtt_active && motionCnt) {
        sprintf(jsonBuff, "{\"MOTION\":\"ON\",\"TIME\":\"%s\"}",esp_log_system_timestamp());
        mqttPublish(jsonBuff);
        mqttPublishPath("motion", "on");
      }
#endif
    }
  } else motionCnt = 0;

  if (motionStatus && !motionCnt) {
    // insufficient change or motion not classified
    LOG_VRB("***** Motion - STOP");
    motionStatus = false; // motion stopped
#if INCLUDE_MQTT
    if (mqtt_active) {
      sprintf(jsonBuff, "{\"MOTION\":\"OFF\",\"TIME\":\"%s\"}", esp_log_system_timestamp());
      mqttPublish(jsonBuff);
      mqttPublishPath("motion", "off");
    }
#endif
  }
  if (motionStatus) LOG_VRB("*** Motion - ongoing %u frames", motionCnt);

  if (dbgMotion && !motionJpegLen) {
    // ready to setup next movement map for streaming
    dTime = millis();
    // build jpeg of changeMap for debug streaming, changeMap is always RGB888
    size_t jpgLen = 0;
    if (!fmt2jpg(changeMap, bitmapMax, RESIZE_DIM, RESIZE_DIM, PIXFORMAT_RGB888, JPEG_QUAL, &jpg_buf, &jpgLen))
      LOG_WRN("motionDetect: fmt2jpg() failed");
    else if (jpgLen > motionJpegMax)
      LOG_WRN("motionDetect: changeMap JPEG too large");
    else {
      memcpy(motionJpeg, jpg_buf, jpgLen);
      motionJpegLen = jpgLen; // only publish length once content is in place
    }
    free(jpg_buf); // releases 128kB in to_jpg.cpp
    jpg_buf = NULL;
    xSemaphoreGive(motionSemaphore);
    LOG_VRB("Created changeMap JPEG %d bytes in %lums", motionJpegLen, millis() - dTime);
  }

  if (dbgVerbose) checkMemory();
  LOG_VRB("============================");
  // motionStatus indicates whether motion previously ongoing or not
  return nightTime ? false : motionStatus;
}
/************* copied and modified from esp32-camera/to_bmp.c to access jpg_scale_t *****************/
// Context passed through esp_jpg_decode() to the _jpg_read() and _rgb_write() callbacks
typedef struct {
uint16_t width; // image width, stored by _rgb_write() from its write start call
uint16_t height; // image height, stored by _rgb_write() from its write start call
uint16_t data_offset; // byte offset into output where pixel data starts, jpg2rgb() sets this to 0
const uint8_t *input; // source JPEG data, copied from by _jpg_read()
uint8_t *output; // destination bitmap, written by _rgb_write()
} rgb_jpg_decoder;
static bool _rgb_write(void * arg, uint16_t x, uint16_t y, uint16_t w, uint16_t h, uint8_t *data) {
// mpjpeg2sd: modified to generate 24 bit RGB or 8 bit grayscale
rgb_jpg_decoder * jpeg = (rgb_jpg_decoder *)arg;
if (!data){
if (x == 0 && y == 0) {
// write start
jpeg->width = w;
jpeg->height = h;
}
return true;
}
size_t jw = jpeg->width*RGB888_BYTES;
size_t t = y * jw;
size_t b = t + (h * jw);
size_t l = x * RGB888_BYTES;
uint8_t *out = jpeg->output+jpeg->data_offset;
uint8_t *o = out;
size_t iy, ix;
w *= RGB888_BYTES;
for (iy=t; iy<b; iy+=jw) {
o = out+(iy+l)/stride;
for (ix=0; ix<w; ix+=RGB888_BYTES) {
if (colorDepth == RGB888_BYTES) {
o[ix] = data[ix+2];
o[ix+1] = data[ix+1];
o[ix+2] = data[ix];
} else {
uint16_t grayscale = (data[ix+2]+data[ix+1]+data[ix])/RGB888_BYTES;
o[ix/RGB888_BYTES] = (uint8_t)grayscale;
}
}
data+=w;
}
return true;
}
static unsigned int _jpg_read(void * arg, size_t index, uint8_t *buf, size_t len) {
rgb_jpg_decoder * jpeg = (rgb_jpg_decoder *)arg;
if (buf) memcpy(buf, jpeg->input + index, len);
return len;
}
static bool jpg2rgb(const uint8_t* src, size_t src_len, uint8_t* out, jpg_scale_t scale) {
rgb_jpg_decoder jpeg;
jpeg.width = 0;
jpeg.height = 0;
jpeg.input = src;
jpeg.output = out;
jpeg.data_offset = 0;
esp_err_t res = esp_jpg_decode(src_len, scale, _jpg_read, _rgb_write, (void*)&jpeg);
return (res == ESP_OK) ? true : false;
}