My final project is a motion tracking CCTV camera that utilizes poseNet. The basic idea is to use poseNet to locate a person on the screen, and then send that data to a 3D printed CCTV camera mounted on top of a servo motor. By mapping the location data to the angles of the servo motor, it creates the illusion that the CCTV camera is following the person. In addition to the camera tracking, I also wanted to create a motion detecting p5 interface. After watching coding train tutorials on this effect, I discovered a method that uses pixel array data to isolate the moving person from the background, which I found really cool.
A large part of my process involved testing whether the servo-poseNet idea would work or not, and my draft of the final project documents this discovery. For the final project, I had several challenges ahead of me, including creating the p5 interface, figuring out the CCTV camera, and building a base for the camera and motor.
First, with the CCTV camera, I referred to the professor’s slides and came across a website with various 3D models that could be 3D printed. With the professor’s guidance on using the Ultimaker 3, I successfully 3D printed a CCTV camera that was the perfect size for the motor, in my opinion.
Next, I focused on the p5 interface. As mentioned earlier, I aimed to achieve a motion detection look. By applying multiple layers of effects such as grain, blur, and posterize, I was able to create an old-school CCTV footage vibe while also giving it a unique appearance that doesn’t resemble a typical CCTV camera. I wanted to capture the point of view of a camera trying to detect motion.
The final step for me was priming and spray painting the CCTV camera white, and finding the right base for it. Since I wanted to position it behind the laptop, I needed a base of suitable height. I found a cardboard box in my room and repurposed it as the shell for the CCTV camera base. I drilled a large piece of wood into it, which serves as a sturdy base for the motor. I then used wood glue to attach the motor to the wood slab, and glued the motor’s base plate to the CCTV camera.
The following is the code for my Arduino and p5 project:
// video, previous frame and threshold for motion detection let video; let prev; let threshold = 25; // Variables for motion functions and positions let mfun = 0; let motionY = 0; let lerpX = 0; let lerpY = 0; // Font for overlay text and PoseNet related variables let myFont; let poseNet; let pose; let skeleton; let loco = 0; function preload() { myFont = loadFont("VCR_OSD_MONO_1.001.ttf"); } function setup() { // low frame rate for a cool choppy motion detection effect frameRate(5); createCanvas(windowWidth, windowHeight); pixelDensity(1); video = createCapture(VIDEO); video.size(windowWidth, windowHeight); video.hide(); // Create an image to store the previous frame prev = createImage(windowWidth, windowHeight); // Initialize PoseNet and set up callback for pose detection poseNet = ml5.poseNet(video, modelLoaded); poseNet.on("pose", gotPoses); } // Callback for when poses are detected by PoseNet function gotPoses(poses) { //console.log(poses); if (poses.length > 0) { pose = poses[0].pose; skeleton = poses[0].skeleton; } } // Callback for when PoseNet model is loaded function modelLoaded() { console.log("poseNet ready"); } function draw() { // Check for serial port if (!serialActive) { text("Press Space Bar to select Serial Port", 20, 30); } else { text("Connected", 20, 30); } // Check for pose and get nose pose data if (pose) { fill(255, 0, 0); ellipse(pose.nose.x, pose.nose.y, 20); // location of pose nose loco = int(pose.nose.x); // value mapped for servo motor val = int(map(loco, 0, windowWidth, 60, 120)); print(val); } background(0); // load pixels for motion detection video.loadPixels(); prev.loadPixels(); threshold = 40; let count = 0; let avgX = 0; let avgY = 0; // Flip the canvas for video display push(); translate(width, 0); scale(-1, 1); image(video, 0, 0, video.width, video.height); pop(); // Analyzing the pixels for motion detection loadPixels(); for (let x = 0; x < video.width; x++) { for (let y = 0; y < video.height; y++) { // Current and previous pixel colors let loc = (x + y * video.width) * 4; let r1 = video.pixels[loc + 0]; let g1 = video.pixels[loc + 1]; let b1 = video.pixels[loc + 2]; let r2 = prev.pixels[loc + 0]; let g2 = prev.pixels[loc + 1]; let b2 = prev.pixels[loc + 2]; // Calculate color distance let d = distSq(r1, g1, b1, r2, g2, b2); if (d > threshold * threshold) { avgX += x; avgY += y; count++; // Fliped motion effect pixels let flippedLoc = (video.width - x - 1 + y * video.width) * 4; pixels[flippedLoc + 0] = 155; pixels[flippedLoc + 1] = 155; pixels[flippedLoc + 2] = 255; } else { let flippedLoc = (video.width - x - 1 + y * video.width) * 4; pixels[flippedLoc + 0] = 190; pixels[flippedLoc + 1] = 255; pixels[flippedLoc + 2] = 155; } } } // Updating the pixels on the canvas updatePixels(); // Calculate the average motion position if significant motion is detected if (count > 200) { motionX = avgX / count; motionY = avgY / count; } // Mirror the motion tracking coordinates // let flippedMotionX = width - motionX; // lerpX = lerp(lerpX, flippedMotionX, 0.1); // lerpY = lerp(lerpY, motionY, 0.1); // fill(255, 0, 255); // stroke(0); // strokeWeight(2); // ellipse(lerpX, lerpY, 36, 36); // MOREE EFFECTZZZZ filter(INVERT); prev.copy( video, 0, 0, video.width, video.height, 0, 0, prev.width, prev.height ); filter(ERODE); filter(POSTERIZE, random(10, 20)); drawGrid(); // Draw the grid on top of your content drawSurveillanceOverlay(); //surveillance overlay cam drawGrain(); // grain effect for old school cctv vibes filter(BLUR, 1.5); // blur effect to achieve that vhs quality } function distSq(x1, y1, z1, x2, y2, z2) { return sq(x2 - x1) + sq(y2 - y1) + sq(z2 - z1); } // toggle full screen function mousePressed() { if (mouseX > 0 && mouseX < width && mouseY > 0 && mouseY < height) { let fs = fullscreen(); fullscreen(!fs); } } function drawGrain() { loadPixels(); for (let i = 0; i < pixels.length; i += 4) { let grainAmount = random(-10, 10); pixels[i] += grainAmount; // red pixels[i + 1] += grainAmount; // green pixels[i + 2] += grainAmount; // blue // pixels[i + 3] is the alpha channel } updatePixels(); } function drawSurveillanceOverlay() { textFont(myFont); // Set the font textSize(32); // Set the text size // Draw border noFill(); strokeWeight(5); stroke(0, 0, 0, 255); rect(9, 9, width - 16, height - 16); stroke(250, 250, 250, 255); strokeWeight(2.1); rect(9, 9, width - 16, height - 16); // Display timestamp fill(250, 50, 50); fill(250, 250, 250); stroke(0, 120); textSize(30); textAlign(CENTER, TOP); text( new Date().toLocaleString(), windowWidth / 2, windowHeight - windowHeight / 11 ); // cam 01 textSize(17); fill(50, 250, 55); text("CAM 01", width - width / 19, windowHeight / 29); } function drawGrid() { let gridSize = 15; // Size of each grid cell // only the horizontal lines stroke(205, 3); // Grid line color (white with some transparency) strokeWeight(1); // Thickness of grid lines for (let x = 0; x <= width; x += gridSize) { for (let y = 14; y <= height + 16; y += gridSize) { // line(x, 10, x, height); line(11, y, width - 10, y); } } } // serial connection function keyPressed() { if (key == " ") { // important to have in order to start the serial connection!! setUpSerial(); } } function readSerial(data) { //////////////////////////////////// //READ FROM ARDUINO HERE //////////////////////////////////// if (data != null) { // make sure there is actually a message // split the message let fromArduino = split(trim(data), ","); // if the right length, then proceed if (fromArduino.length == 2) { // only store values here // do everything with those values in the main draw loop print("nice"); // We take the string we get from Arduino and explicitly // convert it to a number by using int() // e.g. "103" becomes 103 } ////////////////////////////////// //SEND TO ARDUINO HERE (handshake) ////////////////////////////////// let sendToArduino = val + "\n"; writeSerial(sendToArduino); } }
p5 👆
#include <Servo.h> Servo myservo; // create servo object to control a servo void setup() { Serial.begin(9600); myservo.attach(9); // start the handshake while (Serial.available() <= 0) { digitalWrite(LED_BUILTIN, HIGH); // on/blink while waiting for serial data Serial.println("0,0"); // send a starting message delay(300); // wait 1/3 second digitalWrite(LED_BUILTIN, LOW); delay(50); myservo.write(0); // sets the servo position according to the scaled value } } void loop() { // wait for data from p5 before doing something while (Serial.available()) { Serial.println("0,0"); digitalWrite(LED_BUILTIN, HIGH); // led on while receiving data int value = Serial.parseInt(); if (Serial.read() == '\n') { myservo.write(value); // sets the servo position according to the scaled value } } }
arduino 👆
Overall, I am happy with how the project was realized. It has been a very educational experience for me, as it has allowed me to learn about posenet, 3D printing, and visual effects. These skills will be valuable for my future capstone project, which will focus on surveillance.
Documentation/User Testing from the IM Showcase: