So far, when we work with the screen and pixels, we’ve been drawing shapes and objects to the screen, but nothing that could be called “representational”. We can uses still images and videos (and webcams!) to get images on screen that reflect the “real” world. We can then parse these for more information and create something more interesting than reality.
We can easily load and display images. While it’s possible to load an image from a URL, it’s easier to load it locally. Put it in a folder in your projects path.
let img;// Declare variable img
function preload{
img=loadImage("assets/tenor.gif");// Load the image
}
function setup(){
createCanvas(600,370);
}
function draw(){
// Displays the image at its actual size at point 0,0
image(img,0,0);
}
You can manipulate the image however you like. Similar to a bouncing, spinning rectangle.
// Display an image and bounce it around at 1/2 size
let img; // Declare variable img
let xPos, yPos;
let xSpeed, ySpeed;
let rot = 0.0;
let iw, ih; // variables for the image width and height
// Load the image
function preload() {
img = loadImage("tenor.gif");
}
function setup() {
createCanvas(windowWidth, windowHeight);
// img.width/img.height are attributes about
// your image that can be used as a variable
iw = img.width;
ih = img.height;
// randomly position the picture in the sketch
yPos = random(ih, height - ih);
xPos = random(iw, width - iw);
xSpeed = random(-3, 3);
ySpeed = random(-3, 3);
}
function draw() {
background(255);
// image is drawn from top left corner
// to bottom right corner by default
// imageMode() can be called to change the
// way it's drawn, similar to rectMode
imageMode(CENTER);
// the code below uses translate to
// relocate the x, y coordinates to the center of the image to move and rotate the image
push();
translate(xPos, yPos);
rotate(rot);
// draw the image at 1/2 it's native size
image(img, 0, 0, iw/2, ih/2);
pop();
rot += .01;
xPos += xSpeed;
yPos += ySpeed;
if (xPos >= width || xPos <= 0) {
xSpeed *= -1;
}
if (yPos >= height || yPos <= 0) {
ySpeed *= -1;
}
}
Dan Shiffman’s pointillism example is pretty cool, and demonstrates how to access the values of the pixels in the image.
loadPixels() and get() will let us access the r/g/b values in the image.
We can use the DOM library in p5js to give us access to videos and the camera. Don’t worry, it loads automagically for us.
We need to make a capture variable to get stuff from a camera. createCapture() stores the images in the object, which can be accessed just like an image.
let capture; // variable to hold the video capture
function setup() {
createCanvas(640, 480);
// create the capture object
capture = createCapture(VIDEO);
// set the size of the capture
capture.size(320, 240);
// hide the HTML video
capture.hide();
}
function draw() {
background(255);
// draw the video
image(capture, 0, 0);
}
A movie is similar to an image, but it … moves
let video;
function preload(){
// specify multiple formats for different browsers
video = createVideo(['spoops.mp4', 'spoops.webm']);
}
function setup() {
createCanvas(245, 440);
// by default video shows up in separate DOM
// element outside your canvas.
// hide it to draw to the canvas instead
video.hide();
// play and loop the video
video.loop();
}
function draw() {
//background(255);
image(video, 0, 0, mouseX, mouseY); // draw the video frame to canvas
}
But my video is backwards! You can mirror your image with translate() and scale().
let capture; // variable to hold the video capture
function setup() {
createCanvas(640, 480);
// create the capture object
capture = createCapture(VIDEO);
// set the size of the capture
capture.size(320, 240);
// hide the HTML video
capture.hide();
}
function draw() {
background(255);
// draw the regular image
image(capture, 0, 0);
// draw the mirrored image
push();
translate(width, 0);
scale(-1.0, 1);
image(capture, 0, 0);
pop();
// draw an upside down image
push();
translate(0, height);
scale(1.0, -1);
image(capture, 0, 0);
pop();
// draw a mirrored and upside down image
push();
translate(width, height);
scale(-1.0, -1);
image(capture, 0, 0);
pop();
}
Get the PIXELSSSSSS
All of this becomes really interesting when you start to access the pixels inside the image, video, movie, etc. Each pixel has a R,G,B, and A value associated with it. We can load the image into an array called pixels[], which holds all the information about the image. pixels[0] has the red information of the first pixel in the array, pixels[1] has the green information of the first pixel in the array, pixels[2] has the blue information of the first pixel in the array, and pixels[3] has the alpha information of the first pixel in the array.
To operate on the pixels you need to loadPixels() each frame. To write them out after doing something interesting with them, you updatePixels(). You don’t need to do this all the time though.
This will go thru all the pixels in the video, then swap the colors around.
We can ask questions about the pixels when we loop through them :
let img; // image we will eventually display on our canvas
function setup() {
createCanvas(640, 480);
mirror = createCapture(VIDEO); // our video object that will just see what the camera sees
mirror.size(320,240);
img = createImage(640, 480); // create our image to be the same size as our canvas
let.loadPixels(); // load our pixels into our first set of pixels into the image
}
function draw() {
background(255);
mirror.loadPixels(); // load pixel information into our mirror array
for (var i=0; i < 4*(mirror.width*mirror.height); i+=4) { //multiply and step by 4 since each pixel has 4 color variables associated with it (r,g,b,a)
let r = mirror.pixels[i]; // store red value
let g = mirror.pixels[i+ 1]; // store green value
let b = mirror.pixels[i+ 2]; // store blue value
let a = mirror.pixels[i+ 3];// store alpha value
img.pixels[i] = b; // in the image swap red values for blue values
img.pixels[i + 1] = r; // in the image swap green values for red values
img.pixels[i + 2] = g; // in the image swap blue values for green values
img.pixels[i + 3]= a; // keep alpha the same for now
}
img.updatePixels(); // update all the pixels for the image after you've looped through all the pixels
image(img,0,0); // finally write new processed image to the canvas
}
This looks at the brightness of each video pixel and uses it as a means to draw circles. We can step thru each pixel and get the brightness like so :
function setup() {
createCanvas(640, 480);
mirror = createCapture(VIDEO);
mirror.size(640,480);
noStroke();
fill(0);
}
function draw() {
background(255);
mirror.loadPixels();
let stepSize = round(constrain(mouseX / 8, 6, 32)); // based on mouseX limit the size of our ellipses' diameter to be between 6 and 32 px.
for (let y=0; y<height; y+=stepSize) {
for (let x=0; x<width; x+=stepSize) {
var i = y * width + x;
let darkness = (255 - mirror.pixels[i*4]) / 255; // alpha is always 255
let radius = stepSize * darkness;
ellipse(x, y, radius, radius);
}
}
}
Computer vision
Tracking things can be pretty easy sometimes :
We can double up our for loops to get the position of a pixel in the pixels array :
for (let x = 0; x < video.width; x ++ ) {
for (let y = 0; y < video.height; y ++ ) {
let loc = x + y*video.width;
// What is current color
color currentColor = video.pixels[loc];
let red = red(currentColor);
let green = green(currentColor);
let blue = blue(currentColor);
// SOME IF STATEMENT THAT ASKS A QUESTION ABOUT THAT COLOR
}
}
This is the magic line :
let loc = x + y*video.width;
Tracking colors
We can use the dist() function to get the distance from one color to another :
let video;
// A variable for the color we are searching for.
let trackColor;
function setup() {
createCanvas(640, 480);
// devicePixelScaling(false);
video = createCapture(VIDEO);
video.size(320, 240);
// The above function actually makes a separate video
// element on the page. The line below hides it since we are
// drawing the video to the canvas
video.hide();
// Start off tracking for red
trackColor = [255, 0, 0];
}
function draw() {
// Draw the video
image(video, 0, 0);
// We are going to look at the video's pixels
video.loadPixels();
// Before we begin searching, the "world record" for closest color is set to a high number that is easy for the first pixel to beat.
let worldRecord = 500;
// XY coordinate of closest color
let closestX = 0;
let closestY = 0;
for (let y = 0; y < video.height; y++) {
for (let x = 0; x < video.width; x++) {
let loc = (x + y * video.width) * 4;
// The functions red(), green(), and blue() pull out the three color components from a pixel.
let r1 = video.pixels[loc];
let g1 = video.pixels[loc + 1];
let b1 = video.pixels[loc + 2];
let r2 = trackColor[0];
let g2 = trackColor[1];
let b2 = trackColor[2];
// Using euclidean distance to compare colors
let d = dist(r1, g1, b1, r2, g2, b2); // We are using the dist( ) function to compare the current color with the color we are tracking.
// If current color is more similar to tracked color than
// closest color, save current location and current difference
if (d < worldRecord) {
worldRecord = d;
closestX = x;
closestY = y;
}
}
}
// We only consider the color found if its color distance is less than 10.
// This threshold of 10 is arbitrary and you can adjust this number depending on how accurate you require the tracking to be.
if (worldRecord < 50) {
// Draw a circle at the tracked pixel
fill(trackColor);
strokeWeight(4.0);
stroke(0);
ellipse(closestX, closestY, 16, 16);
}
}
function mousePressed() {
// Save color where the mouse is clicked in trackColor variable
trackColor = video.get(mouseX, mouseY);
console.log(trackColor);
}
Here is is a little smoother by taking the average of all the pixels under a certain threshold :
let threshold = 20; //255 is white, 0 is black
let aveX, aveY; //this is what we are trying to find
let objectR =255;
let objectG = 0;
let objectB = 0;
let debug = true;
function setup() {
createCanvas(640, 480);
video = createCapture(VIDEO);
video.size(320, 240);
video.hide();
}
function draw(){
video.loadPixels();
let totalFoundPixels= 0; //we are going to find the average location of change pixes so
let sumX = 0; //we will need the sum of all the x find, the sum of all the y find and the total finds
let sumY = 0;
//enter into the classic nested for statements of computer vision
for (let row = 0; row < video.height; row++) {
for (let col = 0; col < video.width; col++) {
//the pixels file into the room long line you use this simple formula to find what row and column the sit in
let offset = (row * video.width + col)*4;
//pull out the same pixel from the current frame
let thisColor = video.pixels[offset];
//pull out the individual colors for both pixels
let r = video.pixels[offset];
let g = video.pixels[offset + 1];
let b = video.pixels[offset + 2];
//in a color "space" you find the distance between color the same whay you would in a cartesian space, phythag or dist in processing
let diff = dist(r, g, b, objectR, objectG, objectB);
if (diff < threshold) { //if it is close enough in size, add it to the average
sumX = sumX + col;
sumY= sumY + row;
totalFoundPixels++;
// if (debug) video.pixels[offset] = 0xff000000;//debugging
}
}
}
video.updatePixels();
image(video,0,0);
if (totalFoundPixels > 0){
aveX = sumX/totalFoundPixels;
aveY = sumY/totalFoundPixels;
ellipse(aveX-10,(aveY-10),20,20);
}
}
function mousePressed(){
//if they click, use that picture for the new thing to follow
// var offset = mouseY * video.width + mouseX;
//pull out the same pixel from the current frame
let thisColor = video.get(mouseX,mouseY);
//pull out the individual colors for both pixels
objectR = thisColor[0];
objectG = thisColor[1];
objectB = thisColor[2];
println("Chasing new color " + objectR + " " + objectG + " " + objectB);
}
function keyPressed() {
//for adjusting things on the fly
if (key == '-') {
threshold--;
println("Threshold " + threshold);
}
else if (key == '=') {
threshold++;
println("Threshold " + threshold);
}
else if (key == 'd') {
background(255);
debug = !debug;
println("Debug " + debug);
}
else if (key == 't') {
println("Time Between Frames " + ellapsedTime);
}
}
Background subtraction is great too
This allows us to isolate objects from the front of the camera, it's like a DIY Zoom background
let video;
let display;
let bgImage;
// How different must a pixel be to be a foreground pixel
let threshold = 20;
function setup() {
createCanvas(640, 480);
video = createCapture(VIDEO);
video.size(320, 240);
video.hide();
// Create an empty image the same size as the video
bgImage = createImage(width, height);
display = createImage(width, height);
}
function draw() {
// We are looking at the video's pixels, the memorized backgroundImage's pixels, as well as accessing the display pixels.
// So we must loadPixels() for all!
video.loadPixels();
bgImage.loadPixels();
display.loadPixels();
// Begin loop to walk through every pixel
for (let x = 0; x < video.width; x++) {
for (let y = 0; y < video.height; y++) {
let loc = (x + y * video.width) * 4; // What is the 1D pixel location
// Store the RGB values for each pixel of the video and our background image
let r1 = video.pixels[loc];
let g1 = video.pixels[loc + 1];
let b1 = video.pixels[loc + 2];
let r2 = bgImage.pixels[loc];
let g2 = bgImage.pixels[loc + 1];
let b2 = bgImage.pixels[loc + 2];
//Compare the foreground and background color
let diff = dist(r1, g1, b1, r2, g2, b2);
// Is the foreground color different from the background color
if (diff > threshold) {
// If so, display the foreground color
display.pixels[loc] = video.pixels[loc];
display.pixels[loc + 1] = video.pixels[loc + 1];
display.pixels[loc + 2] = video.pixels[loc + 2];
display.pixels[loc + 3] = video.pixels[loc + 3];
} else {
// If not, display green
display.pixels[loc] = 0;
display.pixels[loc + 1] = 255;
display.pixels[loc + 2] = 0; // We could choose to replace the background pixels with something other than the color green!
display.pixels[loc + 3] = 255;
}
}
}
//update the display image
display.updatePixels();
// display the updated display image
image(display, 0, 0);
// show our threshold in text at the bottom of the screen
fill(0);
rect(0, height - 20, width, height);
fill(255);
text("Threshold is now: " + threshold, 20, height - 5);
}
function mousePressed() {
for (var i = 0; i < video.pixels.length; i++) {
bgImage.pixels[i] = video.pixels[i];
}
bgImage.updatePixels();
changeThreshold(); // comment this out to keep threshold constant
}
// change the threshold on the fly depending on where you click
function changeThreshold() {
threshold = map(mouseX, 0, width, 0, 175);
print("Threshold is now: " + threshold);
}