dlib/examples/random_cropper_ex.cpp
Davis King 17b48b97bb Changed the random_cropper's interface so that instead of talking in terms of
min and max object height, it's now min and max object size.  This way, if you
have objects that are short and wide (i.e. objects where the relevant dimension
is width rather than height) you will get sensible behavior out of the random
cropper.
2017-06-17 12:34:26 -04:00

96 lines
3.5 KiB
C++

// The contents of this file are in the public domain. See LICENSE_FOR_EXAMPLE_PROGRAMS.txt
/*
When you are training a convolutional neural network using the loss_mmod loss
layer, you need to generate a bunch of identically sized training images. The
random_cropper is a convenient tool to help you crop out a bunch of
identically sized images from a training dataset.
This example shows you what it does exactly and talks about some of its options.
*/
#include <iostream>
#include <dlib/data_io.h>
#include <dlib/gui_widgets.h>
#include <dlib/image_transforms.h>
using namespace std;
using namespace dlib;
// ----------------------------------------------------------------------------------------
int main(int argc, char** argv) try
{
if (argc != 2)
{
cout << "Give an image dataset XML file to run this program." << endl;
cout << "For example, if you are running from the examples folder then run this program by typing" << endl;
cout << " ./random_cropper_ex faces/training.xml" << endl;
cout << endl;
return 0;
}
// First lets load a dataset
std::vector<matrix<rgb_pixel>> images;
std::vector<std::vector<mmod_rect>> boxes;
load_image_dataset(images, boxes, argv[1]);
// Here we make our random_cropper. It has a number of options.
random_cropper cropper;
// We can tell it how big we want the cropped images to be.
cropper.set_chip_dims(400,400);
// Also, when doing cropping, it will map the object annotations from the
// dataset to the cropped image as well as perform random scale jittering.
// You can tell it how much scale jittering you would like by saying "please
// make the objects in the crops have a min and max size of such and such".
// You do that by calling these two functions. Here we are saying we want the
// objects in our crops to be between 0.2*400 and 0.8*400 pixels in height.
cropper.set_min_object_size(0.2);
cropper.set_max_object_size(0.8);
// The cropper can also randomly mirror and rotate crops, which we ask it to
// perform as well.
cropper.set_randomly_flip(true);
cropper.set_max_rotation_degrees(50);
// This fraction of crops are from random parts of images, rather than being centered
// on some object.
cropper.set_background_crops_fraction(0.2);
// Now ask the cropper to generate a bunch of crops. The output is stored in
// crops and crop_boxes.
std::vector<matrix<rgb_pixel>> crops;
std::vector<std::vector<mmod_rect>> crop_boxes;
// Make 1000 crops.
cropper(1000, images, boxes, crops, crop_boxes);
// Finally, lets look at the results
image_window win;
for (size_t i = 0; i < crops.size(); ++i)
{
win.clear_overlay();
win.set_image(crops[i]);
for (auto b : crop_boxes[i])
{
// Note that mmod_rect has an ignore field. If an object was labeled
// ignore in boxes then it will still be labeled as ignore in
// crop_boxes. Moreover, objects that are not well contained within
// the crop are also set to ignore.
if (b.ignore)
win.add_overlay(b.rect, rgb_pixel(255,255,0)); // draw ignored boxes as orange
else
win.add_overlay(b.rect, rgb_pixel(255,0,0)); // draw other boxes as red
}
cout << "Hit enter to view the next random crop.";
cin.get();
}
}
catch(std::exception& e)
{
cout << e.what() << endl;
}