summaryrefslogtreecommitdiffstats
path: root/ml/dlib/examples/random_cropper_ex.cpp
blob: 6b020058d53992ecd457a345528bd827482bdfe4 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
// The contents of this file are in the public domain. See LICENSE_FOR_EXAMPLE_PROGRAMS.txt
/*
    When you are training a convolutional neural network using the loss_mmod loss
    layer, you need to generate a bunch of identically sized training images.  The
    random_cropper is a convenient tool to help you crop out a bunch of
    identically sized images from a training dataset.

    This example shows you what it does exactly and talks about some of its options.
*/


#include <iostream>
#include <dlib/data_io.h>
#include <dlib/gui_widgets.h>
#include <dlib/image_transforms.h>

using namespace std;
using namespace dlib;

// ----------------------------------------------------------------------------------------

int main(int argc, char** argv) try
{
    if (argc != 2)
    {
        cout << "Give an image dataset XML file to run this program." << endl;
        cout << "For example, if you are running from the examples folder then run this program by typing" << endl;
        cout << "   ./random_cropper_ex faces/training.xml" << endl;
        cout << endl;
        return 0;
    }

    // First lets load a dataset
    std::vector<matrix<rgb_pixel>> images;
    std::vector<std::vector<mmod_rect>> boxes;
    load_image_dataset(images, boxes, argv[1]);

    // Here we make our random_cropper.  It has a number of options. 
    random_cropper cropper;
    // We can tell it how big we want the cropped images to be.
    cropper.set_chip_dims(400,400);
    // Also, when doing cropping, it will map the object annotations from the
    // dataset to the cropped image as well as perform random scale jittering.
    // You can tell it how much scale jittering you would like by saying "please
    // make the objects in the crops have a min and max size of such and such".
    // You do that by calling these two functions.  Here we are saying we want the
    // objects in our crops to be no more than 0.8*400 pixels in height and width.
    cropper.set_max_object_size(0.8);
    // And also that they shouldn't be too small. Specifically, each object's smallest
    // dimension (i.e. height or width) should be at least 60 pixels and at least one of
    // the dimensions must be at least 80 pixels.  So the smallest objects the cropper will
    // output will be either 80x60 or 60x80.
    cropper.set_min_object_size(80,60);
    // The cropper can also randomly mirror and rotate crops, which we ask it to
    // perform as well.
    cropper.set_randomly_flip(true);
    cropper.set_max_rotation_degrees(50);
    // This fraction of crops are from random parts of images, rather than being centered
    // on some object.
    cropper.set_background_crops_fraction(0.2);

    // Now ask the cropper to generate a bunch of crops.  The output is stored in
    // crops and crop_boxes.
    std::vector<matrix<rgb_pixel>> crops;
    std::vector<std::vector<mmod_rect>> crop_boxes;
    // Make 1000 crops.
    cropper(1000, images, boxes, crops, crop_boxes);

    // Finally, lets look at the results
    image_window win;
    for (size_t i = 0; i < crops.size(); ++i)
    {
        win.clear_overlay();
        win.set_image(crops[i]);
        for (auto b : crop_boxes[i])
        {
            // Note that mmod_rect has an ignore field.  If an object was labeled
            // ignore in boxes then it will still be labeled as ignore in
            // crop_boxes.  Moreover, objects that are not well contained within
            // the crop are also set to ignore.
            if (b.ignore)
                win.add_overlay(b.rect, rgb_pixel(255,255,0)); // draw ignored boxes as orange 
            else
                win.add_overlay(b.rect, rgb_pixel(255,0,0));   // draw other boxes as red
        }
        cout << "Hit enter to view the next random crop.";
        cin.get();
    }

}
catch(std::exception& e)
{
    cout << e.what() << endl;
}