412 lines
16 KiB
C++
412 lines
16 KiB
C++
// Copyright (C) 2011 Davis E. King (davis@dlib.net)
|
|
// License: Boost Software License See LICENSE.txt for the full license.
|
|
#ifndef DLIB_IMAGE_DAtASET_METADATA_CPPh_
|
|
#define DLIB_IMAGE_DAtASET_METADATA_CPPh_
|
|
|
|
#include "image_dataset_metadata.h"
|
|
|
|
#include <fstream>
|
|
#include <sstream>
|
|
#include "../compress_stream.h"
|
|
#include "../base64.h"
|
|
#include "../xml_parser.h"
|
|
#include "../string.h"
|
|
|
|
// ----------------------------------------------------------------------------------------
|
|
|
|
namespace dlib
|
|
{
|
|
namespace image_dataset_metadata
|
|
{
|
|
|
|
// ------------------------------------------------------------------------------------
|
|
|
|
const std::string get_decoded_string();
|
|
void create_image_metadata_stylesheet_file(const std::string& main_filename)
|
|
{
|
|
std::string path;
|
|
std::string::size_type pos = main_filename.find_last_of("/\\");
|
|
if (pos != std::string::npos)
|
|
path = main_filename.substr(0,pos+1);
|
|
|
|
std::ofstream fout((path + "image_metadata_stylesheet.xsl").c_str());
|
|
if (!fout)
|
|
throw dlib::error("ERROR: Unable to open image_metadata_stylesheet.xsl for writing.");
|
|
|
|
fout << get_decoded_string();
|
|
|
|
if (!fout)
|
|
throw dlib::error("ERROR: Unable to write to image_metadata_stylesheet.xsl.");
|
|
}
|
|
|
|
void save_image_dataset_metadata (
|
|
const dataset& meta,
|
|
const std::string& filename
|
|
)
|
|
{
|
|
create_image_metadata_stylesheet_file(filename);
|
|
|
|
const std::vector<image>& images = meta.images;
|
|
|
|
std::ofstream fout(filename.c_str());
|
|
if (!fout)
|
|
throw dlib::error("ERROR: Unable to open " + filename + " for writing.");
|
|
|
|
fout << "<?xml version='1.0' encoding='ISO-8859-1'?>\n";
|
|
fout << "<?xml-stylesheet type='text/xsl' href='image_metadata_stylesheet.xsl'?>\n";
|
|
fout << "<dataset>\n";
|
|
fout << "<name>" << meta.name << "</name>\n";
|
|
fout << "<comment>" << meta.comment << "</comment>\n";
|
|
fout << "<images>\n";
|
|
for (unsigned long i = 0; i < images.size(); ++i)
|
|
{
|
|
fout << " <image file='" << images[i].filename << "'>\n";
|
|
|
|
// save all the boxes
|
|
for (unsigned long j = 0; j < images[i].boxes.size(); ++j)
|
|
{
|
|
const box& b = images[i].boxes[j];
|
|
fout << " <box top='" << b.rect.top() << "' "
|
|
<< "left='" << b.rect.left() << "' "
|
|
<< "width='" << b.rect.width() << "' "
|
|
<< "height='" << b.rect.height() << "'";
|
|
if (b.difficult)
|
|
fout << " difficult='" << b.difficult << "'";
|
|
if (b.truncated)
|
|
fout << " truncated='" << b.truncated << "'";
|
|
if (b.occluded)
|
|
fout << " occluded='" << b.occluded << "'";
|
|
if (b.ignore)
|
|
fout << " ignore='" << b.ignore << "'";
|
|
if (b.angle != 0)
|
|
fout << " angle='" << b.angle << "'";
|
|
if (b.age != 0)
|
|
fout << " age='" << b.age << "'";
|
|
if (b.gender == FEMALE)
|
|
fout << " gender='female'";
|
|
else if (b.gender == MALE)
|
|
fout << " gender='male'";
|
|
if (b.pose != 0)
|
|
fout << " pose='" << b.pose << "'";
|
|
if (b.detection_score != 0)
|
|
fout << " detection_score='" << b.detection_score << "'";
|
|
|
|
if (b.has_label() || b.parts.size() != 0)
|
|
{
|
|
fout << ">\n";
|
|
|
|
if (b.has_label())
|
|
fout << " <label>" << b.label << "</label>\n";
|
|
|
|
// save all the parts
|
|
std::map<std::string,point>::const_iterator itr;
|
|
for (itr = b.parts.begin(); itr != b.parts.end(); ++itr)
|
|
{
|
|
fout << " <part name='"<< itr->first << "' x='"<< itr->second.x() <<"' y='"<< itr->second.y() <<"'/>\n";
|
|
}
|
|
|
|
fout << " </box>\n";
|
|
}
|
|
else
|
|
{
|
|
fout << "/>\n";
|
|
}
|
|
}
|
|
|
|
|
|
|
|
fout << " </image>\n";
|
|
|
|
if (!fout)
|
|
throw dlib::error("ERROR: Unable to write to " + filename + ".");
|
|
}
|
|
fout << "</images>\n";
|
|
fout << "</dataset>";
|
|
}
|
|
|
|
// ------------------------------------------------------------------------------------
|
|
// ------------------------------------------------------------------------------------
|
|
// ------------------------------------------------------------------------------------
|
|
|
|
class doc_handler : public document_handler
|
|
{
|
|
std::vector<std::string> ts;
|
|
image temp_image;
|
|
box temp_box;
|
|
|
|
dataset& meta;
|
|
|
|
public:
|
|
|
|
doc_handler(
|
|
dataset& metadata_
|
|
):
|
|
meta(metadata_)
|
|
{}
|
|
|
|
|
|
virtual void start_document (
|
|
)
|
|
{
|
|
meta = dataset();
|
|
ts.clear();
|
|
temp_image = image();
|
|
temp_box = box();
|
|
}
|
|
|
|
virtual void end_document (
|
|
)
|
|
{
|
|
}
|
|
|
|
virtual void start_element (
|
|
const unsigned long line_number,
|
|
const std::string& name,
|
|
const dlib::attribute_list& atts
|
|
)
|
|
{
|
|
try
|
|
{
|
|
if (ts.size() == 0)
|
|
{
|
|
if (name != "dataset")
|
|
{
|
|
std::ostringstream sout;
|
|
sout << "Invalid XML document. Root tag must be <dataset>. Found <" << name << "> instead.";
|
|
throw dlib::error(sout.str());
|
|
}
|
|
else
|
|
{
|
|
ts.push_back(name);
|
|
return;
|
|
}
|
|
}
|
|
|
|
|
|
if (name == "box")
|
|
{
|
|
if (atts.is_in_list("top")) temp_box.rect.top() = sa = atts["top"];
|
|
else throw dlib::error("<box> missing required attribute 'top'");
|
|
|
|
if (atts.is_in_list("left")) temp_box.rect.left() = sa = atts["left"];
|
|
else throw dlib::error("<box> missing required attribute 'left'");
|
|
|
|
if (atts.is_in_list("width")) temp_box.rect.right() = sa = atts["width"];
|
|
else throw dlib::error("<box> missing required attribute 'width'");
|
|
|
|
if (atts.is_in_list("height")) temp_box.rect.bottom() = sa = atts["height"];
|
|
else throw dlib::error("<box> missing required attribute 'height'");
|
|
|
|
if (atts.is_in_list("difficult")) temp_box.difficult = sa = atts["difficult"];
|
|
if (atts.is_in_list("truncated")) temp_box.truncated = sa = atts["truncated"];
|
|
if (atts.is_in_list("occluded")) temp_box.occluded = sa = atts["occluded"];
|
|
if (atts.is_in_list("ignore")) temp_box.ignore = sa = atts["ignore"];
|
|
if (atts.is_in_list("angle")) temp_box.angle = sa = atts["angle"];
|
|
if (atts.is_in_list("age")) temp_box.age = sa = atts["age"];
|
|
if (atts.is_in_list("gender"))
|
|
{
|
|
if (atts["gender"] == "male")
|
|
temp_box.gender = MALE;
|
|
else if (atts["gender"] == "female")
|
|
temp_box.gender = FEMALE;
|
|
else if (atts["gender"] == "unknown")
|
|
temp_box.gender = UNKNOWN;
|
|
else
|
|
throw dlib::error("Invalid gender string in box attribute.");
|
|
}
|
|
if (atts.is_in_list("pose")) temp_box.pose = sa = atts["pose"];
|
|
if (atts.is_in_list("detection_score")) temp_box.detection_score = sa = atts["detection_score"];
|
|
|
|
temp_box.rect.bottom() += temp_box.rect.top()-1;
|
|
temp_box.rect.right() += temp_box.rect.left()-1;
|
|
}
|
|
else if (name == "part" && ts.back() == "box")
|
|
{
|
|
point temp;
|
|
if (atts.is_in_list("x")) temp.x() = sa = atts["x"];
|
|
else throw dlib::error("<part> missing required attribute 'x'");
|
|
|
|
if (atts.is_in_list("y")) temp.y() = sa = atts["y"];
|
|
else throw dlib::error("<part> missing required attribute 'y'");
|
|
|
|
if (atts.is_in_list("name"))
|
|
{
|
|
if (temp_box.parts.count(atts["name"])==0)
|
|
{
|
|
temp_box.parts[atts["name"]] = temp;
|
|
}
|
|
else
|
|
{
|
|
throw dlib::error("<part> with name '" + atts["name"] + "' is defined more than one time in a single box.");
|
|
}
|
|
}
|
|
else
|
|
{
|
|
throw dlib::error("<part> missing required attribute 'name'");
|
|
}
|
|
}
|
|
else if (name == "image")
|
|
{
|
|
temp_image.boxes.clear();
|
|
|
|
if (atts.is_in_list("file")) temp_image.filename = atts["file"];
|
|
else throw dlib::error("<image> missing required attribute 'file'");
|
|
}
|
|
|
|
ts.push_back(name);
|
|
}
|
|
catch (error& e)
|
|
{
|
|
throw dlib::error("Error on line " + cast_to_string(line_number) + ": " + e.what());
|
|
}
|
|
}
|
|
|
|
virtual void end_element (
|
|
const unsigned long ,
|
|
const std::string& name
|
|
)
|
|
{
|
|
ts.pop_back();
|
|
if (ts.size() == 0)
|
|
return;
|
|
|
|
if (name == "box" && ts.back() == "image")
|
|
{
|
|
temp_image.boxes.push_back(temp_box);
|
|
temp_box = box();
|
|
}
|
|
else if (name == "image" && ts.back() == "images")
|
|
{
|
|
meta.images.push_back(temp_image);
|
|
temp_image = image();
|
|
}
|
|
}
|
|
|
|
virtual void characters (
|
|
const std::string& data
|
|
)
|
|
{
|
|
if (ts.size() == 2 && ts[1] == "name")
|
|
{
|
|
meta.name = trim(data);
|
|
}
|
|
else if (ts.size() == 2 && ts[1] == "comment")
|
|
{
|
|
meta.comment = trim(data);
|
|
}
|
|
else if (ts.size() >= 2 && ts[ts.size()-1] == "label" &&
|
|
ts[ts.size()-2] == "box")
|
|
{
|
|
temp_box.label = trim(data);
|
|
}
|
|
}
|
|
|
|
virtual void processing_instruction (
|
|
const unsigned long ,
|
|
const std::string& ,
|
|
const std::string&
|
|
)
|
|
{
|
|
}
|
|
};
|
|
|
|
// ----------------------------------------------------------------------------------------
|
|
|
|
class xml_error_handler : public error_handler
|
|
{
|
|
public:
|
|
virtual void error (
|
|
const unsigned long
|
|
) { }
|
|
|
|
virtual void fatal_error (
|
|
const unsigned long line_number
|
|
)
|
|
{
|
|
std::ostringstream sout;
|
|
sout << "There is a fatal error on line " << line_number << " so parsing will now halt.";
|
|
throw dlib::error(sout.str());
|
|
}
|
|
};
|
|
|
|
// ------------------------------------------------------------------------------------
|
|
|
|
// Parses the XML dataset file named filename and stores the result in meta.
// Throws dlib::error if the file cannot be opened; the handlers attached to
// the parser throw dlib::error for fatal parse errors and invalid content.
void load_image_dataset_metadata (
    dataset& meta,
    const std::string& filename
)
{
    std::ifstream input(filename.c_str());
    if (!input)
    {
        throw dlib::error("ERROR: unable to open " + filename + " for reading.");
    }

    // The document handler fills in meta; the error handler aborts parsing
    // on fatal errors.
    doc_handler document_events(meta);
    xml_error_handler parse_errors;

    xml_parser parser;
    parser.add_document_handler(document_events);
    parser.add_error_handler(parse_errors);
    parser.parse(input);
}
|
|
|
|
// ------------------------------------------------------------------------------------
|
|
// ------------------------------------------------------------------------------------
|
|
// ------------------------------------------------------------------------------------
|
|
|
|
// This function returns the contents of the file 'image_metadata_stylesheet.xsl'
|
|
const std::string get_decoded_string()
|
|
{
|
|
dlib::base64 base64_coder;
|
|
dlib::compress_stream::kernel_1ea compressor;
|
|
std::ostringstream sout;
|
|
std::istringstream sin;
|
|
|
|
// The base64 encoded data from the file 'image_metadata_stylesheet.xsl' we want to decode and return.
|
|
sout << "PFWfgmWfCHr1DkV63lbjjeY2dCc2FbHDOVh0Kd7dkvaOfRYrOG24f0x77/5iMVq8FtE3UBxtGwSd";
|
|
sout << "1ZHOHRSHgieNoeBv8ssJQ75RRxYtFKRY3OTPX5eKQoCN9jUaUnHnR4QZtEHgmKqXSs50Yrdd+2Ah";
|
|
sout << "gNyarPZCiR6nvqNvCjtP2MP5FxleqNf8Fylatm2KdsXmrv5K87LYVN7i7JMkmZ++cTXYSOxDmxZi";
|
|
sout << "OiCH8funXUdF9apDW547gCjz9HOQUI6dkz5dYUeFjfp6dFugpnaJyyprFLKq048Qk7+QiL4CNF/G";
|
|
sout << "7e0VpBw8dMpiyRNi2fSQGSZGfIAUQKKT6+rPwQoRH2spdjsdXVWj4XQAqBX87nmqMnqjMhn/Vd1s";
|
|
sout << "W5aoC0drwRGu3Xe3gn9vBL8hBkRXcJvEy6q/lb9bYnsLemhE5Zp/+nTmTBjfT9UFYLcsmgsjC+4n";
|
|
sout << "Bq6h9QlpuyMYqJ8RvW8pp3mFlvXc3Yg+18t5F0hSMQfaIFYAuDPU2lVzPpY+ba0B39iu9IrPCLsS";
|
|
sout << "+tUtSNSmQ74CtzZgKKjkTMA3nwYP2SDmZE3firq42pihT7hdU5vYkes69K8AQl8WZyLPpMww+r0z";
|
|
sout << "+veEHPlAuxF7kL3ZvVjdB+xABwwqDe0kSRHRZINYdUfJwJdfYLyDnYoMjj6afqIJZ7QOBPZ42tV5";
|
|
sout << "3hYOQTFwTNovOastzJJXQe1kxPg1AQ8ynmfjjJZqD0xKedlyeJybP919mVAA23UryHsq9TVlabou";
|
|
sout << "qNl3xZW/mKKktvVsd/nuH62HIv/kgomyhaEUY5HgupupBUbQFZfyljZ5bl3g3V3Y1400Z1xTM/LL";
|
|
sout << "LJpeLdlqoGzIe/19vAN1zUUVId9F/OLNUl3Zoar63yZERSJHcsuq/Pasisp0HIGi7rfI9EIQF7C/";
|
|
sout << "IhLKLZsJ+LOycreQGOJALZIEZHOqxYLSXG0qaPM5bQL/MQJ2OZfwEhQgYOrjaM7oPOHHEfTq5kcO";
|
|
sout << "daMwzefKfxrF2GXbUs0bYsEXsIGwENIUKMliFaAI4qKLxxb94oc+O3BRjWueZjZty2zKawQyTHNd";
|
|
sout << "ltFJBUzfffdZN9Wq4zbPzntkM3U6Ys4LRztx5M15dtbhFeKx5rAf2tPXT6wU01hx7EJxBJzpvoDE";
|
|
sout << "YwEoYVDSYulRKpgk82cHFzzUDgWXbl4paFSe1L1w8r9KHr67SYJDTUG86Lrm6LJ0rw73Xp0NAFcU";
|
|
sout << "MKpiG9g1cHW74HYbUb/yAbtVWt40eB7M637umdo2jWz/r/vP5WnfSMXEbkyWebsa1fFceg/TLWy6";
|
|
sout << "E8OTc4XKB48h1oFIlGagOiprxho3+F3TIcxDSwA=";
|
|
|
|
|
|
|
|
// Put the data into the istream sin
|
|
sin.str(sout.str());
|
|
sout.str("");
|
|
|
|
// Decode the base64 text into its compressed binary form
|
|
base64_coder.decode(sin,sout);
|
|
sin.clear();
|
|
sin.str(sout.str());
|
|
sout.str("");
|
|
|
|
// Decompress the data into its original form
|
|
compressor.decompress(sin,sout);
|
|
|
|
// Return the decoded and decompressed data
|
|
return sout.str();
|
|
}
|
|
|
|
|
|
}
|
|
}
|
|
|
|
// ----------------------------------------------------------------------------------------
|
|
|
|
#endif // DLIB_IMAGE_DAtASET_METADATA_CPPh_
|
|
|
|
|