Commit 2ec4f6846ef196b629677d4dfac4d026ea51fd19
Minor updates.
Showing
9 changed files
with
432 additions
and
63 deletions
openbr/core/eval.cpp
| @@ -130,6 +130,12 @@ float Evaluate(const Mat &simmat, const Mat &mask, const QString &csv) | @@ -130,6 +130,12 @@ float Evaluate(const Mat &simmat, const Mat &mask, const QString &csv) | ||
| 130 | qFatal("Similarity matrix (%ix%i) differs in size from mask matrix (%ix%i).", | 130 | qFatal("Similarity matrix (%ix%i) differs in size from mask matrix (%ix%i).", |
| 131 | simmat.rows, simmat.cols, mask.rows, mask.cols); | 131 | simmat.rows, simmat.cols, mask.rows, mask.cols); |
| 132 | 132 | ||
| 133 | + if (simmat.type() != CV_32FC1) | ||
| 134 | + qFatal("Invalid simmat format"); | ||
| 135 | + | ||
| 136 | + if (mask.type() != CV_8UC1) | ||
| 137 | + qFatal("Invalid mask format"); | ||
| 138 | + | ||
| 133 | float result = -1; | 139 | float result = -1; |
| 134 | 140 | ||
| 135 | // Make comparisons | 141 | // Make comparisons |
| @@ -427,84 +433,106 @@ static QStringList computeDetectionResults(const QList<ResolvedDetection> &detec | @@ -427,84 +433,106 @@ static QStringList computeDetectionResults(const QList<ResolvedDetection> &detec | ||
| 427 | return lines; | 433 | return lines; |
| 428 | } | 434 | } |
| 429 | 435 | ||
| 430 | -QString getDetectKey(const TemplateList &templates) | 436 | +struct DetectionKey : public QString |
| 437 | +{ | ||
| 438 | + enum Type { | ||
| 439 | + Invalid, | ||
| 440 | + Rect, | ||
| 441 | + RectList, | ||
| 442 | + XYWidthHeight | ||
| 443 | + } type; | ||
| 444 | + | ||
| 445 | + DetectionKey(const QString &key = "", Type type = Invalid) | ||
| 446 | + : QString(key), type(type) {} | ||
| 447 | +}; | ||
| 448 | + | ||
| 449 | +static DetectionKey getDetectKey(const FileList &files) | ||
| 431 | { | 450 | { |
| 432 | - const File &f = templates.first().file; | ||
| 433 | - foreach (const QString &key, f.localKeys()) { | ||
| 434 | - // first check for single detections | 451 | + if (files.empty()) |
| 452 | + return DetectionKey(); | ||
| 453 | + | ||
| 454 | + const File &f = files.first(); | ||
| 455 | + const QStringList localKeys = f.localKeys(); | ||
| 456 | + | ||
| 457 | + // first check for single detections | ||
| 458 | + foreach (const QString &key, localKeys) | ||
| 435 | if (!f.get<QRectF>(key, QRectF()).isNull()) | 459 | if (!f.get<QRectF>(key, QRectF()).isNull()) |
| 436 | - return key; | ||
| 437 | - } | 460 | + return DetectionKey(key, DetectionKey::Rect); |
| 461 | + | ||
| 438 | // and then multiple | 462 | // and then multiple |
| 439 | if (!f.rects().empty()) | 463 | if (!f.rects().empty()) |
| 440 | - return "Rects"; | ||
| 441 | - return ""; | ||
| 442 | -} | 464 | + return DetectionKey("Rects", DetectionKey::RectList); |
| 443 | 465 | ||
| 444 | -bool detectKeyIsList(QString key, const TemplateList &templates) | ||
| 445 | -{ | ||
| 446 | - return templates.first().file.get<QRectF>(key, QRectF()).isNull(); | 466 | + // check for <Key>_X, <Key>_Y, <Key>_Width, <Key>_Height |
| 467 | + foreach (const QString &localKey, localKeys) { | ||
| 468 | + if (!localKey.endsWith("_X")) | ||
| 469 | + continue; | ||
| 470 | + const QString key = localKey.mid(0, localKey.size()-2); | ||
| 471 | + if (localKeys.contains(key+"_Y") && | ||
| 472 | + localKeys.contains(key+"_Width") && | ||
| 473 | + localKeys.contains(key+"_Height")) | ||
| 474 | + return DetectionKey(key, DetectionKey::XYWidthHeight); | ||
| 475 | + } | ||
| 476 | + | ||
| 477 | + return DetectionKey(); | ||
| 447 | } | 478 | } |
| 448 | 479 | ||
| 449 | -// return a list of detections whether the template holds | ||
| 450 | -// multiple detections or a single detection | ||
| 451 | -QList<Detection> getDetections(QString key, const Template &t, bool isList, bool isTruth) | 480 | +// return a list of detections independent of the detection key format |
| 481 | +static QList<Detection> getDetections(const DetectionKey &key, const File &f, bool isTruth) | ||
| 452 | { | 482 | { |
| 453 | - File f = t.file; | ||
| 454 | QList<Detection> dets; | 483 | QList<Detection> dets; |
| 455 | - if (isList) { | 484 | + if (key.type == DetectionKey::RectList) { |
| 456 | QList<QRectF> rects = f.rects(); | 485 | QList<QRectF> rects = f.rects(); |
| 457 | QList<float> confidences = f.getList<float>("Confidences", QList<float>()); | 486 | QList<float> confidences = f.getList<float>("Confidences", QList<float>()); |
| 458 | if (!isTruth && rects.size() != confidences.size()) | 487 | if (!isTruth && rects.size() != confidences.size()) |
| 459 | qFatal("You don't have enough confidence. I mean, your detections don't all have confidence measures."); | 488 | qFatal("You don't have enough confidence. I mean, your detections don't all have confidence measures."); |
| 460 | for (int i=0; i<rects.size(); i++) { | 489 | for (int i=0; i<rects.size(); i++) { |
| 461 | if (isTruth) | 490 | if (isTruth) |
| 462 | - dets.append(Detection(rects.at(i))); | 491 | + dets.append(Detection(rects[i])); |
| 463 | else | 492 | else |
| 464 | - dets.append(Detection(rects.at(i), confidences.at(i))); | 493 | + dets.append(Detection(rects[i], confidences[i])); |
| 465 | } | 494 | } |
| 466 | - } else { | ||
| 467 | - if (isTruth) | ||
| 468 | - dets.append(Detection(f.get<QRectF>(key))); | ||
| 469 | - else | ||
| 470 | - dets.append(Detection(f.get<QRectF>(key), f.get<float>("Confidence", -1))); | 495 | + } else if (key.type == DetectionKey::Rect) { |
| 496 | + dets.append(Detection(f.get<QRectF>(key), isTruth ? -1 : f.get<float>("Confidence", -1))); | ||
| 497 | + } else if (key.type == DetectionKey::XYWidthHeight) { | ||
| 498 | + const QRectF rect(f.get<float>(key+"_X"), f.get<float>(key+"_Y"), f.get<float>(key+"_Width"), f.get<float>(key+"_Height")); | ||
| 499 | + dets.append(Detection(rect, isTruth ? -1 : f.get<float>("Confidence", -1))); | ||
| 471 | } | 500 | } |
| 472 | return dets; | 501 | return dets; |
| 473 | } | 502 | } |
| 474 | 503 | ||
| 475 | -QMap<QString, Detections> getDetections(const TemplateList &predicted, const TemplateList &truth) | 504 | +static QMap<QString, Detections> getDetections(const File &predictedGallery, const File &truthGallery) |
| 476 | { | 505 | { |
| 506 | + const FileList predicted = TemplateList::fromGallery(predictedGallery).files(); | ||
| 507 | + const FileList truth = TemplateList::fromGallery(truthGallery).files(); | ||
| 508 | + | ||
| 477 | // Figure out which metadata field contains a bounding box | 509 | // Figure out which metadata field contains a bounding box |
| 478 | - QString truthDetectKey = getDetectKey(truth); | ||
| 479 | - if (truthDetectKey.isEmpty()) qFatal("No suitable ground truth metadata key found."); | ||
| 480 | - QString predictedDetectKey = getDetectKey(predicted); | ||
| 481 | - if (predictedDetectKey.isEmpty()) qFatal("No suitable predicted metadata key found."); | 510 | + DetectionKey truthDetectKey = getDetectKey(truth); |
| 511 | + if (truthDetectKey.isEmpty()) | ||
| 512 | + qFatal("No suitable ground truth metadata key found."); | ||
| 513 | + | ||
| 514 | + DetectionKey predictedDetectKey = getDetectKey(predicted); | ||
| 515 | + if (predictedDetectKey.isEmpty()) | ||
| 516 | + qFatal("No suitable predicted metadata key found."); | ||
| 517 | + | ||
| 482 | qDebug("Using metadata key: %s%s", | 518 | qDebug("Using metadata key: %s%s", |
| 483 | qPrintable(predictedDetectKey), | 519 | qPrintable(predictedDetectKey), |
| 484 | qPrintable(predictedDetectKey == truthDetectKey ? QString() : "/"+truthDetectKey)); | 520 | qPrintable(predictedDetectKey == truthDetectKey ? QString() : "/"+truthDetectKey)); |
| 485 | 521 | ||
| 486 | QMap<QString, Detections> allDetections; | 522 | QMap<QString, Detections> allDetections; |
| 487 | - bool predKeyIsList = detectKeyIsList(predictedDetectKey, predicted); | ||
| 488 | - bool truthKeyIsList = detectKeyIsList(truthDetectKey, truth); | ||
| 489 | - foreach (const Template &t, predicted) { | ||
| 490 | - QList<Detection> dets = getDetections(predictedDetectKey, t, predKeyIsList, false); | ||
| 491 | - allDetections[t.file.baseName()].predicted.append(dets); | ||
| 492 | - } | ||
| 493 | - foreach (const Template &t, truth) { | ||
| 494 | - QList<Detection> dets = getDetections(truthDetectKey, t, truthKeyIsList, true); | ||
| 495 | - allDetections[t.file.baseName()].truth.append(dets); | ||
| 496 | - } | 523 | + foreach (const File &f, predicted) |
| 524 | + allDetections[f.baseName()].predicted.append(getDetections(predictedDetectKey, f, false)); | ||
| 525 | + foreach (const File &f, truth) | ||
| 526 | + allDetections[f.baseName()].truth.append(getDetections(truthDetectKey, f, true)); | ||
| 497 | return allDetections; | 527 | return allDetections; |
| 498 | } | 528 | } |
| 499 | 529 | ||
| 500 | float EvalDetection(const QString &predictedGallery, const QString &truthGallery, const QString &csv) | 530 | float EvalDetection(const QString &predictedGallery, const QString &truthGallery, const QString &csv) |
| 501 | { | 531 | { |
| 502 | qDebug("Evaluating detection of %s against %s", qPrintable(predictedGallery), qPrintable(truthGallery)); | 532 | qDebug("Evaluating detection of %s against %s", qPrintable(predictedGallery), qPrintable(truthGallery)); |
| 503 | - const TemplateList predicted(TemplateList::fromGallery(predictedGallery)); | ||
| 504 | - const TemplateList truth(TemplateList::fromGallery(truthGallery)); | ||
| 505 | 533 | ||
| 506 | // Organized by file, QMap used to preserve order | 534 | // Organized by file, QMap used to preserve order |
| 507 | - QMap<QString, Detections> allDetections = getDetections(predicted, truth); | 535 | + QMap<QString, Detections> allDetections = getDetections(predictedGallery, truthGallery); |
| 508 | 536 | ||
| 509 | QList<ResolvedDetection> resolvedDetections, falseNegativeDetections; | 537 | QList<ResolvedDetection> resolvedDetections, falseNegativeDetections; |
| 510 | int totalTrueDetections = 0; | 538 | int totalTrueDetections = 0; |
openbr/janus.cpp
| @@ -77,15 +77,23 @@ janus_error janus_finalize_template(janus_template template_, janus_flat_templat | @@ -77,15 +77,23 @@ janus_error janus_finalize_template(janus_template template_, janus_flat_templat | ||
| 77 | { | 77 | { |
| 78 | *bytes = 0; | 78 | *bytes = 0; |
| 79 | foreach (const cv::Mat &m, *template_) { | 79 | foreach (const cv::Mat &m, *template_) { |
| 80 | - assert(m.isContinuous()); | 80 | + if (!m.data) |
| 81 | + continue; | ||
| 82 | + | ||
| 83 | + if (!m.isContinuous()) | ||
| 84 | + return JANUS_UNKNOWN_ERROR; | ||
| 85 | + | ||
| 81 | const size_t templateBytes = m.rows * m.cols * m.elemSize(); | 86 | const size_t templateBytes = m.rows * m.cols * m.elemSize(); |
| 82 | if (*bytes + sizeof(size_t) + templateBytes > janus_max_template_size()) | 87 | if (*bytes + sizeof(size_t) + templateBytes > janus_max_template_size()) |
| 83 | break; | 88 | break; |
| 89 | + | ||
| 84 | memcpy(flat_template, &templateBytes, sizeof(templateBytes)); | 90 | memcpy(flat_template, &templateBytes, sizeof(templateBytes)); |
| 85 | flat_template += sizeof(templateBytes); | 91 | flat_template += sizeof(templateBytes); |
| 92 | + *bytes += sizeof(templateBytes); | ||
| 93 | + | ||
| 86 | memcpy(flat_template, m.data, templateBytes); | 94 | memcpy(flat_template, m.data, templateBytes); |
| 87 | flat_template += templateBytes; | 95 | flat_template += templateBytes; |
| 88 | - *bytes += sizeof(size_t) + templateBytes; | 96 | + *bytes += templateBytes; |
| 89 | } | 97 | } |
| 90 | 98 | ||
| 91 | delete template_; | 99 | delete template_; |
openbr/plugins/cascade.cpp
| @@ -19,12 +19,144 @@ | @@ -19,12 +19,144 @@ | ||
| 19 | #include "openbr_internal.h" | 19 | #include "openbr_internal.h" |
| 20 | #include "openbr/core/opencvutils.h" | 20 | #include "openbr/core/opencvutils.h" |
| 21 | #include "openbr/core/resource.h" | 21 | #include "openbr/core/resource.h" |
| 22 | +#include <QProcess> | ||
| 22 | 23 | ||
| 23 | using namespace cv; | 24 | using namespace cv; |
| 25 | + | ||
| 26 | +struct TrainParams | ||
| 27 | +{ | ||
| 28 | + QString data; // REQUIRED: Filepath to store trained classifier | ||
| 29 | + QString vec; // REQUIRED: Filepath to store vector of positive samples, default "vector" | ||
| 30 | + QString img; // Filepath to source object image. Either this or info is REQUIRED | ||
| 31 | + QString info; // Description file of source images. Either this or img is REQUIRED | ||
| 32 | + QString bg; // REQUIRED: Filepath to background list file | ||
| 33 | + int num; // Number of samples to generate | ||
| 34 | + int bgcolor; // Background color supplied image (via img) | ||
| 35 | + int bgthresh; // Threshold to determine bgcolor match | ||
| 36 | + bool inv; // Invert colors | ||
| 37 | + bool randinv; // Randomly invert colors | ||
| 38 | + int maxidev; // Max intensity deviation of foreground pixels | ||
| 39 | + double maxxangle; // Maximum rotation angle (X) | ||
| 40 | + double maxyangle; // Maximum rotation angle (Y) | ||
| 41 | + double maxzangle; // Maximum rotation angle (Z) | ||
| 42 | + bool show; // Show generated samples | ||
| 43 | + int w; // REQUIRED: Sample width | ||
| 44 | + int h; // REQUIRED: Sample height | ||
| 45 | + int numPos; // Number of positive samples | ||
| 46 | + int numNeg; // Number of negative samples | ||
| 47 | + int numStages; // Number of stages | ||
| 48 | + int precalcValBufSize; // Precalculated val buffer size in Mb | ||
| 49 | + int precalcIdxBufSize; // Precalculated index buffer size in Mb | ||
| 50 | + bool baseFormatSave; // Save in old format | ||
| 51 | + QString stageType; // Stage type (BOOST) | ||
| 52 | + QString featureType; // Feature type (HAAR, LBP) | ||
| 53 | + QString bt; // Boosted classifier type (DAB, RAB, LB, GAB) | ||
| 54 | + double minHitRate; // Minimal hit rate per stage | ||
| 55 | + double maxFalseAlarmRate; // Max false alarm rate per stage | ||
| 56 | + double weightTrimRate; // Weight for trimming | ||
| 57 | + int maxDepth; // Max weak tree depth | ||
| 58 | + int maxWeakCount; // Max weak tree count per stage | ||
| 59 | + QString mode; // Haar feature mode (BASIC, CORE, ALL) | ||
| 24 | 60 | ||
| 25 | -namespace br | 61 | + TrainParams() |
| 62 | + { | ||
| 63 | + num = -1; | ||
| 64 | + maxidev = -1; | ||
| 65 | + maxxangle = -1; | ||
| 66 | + maxyangle = -1; | ||
| 67 | + maxzangle = -1; | ||
| 68 | + w = -1; | ||
| 69 | + h = -1; | ||
| 70 | + numPos = -1; | ||
| 71 | + numNeg = -1; | ||
| 72 | + numStages = -1; | ||
| 73 | + precalcValBufSize = -1; | ||
| 74 | + precalcIdxBufSize = -1; | ||
| 75 | + minHitRate = -1; | ||
| 76 | + maxFalseAlarmRate = -1; | ||
| 77 | + weightTrimRate = -1; | ||
| 78 | + maxDepth = -1; | ||
| 79 | + maxWeakCount = -1; | ||
| 80 | + inv = false; | ||
| 81 | + randinv = false; | ||
| 82 | + show = false; | ||
| 83 | + baseFormatSave = false; | ||
| 84 | + vec = "vector.vec"; | ||
| 85 | + bgcolor = -1; | ||
| 86 | + bgthresh = -1; | ||
| 87 | + } | ||
| 88 | +}; | ||
| 89 | + | ||
| 90 | +static QStringList buildTrainingArgs(const TrainParams ¶ms) | ||
| 91 | +{ | ||
| 92 | + QStringList args; | ||
| 93 | + if (params.data != "") args << "-data" << params.data; | ||
| 94 | + else qFatal("Must specify storage location for cascade"); | ||
| 95 | + if (params.vec != "") args << "-vec" << params.vec; | ||
| 96 | + else qFatal("Must specify location of positive vector"); | ||
| 97 | + if (params.bg != "") args << "-bg" << params.bg; | ||
| 98 | + else qFatal("Must specify negative images"); | ||
| 99 | + if (params.numPos >= 0) args << "-numPos" << QString::number(params.numPos); | ||
| 100 | + if (params.numNeg >= 0) args << "-numNeg" << QString::number(params.numNeg); | ||
| 101 | + if (params.numStages >= 0) args << "-numStages" << QString::number(params.numStages); | ||
| 102 | + if (params.precalcValBufSize >= 0) args << "-precalcValBufSize" << QString::number(params.precalcValBufSize); | ||
| 103 | + if (params.precalcIdxBufSize >= 0) args << "-precalcIdxBufSize" << QString::number(params.precalcIdxBufSize); | ||
| 104 | + if (params.baseFormatSave) args << "-baseFormatSave"; | ||
| 105 | + if (params.stageType != "") args << "-stageType" << params.stageType; | ||
| 106 | + if (params.featureType != "") args << "-featureType" << params.featureType; | ||
| 107 | + if (params.w >= 0) args << "-w" << QString::number(params.w); | ||
| 108 | + else qFatal("Must specify width"); | ||
| 109 | + if (params.h >= 0) args << "-h" << QString::number(params.h); | ||
| 110 | + else qFatal("Must specify height"); | ||
| 111 | + if (params.bt != "") args << "-bt" << params.bt; | ||
| 112 | + if (params.minHitRate >= 0) args << "-minHitRate" << QString::number(params.minHitRate); | ||
| 113 | + if (params.maxFalseAlarmRate >= 0) args << "-maxFalseAlarmRate" << QString::number(params.maxFalseAlarmRate); | ||
| 114 | + if (params.weightTrimRate >= 0) args << "-weightTrimRate" << QString::number(params.weightTrimRate); | ||
| 115 | + if (params.maxDepth >= 0) args << "-maxDepth" << QString::number(params.maxDepth); | ||
| 116 | + if (params.maxWeakCount >= 0) args << "-maxWeakCount" << QString::number(params.maxWeakCount); | ||
| 117 | + if (params.mode != "") args << "-mode" << params.mode; | ||
| 118 | + return args; | ||
| 119 | +} | ||
| 120 | + | ||
| 121 | +static QStringList buildSampleArgs(const TrainParams ¶ms) | ||
| 122 | +{ | ||
| 123 | + QStringList args; | ||
| 124 | + if (params.vec != "") args << "-vec" << params.vec; | ||
| 125 | + else qFatal("Must specify location of positive vector"); | ||
| 126 | + if (params.img != "") args << "-img" << params.img; | ||
| 127 | + else if (params.info != "") args << "-info" << params.info; | ||
| 128 | + else qFatal("Must specify positive images"); | ||
| 129 | + if (params.bg != "") args << "-bg" << params.bg; | ||
| 130 | + if (params.num > 0) args << "-num" << QString::number(params.num); | ||
| 131 | + if (params.bgcolor >=0 ) args << "-bgcolor" << QString::number(params.bgcolor); | ||
| 132 | + if (params.bgthresh >= 0) args << "-bgthresh" << QString::number(params.bgthresh); | ||
| 133 | + if (params.maxidev >= 0) args << "-maxidev" << QString::number(params.maxidev); | ||
| 134 | + if (params.maxxangle >= 0) args << "-maxxangle" << QString::number(params.maxxangle); | ||
| 135 | + if (params.maxyangle >= 0) args << "-maxyangle" << QString::number(params.maxyangle); | ||
| 136 | + if (params.maxzangle >= 0) args << "-maxzangle" << QString::number(params.maxzangle); | ||
| 137 | + if (params.w >= 0) args << "-w" << QString::number(params.w); | ||
| 138 | + if (params.h >= 0) args << "-h" << QString::number(params.h); | ||
| 139 | + if (params.show) args << "-show"; | ||
| 140 | + if (params.inv) args << "-inv"; | ||
| 141 | + if (params.randinv) args << "-randinv"; | ||
| 142 | + return args; | ||
| 143 | +} | ||
| 144 | + | ||
| 145 | +static void genSamples(const TrainParams ¶ms) | ||
| 26 | { | 146 | { |
| 147 | + const QStringList cmdArgs = buildSampleArgs(params); | ||
| 148 | + QProcess::execute("opencv_createsamples",cmdArgs); | ||
| 149 | +} | ||
| 27 | 150 | ||
| 151 | +static void trainCascade(const TrainParams ¶ms) | ||
| 152 | +{ | ||
| 153 | + const QStringList cmdArgs = buildTrainingArgs(params); | ||
| 154 | + QProcess::execute("opencv_traincascade", cmdArgs); | ||
| 155 | +} | ||
| 156 | + | ||
| 157 | +namespace br | ||
| 158 | +{ | ||
| 159 | + | ||
| 28 | class CascadeResourceMaker : public ResourceMaker<CascadeClassifier> | 160 | class CascadeResourceMaker : public ResourceMaker<CascadeClassifier> |
| 29 | { | 161 | { |
| 30 | QString file; | 162 | QString file; |
| @@ -37,7 +169,20 @@ public: | @@ -37,7 +169,20 @@ public: | ||
| 37 | else if (model == "Eye") file += "haarcascades/haarcascade_eye_tree_eyeglasses.xml"; | 169 | else if (model == "Eye") file += "haarcascades/haarcascade_eye_tree_eyeglasses.xml"; |
| 38 | else if (model == "FrontalFace") file += "haarcascades/haarcascade_frontalface_alt2.xml"; | 170 | else if (model == "FrontalFace") file += "haarcascades/haarcascade_frontalface_alt2.xml"; |
| 39 | else if (model == "ProfileFace") file += "haarcascades/haarcascade_profileface.xml"; | 171 | else if (model == "ProfileFace") file += "haarcascades/haarcascade_profileface.xml"; |
| 40 | - else qFatal("Invalid model."); | 172 | + else{ |
| 173 | + // Create temp folder if does not exist | ||
| 174 | + file = model+QDir::separator()+"cascade.xml"; | ||
| 175 | + QDir dir(model); | ||
| 176 | + if (!dir.exists()) | ||
| 177 | + if (!QDir::current().mkdir(model)) qFatal("Cannot create model."); | ||
| 178 | + | ||
| 179 | + // Make sure file can be created | ||
| 180 | + QFile pathTest(file); | ||
| 181 | + if (pathTest.exists()) pathTest.remove(); | ||
| 182 | + | ||
| 183 | + if (!pathTest.open(QIODevice::WriteOnly | QIODevice::Text)) qFatal("Cannot create model."); | ||
| 184 | + pathTest.remove(); | ||
| 185 | + } | ||
| 41 | } | 186 | } |
| 42 | 187 | ||
| 43 | private: | 188 | private: |
| @@ -54,16 +199,60 @@ private: | @@ -54,16 +199,60 @@ private: | ||
| 54 | * \ingroup transforms | 199 | * \ingroup transforms |
| 55 | * \brief Wraps OpenCV cascade classifier | 200 | * \brief Wraps OpenCV cascade classifier |
| 56 | * \author Josh Klontz \cite jklontz | 201 | * \author Josh Klontz \cite jklontz |
| 202 | + * \author David Crouse \cite dgcrouse | ||
| 57 | */ | 203 | */ |
| 58 | -class CascadeTransform : public UntrainableMetaTransform | 204 | +class CascadeTransform : public MetaTransform |
| 59 | { | 205 | { |
| 60 | Q_OBJECT | 206 | Q_OBJECT |
| 61 | Q_PROPERTY(QString model READ get_model WRITE set_model RESET reset_model STORED false) | 207 | Q_PROPERTY(QString model READ get_model WRITE set_model RESET reset_model STORED false) |
| 62 | Q_PROPERTY(int minSize READ get_minSize WRITE set_minSize RESET reset_minSize STORED false) | 208 | Q_PROPERTY(int minSize READ get_minSize WRITE set_minSize RESET reset_minSize STORED false) |
| 63 | Q_PROPERTY(bool ROCMode READ get_ROCMode WRITE set_ROCMode RESET reset_ROCMode STORED false) | 209 | Q_PROPERTY(bool ROCMode READ get_ROCMode WRITE set_ROCMode RESET reset_ROCMode STORED false) |
| 210 | + | ||
| 211 | + // Training parameters | ||
| 212 | + Q_PROPERTY(int numStages READ get_numStages WRITE set_numStages RESET reset_numStages STORED false) | ||
| 213 | + Q_PROPERTY(int w READ get_w WRITE set_w RESET reset_w STORED false) | ||
| 214 | + Q_PROPERTY(int h READ get_h WRITE set_h RESET reset_h STORED false) | ||
| 215 | + Q_PROPERTY(int numPos READ get_numPos WRITE set_numPos RESET reset_numPos STORED false) | ||
| 216 | + Q_PROPERTY(int numNeg READ get_numNeg WRITE set_numNeg RESET reset_numNeg STORED false) | ||
| 217 | + Q_PROPERTY(int precalcValBufSize READ get_precalcValBufSize WRITE set_precalcValBufSize RESET reset_precalcValBufSize STORED false) | ||
| 218 | + Q_PROPERTY(int precalcIdxBufSize READ get_precalcIdxBufSize WRITE set_precalcIdxBufSize RESET reset_precalcIdxBufSize STORED false) | ||
| 219 | + Q_PROPERTY(double minHitRate READ get_minHitRate WRITE set_minHitRate RESET reset_minHitRate STORED false) | ||
| 220 | + Q_PROPERTY(double maxFalseAlarmRate READ get_maxFalseAlarmRate WRITE set_maxFalseAlarmRate RESET reset_maxFalseAlarmRate STORED false) | ||
| 221 | + Q_PROPERTY(double weightTrimRate READ get_weightTrimRate WRITE set_weightTrimRate RESET reset_weightTrimRate STORED false) | ||
| 222 | + Q_PROPERTY(int maxDepth READ get_maxDepth WRITE set_maxDepth RESET reset_maxDepth STORED false) | ||
| 223 | + Q_PROPERTY(int maxWeakCount READ get_maxWeakCount WRITE set_maxWeakCount RESET reset_maxWeakCount STORED false) | ||
| 224 | + Q_PROPERTY(QString stageType READ get_stageType WRITE set_stageType RESET reset_stageType STORED false) | ||
| 225 | + Q_PROPERTY(QString featureType READ get_featureType WRITE set_featureType RESET reset_featureType STORED false) | ||
| 226 | + Q_PROPERTY(QString bt READ get_bt WRITE set_bt RESET reset_bt STORED false) | ||
| 227 | + Q_PROPERTY(QString mode READ get_mode WRITE set_mode RESET reset_mode STORED false) | ||
| 228 | + Q_PROPERTY(bool show READ get_show WRITE set_show RESET reset_show STORED false) | ||
| 229 | + Q_PROPERTY(bool baseFormatSave READ get_baseFormatSave WRITE set_baseFormatSave RESET reset_baseFormatSave STORED false) | ||
| 230 | + Q_PROPERTY(bool overwrite READ get_overwrite WRITE set_overwrite RESET reset_overwrite STORED false) | ||
| 231 | + | ||
| 64 | BR_PROPERTY(QString, model, "FrontalFace") | 232 | BR_PROPERTY(QString, model, "FrontalFace") |
| 65 | BR_PROPERTY(int, minSize, 64) | 233 | BR_PROPERTY(int, minSize, 64) |
| 66 | BR_PROPERTY(bool, ROCMode, false) | 234 | BR_PROPERTY(bool, ROCMode, false) |
| 235 | + | ||
| 236 | + // Training parameters - Default values provided trigger OpenCV defaults | ||
| 237 | + BR_PROPERTY(int, numStages, -1) | ||
| 238 | + BR_PROPERTY(int, w, -1) | ||
| 239 | + BR_PROPERTY(int, h, -1) | ||
| 240 | + BR_PROPERTY(int, numPos, -1) | ||
| 241 | + BR_PROPERTY(int, numNeg, -1) | ||
| 242 | + BR_PROPERTY(int, precalcValBufSize, -1) | ||
| 243 | + BR_PROPERTY(int, precalcIdxBufSize, -1) | ||
| 244 | + BR_PROPERTY(double, minHitRate, -1) | ||
| 245 | + BR_PROPERTY(double, maxFalseAlarmRate, -1) | ||
| 246 | + BR_PROPERTY(double, weightTrimRate, -1) | ||
| 247 | + BR_PROPERTY(int, maxDepth, -1) | ||
| 248 | + BR_PROPERTY(int, maxWeakCount, -1) | ||
| 249 | + BR_PROPERTY(QString, stageType, "") | ||
| 250 | + BR_PROPERTY(QString, featureType, "") | ||
| 251 | + BR_PROPERTY(QString, bt, "") | ||
| 252 | + BR_PROPERTY(QString, mode, "") | ||
| 253 | + BR_PROPERTY(bool, show, false) | ||
| 254 | + BR_PROPERTY(bool, baseFormatSave, false) | ||
| 255 | + BR_PROPERTY(bool, overwrite, false) | ||
| 67 | 256 | ||
| 68 | Resource<CascadeClassifier> cascadeResource; | 257 | Resource<CascadeClassifier> cascadeResource; |
| 69 | 258 | ||
| @@ -71,6 +260,136 @@ class CascadeTransform : public UntrainableMetaTransform | @@ -71,6 +260,136 @@ class CascadeTransform : public UntrainableMetaTransform | ||
| 71 | { | 260 | { |
| 72 | cascadeResource.setResourceMaker(new CascadeResourceMaker(model)); | 261 | cascadeResource.setResourceMaker(new CascadeResourceMaker(model)); |
| 73 | } | 262 | } |
| 263 | + | ||
| 264 | + // Train transform | ||
| 265 | + void train(const TemplateList& data) | ||
| 266 | + { | ||
| 267 | + if (overwrite) { | ||
| 268 | + QDir dataDir(model); | ||
| 269 | + if (dataDir.exists()) { | ||
| 270 | + dataDir.removeRecursively(); | ||
| 271 | + QDir::current().mkdir(model); | ||
| 272 | + } | ||
| 273 | + } | ||
| 274 | + | ||
| 275 | + const FileList files = data.files(); | ||
| 276 | + | ||
| 277 | + // Open positive and negative list files | ||
| 278 | + const QString posFName = "pos.txt"; | ||
| 279 | + const QString negFName = "neg.txt"; | ||
| 280 | + QFile posFile(posFName); | ||
| 281 | + QFile negFile(negFName); | ||
| 282 | + posFile.open(QIODevice::WriteOnly | QIODevice::Text); | ||
| 283 | + negFile.open(QIODevice::WriteOnly | QIODevice::Text); | ||
| 284 | + QTextStream posStream(&posFile); | ||
| 285 | + QTextStream negStream(&negFile); | ||
| 286 | + | ||
| 287 | + const QString endln = "\r\n"; | ||
| 288 | + | ||
| 289 | + int posCount = 0; | ||
| 290 | + int negCount = 0; | ||
| 291 | + | ||
| 292 | + bool buildPos = false; // If true, build positive vector from single image | ||
| 293 | + | ||
| 294 | + TrainParams params; | ||
| 295 | + | ||
| 296 | + // Fill in from params (param defaults are same as struct defaults, so no checks are needed) | ||
| 297 | + params.numStages = numStages; | ||
| 298 | + params.w = w; | ||
| 299 | + params.h = h; | ||
| 300 | + params.numPos = numPos; | ||
| 301 | + params.numNeg = numNeg; | ||
| 302 | + params.precalcValBufSize = precalcValBufSize; | ||
| 303 | + params.precalcIdxBufSize = precalcIdxBufSize; | ||
| 304 | + params.minHitRate = minHitRate; | ||
| 305 | + params.maxFalseAlarmRate = maxFalseAlarmRate; | ||
| 306 | + params.weightTrimRate = weightTrimRate; | ||
| 307 | + params.maxDepth = maxDepth; | ||
| 308 | + params.maxWeakCount = maxWeakCount; | ||
| 309 | + params.stageType = stageType; | ||
| 310 | + params.featureType = featureType; | ||
| 311 | + params.bt = bt; | ||
| 312 | + params.mode = mode; | ||
| 313 | + params.show = show; | ||
| 314 | + params.baseFormatSave = baseFormatSave; | ||
| 315 | + if (params.w < 0) params.w = minSize; | ||
| 316 | + if (params.h < 0) params.h = minSize; | ||
| 317 | + | ||
| 318 | + for (int i = 0; i < files.length(); i++) { | ||
| 319 | + File f = files[i]; | ||
| 320 | + if (f.contains("training-set")) { | ||
| 321 | + QString tset = f.get<QString>("training-set",QString()).toLower(); | ||
| 322 | + | ||
| 323 | + // Negative samples | ||
| 324 | + if (tset == "neg") { | ||
| 325 | + if (negCount > 0) negStream<<endln; | ||
| 326 | + negStream << f.path() << QDir::separator() << f.fileName(); | ||
| 327 | + negCount++; | ||
| 328 | + | ||
| 329 | + // Positive samples for crop/rescale | ||
| 330 | + }else if (tset == "pos") { | ||
| 331 | + | ||
| 332 | + if (posCount > 0) posStream<<endln; | ||
| 333 | + QString rects = ""; | ||
| 334 | + | ||
| 335 | + // Extract rectangles | ||
| 336 | + for (int j = 0; j < f.rects().length(); j++) { | ||
| 337 | + QRectF r = f.rects()[j]; | ||
| 338 | + rects += " " + QString::number(r.x()) + " " + QString::number(r.y()) + " " + QString::number(r.width()) + " "+ QString::number(r.height()); | ||
| 339 | + posCount++; | ||
| 340 | + } | ||
| 341 | + if (f.rects().length() > 0) | ||
| 342 | + posStream << f.path() << QDir::separator() << f.fileName() << " " << f.rects().length() << " " << rects; | ||
| 343 | + | ||
| 344 | + // Single positive sample for background removal and overlay on negatives | ||
| 345 | + }else if (tset == "pos-base") { | ||
| 346 | + | ||
| 347 | + buildPos = true; | ||
| 348 | + params.img = f.path() + QDir::separator() + f.fileName(); | ||
| 349 | + | ||
| 350 | + // Parse settings (unique to this one tag) | ||
| 351 | + if (f.contains("num")) params.num = f.get<int>("num",0); | ||
| 352 | + if (f.contains("bgcolor")) params.bgcolor = f.get<int>("bgcolor",0); | ||
| 353 | + if (f.contains("bgthresh")) params.bgthresh =f.get<int>("bgthresh",0); | ||
| 354 | + if (f.contains("inv")) params.inv = f.get<bool>("inv",false); | ||
| 355 | + if (f.contains("randinv")) params.randinv = f.get<bool>("randinv",false); | ||
| 356 | + if (f.contains("maxidev")) params.maxidev = f.get<int>("maxidev",0); | ||
| 357 | + if (f.contains("maxxangle")) params.maxxangle = f.get<double>("maxxangle",0); | ||
| 358 | + if (f.contains("maxyangle")) params.maxyangle = f.get<double>("maxyangle",0); | ||
| 359 | + if (f.contains("maxzangle")) params.maxzangle = f.get<double>("maxzangle",0); | ||
| 360 | + } | ||
| 361 | + } | ||
| 362 | + } | ||
| 363 | + | ||
| 364 | + // Fill in remaining params conditionally | ||
| 365 | + posFile.close(); | ||
| 366 | + negFile.close(); | ||
| 367 | + if (buildPos) { | ||
| 368 | + if (params.numPos < 0) { | ||
| 369 | + if (params.num > 0) params.numPos = (int)(params.num*.95); | ||
| 370 | + else params.numPos = 950; | ||
| 371 | + posFile.remove(); | ||
| 372 | + } | ||
| 373 | + }else{ | ||
| 374 | + params.info = posFName; | ||
| 375 | + if (params.numPos < 0) { | ||
| 376 | + params.numPos = (int)(posCount*.95); | ||
| 377 | + } | ||
| 378 | + } | ||
| 379 | + params.bg = negFName; | ||
| 380 | + params.data = model; | ||
| 381 | + if (params.num < 0) { | ||
| 382 | + params.num = posCount; | ||
| 383 | + } | ||
| 384 | + if (params.numNeg < 0) { | ||
| 385 | + params.numNeg = negCount*10; | ||
| 386 | + } | ||
| 387 | + | ||
| 388 | + genSamples(params); | ||
| 389 | + trainCascade(params); | ||
| 390 | + if (posFile.exists()) posFile.remove(); | ||
| 391 | + negFile.remove(); | ||
| 392 | + } | ||
| 74 | 393 | ||
| 75 | void project(const Template &src, Template &dst) const | 394 | void project(const Template &src, Template &dst) const |
| 76 | { | 395 | { |
openbr/plugins/pp5.cpp
| @@ -322,6 +322,11 @@ class PP5CompareDistance : public Distance | @@ -322,6 +322,11 @@ class PP5CompareDistance : public Distance | ||
| 322 | ppr_free_gallery(gallery.gallery); | 322 | ppr_free_gallery(gallery.gallery); |
| 323 | } | 323 | } |
| 324 | 324 | ||
| 325 | + float compare(const cv::Mat &target, const cv::Mat &query) const | ||
| 326 | + { | ||
| 327 | + return compare(Template(target), Template(query)); | ||
| 328 | + } | ||
| 329 | + | ||
| 325 | float compare(const Template &target, const Template &query) const | 330 | float compare(const Template &target, const Template &query) const |
| 326 | { | 331 | { |
| 327 | TemplateList targetList; | 332 | TemplateList targetList; |
scripts/downloadDatasets.sh
| @@ -117,20 +117,7 @@ if [ ! -d ../data/LFW/img ]; then | @@ -117,20 +117,7 @@ if [ ! -d ../data/LFW/img ]; then | ||
| 117 | rm lfw.tgz | 117 | rm lfw.tgz |
| 118 | fi | 118 | fi |
| 119 | 119 | ||
| 120 | -# MEDS | ||
| 121 | -if [ ! -d ../data/MEDS/img ]; then | ||
| 122 | - echo "Downloading MEDS..." | ||
| 123 | - if hash curl 2>/dev/null; then | ||
| 124 | - curl -OL http://nigos.nist.gov:8080/nist/sd/32/NIST_SD32_MEDS-II_face.zip | ||
| 125 | - else | ||
| 126 | - wget http://nigos.nist.gov:8080/nist/sd/32/NIST_SD32_MEDS-II_face.zip | ||
| 127 | - fi | ||
| 128 | - | ||
| 129 | - unzip NIST_SD32_MEDS-II_face.zip | ||
| 130 | - mkdir ../data/MEDS/img | ||
| 131 | - mv data/*/*.jpg ../data/MEDS/img | ||
| 132 | - rm -r data NIST_SD32_MEDS-II_face.zip | ||
| 133 | -fi | 120 | +./downloadMeds.sh |
| 134 | 121 | ||
| 135 | #LFPW | 122 | #LFPW |
| 136 | if [ ! -d ../data/lfpw/trainset ]; then | 123 | if [ ! -d ../data/lfpw/trainset ]; then |
scripts/downloadMEDS.sh
0 → 100644
| 1 | +#!/bin/bash | ||
| 2 | + | ||
| 3 | + | ||
| 4 | +# MEDS | ||
| 5 | +if [ ! -d ../data/MEDS/img ]; then | ||
| 6 | + echo "Downloading MEDS..." | ||
| 7 | + if hash curl 2>/dev/null; then | ||
| 8 | + curl -OL http://nigos.nist.gov:8080/nist/sd/32/NIST_SD32_MEDS-II_face.zip | ||
| 9 | + else | ||
| 10 | + wget http://nigos.nist.gov:8080/nist/sd/32/NIST_SD32_MEDS-II_face.zip | ||
| 11 | + fi | ||
| 12 | + | ||
| 13 | + unzip NIST_SD32_MEDS-II_face.zip | ||
| 14 | + mkdir ../data/MEDS/img | ||
| 15 | + mv data/*/*.jpg ../data/MEDS/img | ||
| 16 | + rm -r data NIST_SD32_MEDS-II_face.zip | ||
| 17 | +fi |
scripts/evalFaceRecognition-MEDS.sh
| @@ -13,7 +13,7 @@ if ! hash br 2>/dev/null; then | @@ -13,7 +13,7 @@ if ! hash br 2>/dev/null; then | ||
| 13 | fi | 13 | fi |
| 14 | 14 | ||
| 15 | # Get the data | 15 | # Get the data |
| 16 | -./downloadDatasets.sh | 16 | +./downloadMEDS.sh |
| 17 | 17 | ||
| 18 | if [ ! -e Algorithm_Dataset ]; then | 18 | if [ ! -e Algorithm_Dataset ]; then |
| 19 | mkdir Algorithm_Dataset | 19 | mkdir Algorithm_Dataset |
share/openbr/openbr.bib
| @@ -38,6 +38,11 @@ | @@ -38,6 +38,11 @@ | ||
| 38 | Author = {Austin Van Blanton}, | 38 | Author = {Austin Van Blanton}, |
| 39 | Howpublished = {https://github.com/imaus10}, | 39 | Howpublished = {https://github.com/imaus10}, |
| 40 | Title = {imaus10 at gmail.com}} | 40 | Title = {imaus10 at gmail.com}} |
| 41 | + | ||
| 42 | + @misc{dgcrouse, | ||
| 43 | + Author = {David G. Crouse}, | ||
| 44 | + Howpublished = {https://github.com/dgcrouse}, | ||
| 45 | + Title = {dgcrouse at gmail.com}} | ||
| 41 | 46 | ||
| 42 | % Software | 47 | % Software |
| 43 | @misc{libface, | 48 | @misc{libface, |